Transformers
PyTorch
English
pixel
pretraining
Inference Endpoints
plip commited on
Commit
1577352
1 Parent(s): b7e4f51

Training in progress, step 450000

Browse files
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f92e6cd0767ca59f1527b5967666a322afaf575c9af8775949662404da371092
3
  size 893439185
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:30290edc8628fd3c3ef18b3c5aeed7f069b37f58cee15ba21ffc0026c01c3730
3
  size 893439185
last-checkpoint/pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:605e171de557600b4f9eab4567771d6f7b62053eb613a7b7ed22d56f357a201b
3
  size 449471589
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cd9bd4abec55ec3aff5c6a63e004f193b84327f4dea19bd4c7a418c248e58ed7
3
  size 449471589
last-checkpoint/rng_state_0.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c4e4d0603158355ab30ed464162b9809f49d4b9fe387e337de95c9b6476ba9b3
3
  size 14503
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:33d4cd7454368d736d737996ed03879986986a143829539c951d1987c1b5985b
3
  size 14503
last-checkpoint/rng_state_1.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:926ff1f312d9731049e2cfd0827e2934c1dc272e72548666a5980946912e0647
3
- size 14439
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7336b286bfd4476ee4aa817ed5f237f90f8c52aba8afeb7d24431d41ce3a20dc
3
+ size 14503
last-checkpoint/rng_state_2.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a69b501354d86430b18ce3c64120582562e9c52da9971d6a0efada8760b427f4
3
- size 14439
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1d3e44169554700b12ce1323e27998dd02eb610802144e6e40dc2e6668fa701b
3
+ size 14503
last-checkpoint/rng_state_3.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:89dedfbbaf4906adbb87599ce42dab2b3412c2f3eed1c918df1f52570f878203
3
  size 14503
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b37e67e1cf58930910192e85abdd9cbaabe8e6e23dc6148e7d6f7fcf570a387a
3
  size 14503
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:0aa5fdd1e270251efa6239627ae6af3a9eb85be35af9f4cca7399ee33001083c
3
  size 623
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6ca5b8ec583e6ebb62b2f3066d6bca2c46b8614e9cfbd4e5e7bfdb3a9d7a2d86
3
  size 623
last-checkpoint/trainer_state.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 6.7188907722143325,
5
- "global_step": 440000,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
@@ -3262,11 +3262,85 @@
3262
  "eval_samples_per_second": 976.131,
3263
  "eval_steps_per_second": 15.618,
3264
  "step": 440000
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
3265
  }
3266
  ],
3267
  "max_steps": 1000000,
3268
  "num_train_epochs": 16,
3269
- "total_flos": 3.084407542926382e+22,
3270
  "trial_name": null,
3271
  "trial_params": null
3272
  }
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 6.871592835219204,
5
+ "global_step": 450000,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
 
3262
  "eval_samples_per_second": 976.131,
3263
  "eval_steps_per_second": 15.618,
3264
  "step": 440000
3265
+ },
3266
+ {
3267
+ "epoch": 6.73,
3268
+ "learning_rate": 9.919569703270376e-05,
3269
+ "loss": 0.2716,
3270
+ "step": 441000
3271
+ },
3272
+ {
3273
+ "epoch": 6.75,
3274
+ "learning_rate": 9.89729805310111e-05,
3275
+ "loss": 0.2711,
3276
+ "step": 442000
3277
+ },
3278
+ {
3279
+ "epoch": 6.76,
3280
+ "learning_rate": 9.875005654384307e-05,
3281
+ "loss": 0.2712,
3282
+ "step": 443000
3283
+ },
3284
+ {
3285
+ "epoch": 6.78,
3286
+ "learning_rate": 9.852692750906071e-05,
3287
+ "loss": 0.2717,
3288
+ "step": 444000
3289
+ },
3290
+ {
3291
+ "epoch": 6.8,
3292
+ "learning_rate": 9.830359586676737e-05,
3293
+ "loss": 0.2722,
3294
+ "step": 445000
3295
+ },
3296
+ {
3297
+ "epoch": 6.8,
3298
+ "eval_runtime": 1.1145,
3299
+ "eval_samples_per_second": 897.295,
3300
+ "eval_steps_per_second": 14.357,
3301
+ "step": 445000
3302
+ },
3303
+ {
3304
+ "epoch": 6.81,
3305
+ "learning_rate": 9.808006405928215e-05,
3306
+ "loss": 0.2703,
3307
+ "step": 446000
3308
+ },
3309
+ {
3310
+ "epoch": 6.83,
3311
+ "learning_rate": 9.785633453111306e-05,
3312
+ "loss": 0.2705,
3313
+ "step": 447000
3314
+ },
3315
+ {
3316
+ "epoch": 6.84,
3317
+ "learning_rate": 9.763240972893037e-05,
3318
+ "loss": 0.27,
3319
+ "step": 448000
3320
+ },
3321
+ {
3322
+ "epoch": 6.86,
3323
+ "learning_rate": 9.740829210153984e-05,
3324
+ "loss": 0.2703,
3325
+ "step": 449000
3326
+ },
3327
+ {
3328
+ "epoch": 6.87,
3329
+ "learning_rate": 9.718398409985593e-05,
3330
+ "loss": 0.27,
3331
+ "step": 450000
3332
+ },
3333
+ {
3334
+ "epoch": 6.87,
3335
+ "eval_runtime": 0.9938,
3336
+ "eval_samples_per_second": 1006.215,
3337
+ "eval_steps_per_second": 16.099,
3338
+ "step": 450000
3339
  }
3340
  ],
3341
  "max_steps": 1000000,
3342
  "num_train_epochs": 16,
3343
+ "total_flos": 3.154507803956729e+22,
3344
  "trial_name": null,
3345
  "trial_params": null
3346
  }
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:605e171de557600b4f9eab4567771d6f7b62053eb613a7b7ed22d56f357a201b
3
  size 449471589
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cd9bd4abec55ec3aff5c6a63e004f193b84327f4dea19bd4c7a418c248e58ed7
3
  size 449471589