Transformers
PyTorch
English
pixel
pretraining
Inference Endpoints
plip commited on
Commit
b7e4f51
1 Parent(s): dfdd66e

Training in progress, step 440000

Browse files
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:0c4a14a4b300dc1a5da67108d934f51ece4d032d74a5b22ddb6baf522fdb8c1c
3
  size 893439185
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f92e6cd0767ca59f1527b5967666a322afaf575c9af8775949662404da371092
3
  size 893439185
last-checkpoint/pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:29a338d7e31f1ebb55d71826f0de824d2a1d8633cac67c074239e146a6c6bf2d
3
  size 449471589
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:605e171de557600b4f9eab4567771d6f7b62053eb613a7b7ed22d56f357a201b
3
  size 449471589
last-checkpoint/rng_state_0.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:10c521743622eed6f2a8ce22651670cd6f7fb24994288ac8323ec1f5d533e8a1
3
- size 14439
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c4e4d0603158355ab30ed464162b9809f49d4b9fe387e337de95c9b6476ba9b3
3
+ size 14503
last-checkpoint/rng_state_1.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6dc65d4d1b61d6b6ec0b07de631a3fc7ef2baef1eecd8b2dd63afdc6d03ed25d
3
- size 14503
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:926ff1f312d9731049e2cfd0827e2934c1dc272e72548666a5980946912e0647
3
+ size 14439
last-checkpoint/rng_state_2.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2003a4ffe1876cade3b569b7c4b3d4c928a46e1a7a6a797e8245fc18980679e5
3
- size 14503
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a69b501354d86430b18ce3c64120582562e9c52da9971d6a0efada8760b427f4
3
+ size 14439
last-checkpoint/rng_state_3.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8d19681008a4b6b5d37d79f13ad91bb5cfd25c6887d3949264aeea07e7705212
3
- size 14567
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:89dedfbbaf4906adbb87599ce42dab2b3412c2f3eed1c918df1f52570f878203
3
+ size 14503
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1c41e7c1f83dca8045fba481a590c3c5a6ca39c080efa3c795ba2e0db9ab191b
3
  size 623
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0aa5fdd1e270251efa6239627ae6af3a9eb85be35af9f4cca7399ee33001083c
3
  size 623
last-checkpoint/trainer_state.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 6.566188709209461,
5
- "global_step": 430000,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
@@ -3188,11 +3188,85 @@
3188
  "eval_samples_per_second": 910.508,
3189
  "eval_steps_per_second": 14.568,
3190
  "step": 430000
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
3191
  }
3192
  ],
3193
  "max_steps": 1000000,
3194
  "num_train_epochs": 16,
3195
- "total_flos": 3.0143072818960347e+22,
3196
  "trial_name": null,
3197
  "trial_params": null
3198
  }
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 6.7188907722143325,
5
+ "global_step": 440000,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
 
3188
  "eval_samples_per_second": 910.508,
3189
  "eval_steps_per_second": 14.568,
3190
  "step": 430000
3191
+ },
3192
+ {
3193
+ "epoch": 6.58,
3194
+ "learning_rate": 0.00010141091567565561,
3195
+ "loss": 0.2727,
3196
+ "step": 431000
3197
+ },
3198
+ {
3199
+ "epoch": 6.6,
3200
+ "learning_rate": 0.00010119040759872142,
3201
+ "loss": 0.2725,
3202
+ "step": 432000
3203
+ },
3204
+ {
3205
+ "epoch": 6.61,
3206
+ "learning_rate": 0.00010096966778688472,
3207
+ "loss": 0.2721,
3208
+ "step": 433000
3209
+ },
3210
+ {
3211
+ "epoch": 6.63,
3212
+ "learning_rate": 0.00010074869865412074,
3213
+ "loss": 0.272,
3214
+ "step": 434000
3215
+ },
3216
+ {
3217
+ "epoch": 6.64,
3218
+ "learning_rate": 0.00010052750261691254,
3219
+ "loss": 0.2721,
3220
+ "step": 435000
3221
+ },
3222
+ {
3223
+ "epoch": 6.64,
3224
+ "eval_runtime": 0.9895,
3225
+ "eval_samples_per_second": 1010.612,
3226
+ "eval_steps_per_second": 16.17,
3227
+ "step": 435000
3228
+ },
3229
+ {
3230
+ "epoch": 6.66,
3231
+ "learning_rate": 0.0001003060820942245,
3232
+ "loss": 0.2716,
3233
+ "step": 436000
3234
+ },
3235
+ {
3236
+ "epoch": 6.67,
3237
+ "learning_rate": 0.00010008443950747599,
3238
+ "loss": 0.2716,
3239
+ "step": 437000
3240
+ },
3241
+ {
3242
+ "epoch": 6.69,
3243
+ "learning_rate": 9.986257728051483e-05,
3244
+ "loss": 0.2717,
3245
+ "step": 438000
3246
+ },
3247
+ {
3248
+ "epoch": 6.7,
3249
+ "learning_rate": 9.964049783959082e-05,
3250
+ "loss": 0.2716,
3251
+ "step": 439000
3252
+ },
3253
+ {
3254
+ "epoch": 6.72,
3255
+ "learning_rate": 9.94182036133291e-05,
3256
+ "loss": 0.2715,
3257
+ "step": 440000
3258
+ },
3259
+ {
3260
+ "epoch": 6.72,
3261
+ "eval_runtime": 1.0245,
3262
+ "eval_samples_per_second": 976.131,
3263
+ "eval_steps_per_second": 15.618,
3264
+ "step": 440000
3265
  }
3266
  ],
3267
  "max_steps": 1000000,
3268
  "num_train_epochs": 16,
3269
+ "total_flos": 3.084407542926382e+22,
3270
  "trial_name": null,
3271
  "trial_params": null
3272
  }
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:29a338d7e31f1ebb55d71826f0de824d2a1d8633cac67c074239e146a6c6bf2d
3
  size 449471589
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:605e171de557600b4f9eab4567771d6f7b62053eb613a7b7ed22d56f357a201b
3
  size 449471589