Transformers
PyTorch
English
pixel
pretraining
Inference Endpoints
plip commited on
Commit
2bf164d
1 Parent(s): e76e0b0

Training in progress, step 170000

Browse files
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:51c4479b7100b24acffdfd7fb1cff497645cac828edc9bce49ad39669a19e6f1
3
  size 893439185
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6f9a70132918b6ab165a91d577d712613356dca52075d5c7c05f34314005b476
3
  size 893439185
last-checkpoint/pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f45b8970c2fcdae44788b5d4ade86d7949295115594ab3b0d456c282cadcd002
3
  size 449471589
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:04e4608999d97a58a30e39361b70b419f5aef3e2535ed3ca55c26e98dfa526a2
3
  size 449471589
last-checkpoint/rng_state_0.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:02a1d97b2752462543b92ffd0f23922ddd8ffff9e6ba2aaf2b57366a0cea0714
3
  size 14503
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ef92b44093f62f1441b173acbe3fd1139e94c5c223ed6a54381a9d3cb2f5c022
3
  size 14503
last-checkpoint/rng_state_1.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:29849d211b595c5ac9c137dcd37e20da1964e185621f9086f1491a26e0f460bc
3
  size 14503
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:161efcaf59347006251947d35ba8e577aead293e95ee199281ec31fb424a8671
3
  size 14503
last-checkpoint/rng_state_2.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e99c0c1e436962d7938fd416d17b1f2b444137c2e5f765032e46157e9b60a3ea
3
- size 14503
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a5b4db0eb85867b5e22ab5799a8329f0f5930ac32c5205c1b81fbef9bb0ad0ab
3
+ size 14439
last-checkpoint/rng_state_3.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:00c80b4bceef61474bcae1ecae0d1e95d0713b469a0fdc8873f2259acce5bd7e
3
  size 14503
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ed9a9a05da89d28b0f8404cc60f79e71945e2a52c47886846fb03eae29b9b7e7
3
  size 14503
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:09b0f5af299b689f18c326dad86c4c4c3f628480672d22f22ec90ae66ce6a4f1
3
  size 623
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7e6e6dbb6845e268a54a5a558c86918603b34b6bae9a32a1510a924b34f03635
3
  size 623
last-checkpoint/trainer_state.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 2.443233008077939,
5
- "global_step": 160000,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
@@ -1190,11 +1190,85 @@
1190
  "eval_samples_per_second": 980.452,
1191
  "eval_steps_per_second": 15.687,
1192
  "step": 160000
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1193
  }
1194
  ],
1195
  "max_steps": 1000000,
1196
  "num_train_epochs": 16,
1197
- "total_flos": 1.1216028623492568e+22,
1198
  "trial_name": null,
1199
  "trial_params": null
1200
  }
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 2.59593507108281,
5
+ "global_step": 170000,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
 
1190
  "eval_samples_per_second": 980.452,
1191
  "eval_steps_per_second": 15.687,
1192
  "step": 160000
1193
+ },
1194
+ {
1195
+ "epoch": 2.46,
1196
+ "learning_rate": 0.00014533679374921493,
1197
+ "loss": 0.3259,
1198
+ "step": 161000
1199
+ },
1200
+ {
1201
+ "epoch": 2.47,
1202
+ "learning_rate": 0.00014525336046375905,
1203
+ "loss": 0.3254,
1204
+ "step": 162000
1205
+ },
1206
+ {
1207
+ "epoch": 2.49,
1208
+ "learning_rate": 0.00014516921357800766,
1209
+ "loss": 0.3251,
1210
+ "step": 163000
1211
+ },
1212
+ {
1213
+ "epoch": 2.5,
1214
+ "learning_rate": 0.00014508435401217759,
1215
+ "loss": 0.3244,
1216
+ "step": 164000
1217
+ },
1218
+ {
1219
+ "epoch": 2.52,
1220
+ "learning_rate": 0.00014499878269427948,
1221
+ "loss": 0.3243,
1222
+ "step": 165000
1223
+ },
1224
+ {
1225
+ "epoch": 2.52,
1226
+ "eval_runtime": 1.0655,
1227
+ "eval_samples_per_second": 938.486,
1228
+ "eval_steps_per_second": 15.016,
1229
+ "step": 165000
1230
+ },
1231
+ {
1232
+ "epoch": 2.53,
1233
+ "learning_rate": 0.00014491250056010758,
1234
+ "loss": 0.3236,
1235
+ "step": 166000
1236
+ },
1237
+ {
1238
+ "epoch": 2.55,
1239
+ "learning_rate": 0.00014482550855322943,
1240
+ "loss": 0.3233,
1241
+ "step": 167000
1242
+ },
1243
+ {
1244
+ "epoch": 2.57,
1245
+ "learning_rate": 0.0001447378076249757,
1246
+ "loss": 0.3231,
1247
+ "step": 168000
1248
+ },
1249
+ {
1250
+ "epoch": 2.58,
1251
+ "learning_rate": 0.00014464939873442973,
1252
+ "loss": 0.3228,
1253
+ "step": 169000
1254
+ },
1255
+ {
1256
+ "epoch": 2.6,
1257
+ "learning_rate": 0.00014456028284841693,
1258
+ "loss": 0.3221,
1259
+ "step": 170000
1260
+ },
1261
+ {
1262
+ "epoch": 2.6,
1263
+ "eval_runtime": 1.1756,
1264
+ "eval_samples_per_second": 850.656,
1265
+ "eval_steps_per_second": 13.611,
1266
+ "step": 170000
1267
  }
1268
  ],
1269
  "max_steps": 1000000,
1270
  "num_train_epochs": 16,
1271
+ "total_flos": 1.191703123379604e+22,
1272
  "trial_name": null,
1273
  "trial_params": null
1274
  }
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f45b8970c2fcdae44788b5d4ade86d7949295115594ab3b0d456c282cadcd002
3
  size 449471589
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:04e4608999d97a58a30e39361b70b419f5aef3e2535ed3ca55c26e98dfa526a2
3
  size 449471589