Transformers
PyTorch
English
pixel
pretraining
Inference Endpoints
plip committed on
Commit
0342214
1 Parent(s): 9b34815

Training in progress, step 320000

Browse files
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:0b00071efc84beb2feace3b5a3f0a50851e6aef7cfc9f54978cffaf5df2df0e7
3
  size 893439185
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e953bb14c52ac73828ddbb8d0fdec2f5d345e3cbc51fce0abb2a9e0782d8fb45
3
  size 893439185
last-checkpoint/pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e7e2ee92a6eaf05a81d8cc01dee92eda2af9b205d2ac738942206a8dc6fa3a0e
3
  size 449471589
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ebbb0a403c4c85850b5f1bad1d089cdec8ce35c071f9b4d707f0145c3de24b2e
3
  size 449471589
last-checkpoint/rng_state_0.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:aa0bf92a765d09c7474a24e0b91454931a94402222241ea8b1d6ef7d1cfb2a2f
3
  size 14503
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:15759c491e0cbc3c20a789defaa3eb9b1ba5f51f160318f99e2a7896f2394a59
3
  size 14503
last-checkpoint/rng_state_1.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b7f1efcee6a815bf5e7abad62d9857979801ac6926e6361e60063a1830c0e0cf
3
- size 14567
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7549533ede2b1dd6fe53e5571a6126478875eb81cddb6c662ba0261be0e9f079
3
+ size 14503
last-checkpoint/rng_state_2.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e56ee00cae3dff0125b532f391da7e095ad5ffe308a7da8b824c5f69e3852d28
3
  size 14503
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:17b33604be61df5ac96216c3e2908cb72d7bc7445f1fbb6123710e746f63011f
3
  size 14503
last-checkpoint/rng_state_3.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:063d140296abe43f5c05bc7e1492ad16b8cd4d6e4e44bfa11ee5374ad0035817
3
  size 14503
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3ecf67d692ebf3eeab712f96e8bcf2b206bea3bf44b342d23dd61fb929784bb0
3
  size 14503
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:510bbb6396dcecf907e43c584a6f575f85c197777553938b74c3d9882298be6b
3
  size 623
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6e51637100435f199d054651c862159e9a427229daea6570b6d23739f5a17de3
3
  size 623
last-checkpoint/trainer_state.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 4.733763953151007,
5
- "global_step": 310000,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
@@ -2300,11 +2300,85 @@
2300
  "eval_samples_per_second": 954.11,
2301
  "eval_steps_per_second": 15.266,
2302
  "step": 310000
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
2303
  }
2304
  ],
2305
  "max_steps": 1000000,
2306
  "num_train_epochs": 16,
2307
- "total_flos": 2.1731054636681665e+22,
2308
  "trial_name": null,
2309
  "trial_params": null
2310
  }
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 4.886466016155878,
5
+ "global_step": 320000,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
 
2300
  "eval_samples_per_second": 954.11,
2301
  "eval_steps_per_second": 15.266,
2302
  "step": 310000
2303
+ },
2304
+ {
2305
+ "epoch": 4.75,
2306
+ "learning_rate": 0.0001255053536328589,
2307
+ "loss": 0.2887,
2308
+ "step": 311000
2309
+ },
2310
+ {
2311
+ "epoch": 4.76,
2312
+ "learning_rate": 0.0001253292063197693,
2313
+ "loss": 0.2887,
2314
+ "step": 312000
2315
+ },
2316
+ {
2317
+ "epoch": 4.78,
2318
+ "learning_rate": 0.0001251525632937418,
2319
+ "loss": 0.2886,
2320
+ "step": 313000
2321
+ },
2322
+ {
2323
+ "epoch": 4.79,
2324
+ "learning_rate": 0.00012497542648651615,
2325
+ "loss": 0.2887,
2326
+ "step": 314000
2327
+ },
2328
+ {
2329
+ "epoch": 4.81,
2330
+ "learning_rate": 0.00012479779783523216,
2331
+ "loss": 0.2883,
2332
+ "step": 315000
2333
+ },
2334
+ {
2335
+ "epoch": 4.81,
2336
+ "eval_runtime": 1.0333,
2337
+ "eval_samples_per_second": 967.804,
2338
+ "eval_steps_per_second": 15.485,
2339
+ "step": 315000
2340
+ },
2341
+ {
2342
+ "epoch": 4.83,
2343
+ "learning_rate": 0.00012461967928240828,
2344
+ "loss": 0.2883,
2345
+ "step": 316000
2346
+ },
2347
+ {
2348
+ "epoch": 4.84,
2349
+ "learning_rate": 0.00012444107277592047,
2350
+ "loss": 0.2877,
2351
+ "step": 317000
2352
+ },
2353
+ {
2354
+ "epoch": 4.86,
2355
+ "learning_rate": 0.0001242619802689809,
2356
+ "loss": 0.2879,
2357
+ "step": 318000
2358
+ },
2359
+ {
2360
+ "epoch": 4.87,
2361
+ "learning_rate": 0.00012408240372011647,
2362
+ "loss": 0.2876,
2363
+ "step": 319000
2364
+ },
2365
+ {
2366
+ "epoch": 4.89,
2367
+ "learning_rate": 0.0001239023450931476,
2368
+ "loss": 0.2874,
2369
+ "step": 320000
2370
+ },
2371
+ {
2372
+ "epoch": 4.89,
2373
+ "eval_runtime": 1.04,
2374
+ "eval_samples_per_second": 961.537,
2375
+ "eval_steps_per_second": 15.385,
2376
+ "step": 320000
2377
  }
2378
  ],
2379
  "max_steps": 1000000,
2380
  "num_train_epochs": 16,
2381
+ "total_flos": 2.2432057246985136e+22,
2382
  "trial_name": null,
2383
  "trial_params": null
2384
  }
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e7e2ee92a6eaf05a81d8cc01dee92eda2af9b205d2ac738942206a8dc6fa3a0e
3
  size 449471589
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ebbb0a403c4c85850b5f1bad1d089cdec8ce35c071f9b4d707f0145c3de24b2e
3
  size 449471589