Transformers
PyTorch
English
pixel
pretraining
Inference Endpoints
plip commited on
Commit
5602ad9
1 Parent(s): 8675274

Training in progress, step 340000

Browse files
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e7d2a5e73283aa1880b29f29feb6316701d271842328e195271c3e399e6c920a
3
  size 893439185
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f848b004ca69d971cd5024827329eb728808850f3ba285aae6ae2d66c5e9a1ea
3
  size 893439185
last-checkpoint/pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4fb067e8d99d964806b68ae99e0f39bdecb3dd4f00cbe7958a115e1392dffcc7
3
  size 449471589
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5bfba4eea74dece360d73bbeb68171b0f24c78184fc1168b69bc18ed84fe5243
3
  size 449471589
last-checkpoint/rng_state_0.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:623a6385c6947219614a206f325f0d5bbe602621d1fd3e48972b7fdd72be25d2
3
  size 14503
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:20c5b304cccca8b5844ddfec128e44995bacab68346ff44d01e8476a83259d32
3
  size 14503
last-checkpoint/rng_state_1.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:02ac5973a9776fb5558d0d5471ce91f9f5f08200895aa832ab0411732da0bb62
3
  size 14503
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3a6026e8cbd4826fee12ad344c0bb2e47d863082fccddfed4801c66cbc3305df
3
  size 14503
last-checkpoint/rng_state_2.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:bbe8a6d91f7528a2132dc105f5a011209849ce078b5ae84cd752340614efc89b
3
- size 14439
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:276a39a4e5fc9bbf2fc7156d49a68ce7b2b8c02aa8d52e98747eb94a987f3191
3
+ size 14503
last-checkpoint/rng_state_3.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:57da30fd98664b01593e067ac432f0638ebe9389fdcddf47146e4e5d78f9b45b
3
- size 14439
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e64783857a8ded45f594a9d4d98ef3bd8c1d156f9923bb0bef61858daa470a8e
3
+ size 14503
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:41ab9ece5cf2fe3d99e3bf57fddd4aebe29db0bd41b88067fc2fa8ae9ef5bedb
3
  size 623
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e61c24f771644e6cd7fccf329b7b1a8621bd89eecc91f4043864ce60f81c96b6
3
  size 623
last-checkpoint/trainer_state.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 5.039168079160749,
5
- "global_step": 330000,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
@@ -2448,11 +2448,85 @@
2448
  "eval_samples_per_second": 883.862,
2449
  "eval_steps_per_second": 14.142,
2450
  "step": 330000
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
2451
  }
2452
  ],
2453
  "max_steps": 1000000,
2454
  "num_train_epochs": 16,
2455
- "total_flos": 2.313305328660712e+22,
2456
  "trial_name": null,
2457
  "trial_params": null
2458
  }
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 5.19187014216562,
5
+ "global_step": 340000,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
 
2448
  "eval_samples_per_second": 883.862,
2449
  "eval_steps_per_second": 14.142,
2450
  "step": 330000
2451
+ },
2452
+ {
2453
+ "epoch": 5.05,
2454
+ "learning_rate": 0.00012189044992813972,
2455
+ "loss": 0.2858,
2456
+ "step": 331000
2457
+ },
2458
+ {
2459
+ "epoch": 5.07,
2460
+ "learning_rate": 0.0001217047614392187,
2461
+ "loss": 0.2857,
2462
+ "step": 332000
2463
+ },
2464
+ {
2465
+ "epoch": 5.08,
2466
+ "learning_rate": 0.00012151861687370828,
2467
+ "loss": 0.2857,
2468
+ "step": 333000
2469
+ },
2470
+ {
2471
+ "epoch": 5.1,
2472
+ "learning_rate": 0.00012133201826725558,
2473
+ "loss": 0.2852,
2474
+ "step": 334000
2475
+ },
2476
+ {
2477
+ "epoch": 5.12,
2478
+ "learning_rate": 0.0001211449676604731,
2479
+ "loss": 0.2853,
2480
+ "step": 335000
2481
+ },
2482
+ {
2483
+ "epoch": 5.12,
2484
+ "eval_runtime": 1.3419,
2485
+ "eval_samples_per_second": 745.216,
2486
+ "eval_steps_per_second": 11.923,
2487
+ "step": 335000
2488
+ },
2489
+ {
2490
+ "epoch": 5.13,
2491
+ "learning_rate": 0.00012095746709891632,
2492
+ "loss": 0.2852,
2493
+ "step": 336000
2494
+ },
2495
+ {
2496
+ "epoch": 5.15,
2497
+ "learning_rate": 0.00012076951863306127,
2498
+ "loss": 0.285,
2499
+ "step": 337000
2500
+ },
2501
+ {
2502
+ "epoch": 5.16,
2503
+ "learning_rate": 0.0001205811243182823,
2504
+ "loss": 0.2848,
2505
+ "step": 338000
2506
+ },
2507
+ {
2508
+ "epoch": 5.18,
2509
+ "learning_rate": 0.00012039228621482949,
2510
+ "loss": 0.2858,
2511
+ "step": 339000
2512
+ },
2513
+ {
2514
+ "epoch": 5.19,
2515
+ "learning_rate": 0.00012020300638780604,
2516
+ "loss": 0.2845,
2517
+ "step": 340000
2518
+ },
2519
+ {
2520
+ "epoch": 5.19,
2521
+ "eval_runtime": 1.2559,
2522
+ "eval_samples_per_second": 796.26,
2523
+ "eval_steps_per_second": 12.74,
2524
+ "step": 340000
2525
  }
2526
  ],
2527
  "max_steps": 1000000,
2528
  "num_train_epochs": 16,
2529
+ "total_flos": 2.383405589691059e+22,
2530
  "trial_name": null,
2531
  "trial_params": null
2532
  }
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4fb067e8d99d964806b68ae99e0f39bdecb3dd4f00cbe7958a115e1392dffcc7
3
  size 449471589
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5bfba4eea74dece360d73bbeb68171b0f24c78184fc1168b69bc18ed84fe5243
3
  size 449471589