Transformers
PyTorch
English
pixel
pretraining
Inference Endpoints
plip commited on
Commit
7d9d27c
1 Parent(s): d64ffb3

Training in progress, step 470000

Browse files
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e074c33dcba955530635f7c301cc0616d35e94c4d9e25f501a0d9edd512370f3
3
  size 893439185
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:48d4808dde71eac80e04b5355e71b14ceb9b5e0ae529d95a233b51272607ab83
3
  size 893439185
last-checkpoint/pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8e2e3c76b0bd22486ffeb7f1582064821337785eddce5493639f753ea7af7c21
3
  size 449471589
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7103687c38405c622f568188c0f14e1563ef023c455f4c1710827b01ab80bb17
3
  size 449471589
last-checkpoint/rng_state_0.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f07bf259da4db58c67f5752e41be50bd05dbfaf1912a8b5878788f3ede910eb7
3
  size 14503
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a4e056df33e676753147b05c71aab5efb8704dfd8ee13e008fdf53d8cdac44b2
3
  size 14503
last-checkpoint/rng_state_1.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1e069aee1aca48a60052a1c66c7d1551fec7d9dcab99912ac030e1863b14f6a1
3
  size 14503
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7049055dea9713813a526e48cc1a4819519bd8bf226d421b09446678fec8fd94
3
  size 14503
last-checkpoint/rng_state_2.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:642ba2efc3dad359eda3b33bb6c5d67fffdc0e921c5ed6b47ef80068231cbd4a
3
- size 14439
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ae399cb1dd5e413a3579163a8c5c2dc1f7fefe685aeb37d572263aef6a0f1ce1
3
+ size 14503
last-checkpoint/rng_state_3.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:5475a56a8e58f3a6d30456ecb3d60c907f9c5dd05e43f39a9dbfefa6d303c24c
3
- size 14503
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0032134f185d3f5485217ef8125c850bc4af9658f5890ff772fcbabf723e2b09
3
+ size 14567
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d470fe106a7d346e8d83a1e5754bc519572ca0d497bb4adce56ffd8f58de945f
3
  size 623
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0f611622a5002fa681af11a66fadbdf979555ccde290d546f60b9105024e7e63
3
  size 623
last-checkpoint/trainer_state.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 7.024294898224075,
5
- "global_step": 460000,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
@@ -3410,11 +3410,85 @@
3410
  "eval_samples_per_second": 978.034,
3411
  "eval_steps_per_second": 15.649,
3412
  "step": 460000
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
3413
  }
3414
  ],
3415
  "max_steps": 1000000,
3416
  "num_train_epochs": 16,
3417
- "total_flos": 3.2246074079189274e+22,
3418
  "trial_name": null,
3419
  "trial_params": null
3420
  }
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 7.176996961228946,
5
+ "global_step": 470000,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
 
3410
  "eval_samples_per_second": 978.034,
3411
  "eval_steps_per_second": 15.649,
3412
  "step": 460000
3413
+ },
3414
+ {
3415
+ "epoch": 7.04,
3416
+ "learning_rate": 9.47047343697216e-05,
3417
+ "loss": 0.269,
3418
+ "step": 461000
3419
+ },
3420
+ {
3421
+ "epoch": 7.05,
3422
+ "learning_rate": 9.447833377876176e-05,
3423
+ "loss": 0.269,
3424
+ "step": 462000
3425
+ },
3426
+ {
3427
+ "epoch": 7.07,
3428
+ "learning_rate": 9.425177485506336e-05,
3429
+ "loss": 0.2688,
3430
+ "step": 463000
3431
+ },
3432
+ {
3433
+ "epoch": 7.09,
3434
+ "learning_rate": 9.402506007623848e-05,
3435
+ "loss": 0.269,
3436
+ "step": 464000
3437
+ },
3438
+ {
3439
+ "epoch": 7.1,
3440
+ "learning_rate": 9.379819192160362e-05,
3441
+ "loss": 0.2692,
3442
+ "step": 465000
3443
+ },
3444
+ {
3445
+ "epoch": 7.1,
3446
+ "eval_runtime": 1.1401,
3447
+ "eval_samples_per_second": 877.142,
3448
+ "eval_steps_per_second": 14.034,
3449
+ "step": 465000
3450
+ },
3451
+ {
3452
+ "epoch": 7.12,
3453
+ "learning_rate": 9.357117287215258e-05,
3454
+ "loss": 0.2682,
3455
+ "step": 466000
3456
+ },
3457
+ {
3458
+ "epoch": 7.13,
3459
+ "learning_rate": 9.334400541052928e-05,
3460
+ "loss": 0.2683,
3461
+ "step": 467000
3462
+ },
3463
+ {
3464
+ "epoch": 7.15,
3465
+ "learning_rate": 9.311669202100073e-05,
3466
+ "loss": 0.2693,
3467
+ "step": 468000
3468
+ },
3469
+ {
3470
+ "epoch": 7.16,
3471
+ "learning_rate": 9.288923518942968e-05,
3472
+ "loss": 0.2683,
3473
+ "step": 469000
3474
+ },
3475
+ {
3476
+ "epoch": 7.18,
3477
+ "learning_rate": 9.26616374032477e-05,
3478
+ "loss": 0.2677,
3479
+ "step": 470000
3480
+ },
3481
+ {
3482
+ "epoch": 7.18,
3483
+ "eval_runtime": 0.8954,
3484
+ "eval_samples_per_second": 1116.774,
3485
+ "eval_steps_per_second": 17.868,
3486
+ "step": 470000
3487
  }
3488
  ],
3489
  "max_steps": 1000000,
3490
  "num_train_epochs": 16,
3491
+ "total_flos": 3.2947076689492745e+22,
3492
  "trial_name": null,
3493
  "trial_params": null
3494
  }
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8e2e3c76b0bd22486ffeb7f1582064821337785eddce5493639f753ea7af7c21
3
  size 449471589
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7103687c38405c622f568188c0f14e1563ef023c455f4c1710827b01ab80bb17
3
  size 449471589