Transformers
PyTorch
English
pixel
pretraining
Inference Endpoints
plip committed on
Commit
c75c2d3
1 Parent(s): 946570d

Training in progress, step 640000

Browse files
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8d82e2070f1b6c3e7ba3ac4e05d24d0c3c44e21fea62b60f30dbcd4b8aea7947
3
  size 893439185
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6c444c75d0337de46e35f539ad919e0e13abb76dfe8d15c375255f6a83fa8fd2
3
  size 893439185
last-checkpoint/pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2aa845416abb07e55de755c0df750468c782329996a5b84f0336b895c9a2baa1
3
  size 449471589
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f5808a95cf4864d9e7dd396fa3d5d75f6fe69b93fbc2376d586a3a7fc3b0fe04
3
  size 449471589
last-checkpoint/rng_state_0.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4acbb51e13aa598f4ce3e939d773ff547815a4a8c85e2bd41643e066b97a863b
3
  size 14503
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7aaf518826c7b02349e0c4043ecb7a38ebc1a14f60809955f00a7944ae21e6fc
3
  size 14503
last-checkpoint/rng_state_1.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:798c603bd32aeea05803afc8a5c1b8f53a6193b4dd4a2b5a26aa63e0065ce70e
3
  size 14503
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bcb6ee46cb325ce6d5d0f15d240a67578f4710009ebcab3be0d17117038d01fa
3
  size 14503
last-checkpoint/rng_state_2.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b0fb0d506dd83556c6bb13f32358c5188773f715722e0fae2529869d20b06680
3
  size 14503
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7121d5ba757842882faa79dcd7ac54d5b1c2ec66868fe528ff6cebaa506df816
3
  size 14503
last-checkpoint/rng_state_3.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:aa6390e57fdd76fefb80f0c1ccc262a99cb2e588a24afb098b63de6015cd6400
3
- size 14503
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6083d2cad6c63a2b0e7d04c706615465f15ee7e67189e761029a05d0b2f204c9
3
+ size 14439
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:445023bf71af0013aa9e5796238ea2c1da2dcfc1e0064784bf2e5fc75bdc80c6
3
  size 623
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4ba925316c6e59686c34db192a6703d2b94be7f6c9b908cf313be2f93b23828d
3
  size 623
last-checkpoint/trainer_state.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 9.620229969306886,
5
- "global_step": 630000,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
@@ -4668,11 +4668,85 @@
4668
  "eval_samples_per_second": 836.899,
4669
  "eval_steps_per_second": 13.39,
4670
  "step": 630000
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
4671
  }
4672
  ],
4673
  "max_steps": 1000000,
4674
  "num_train_epochs": 16,
4675
- "total_flos": 4.416310531298531e+22,
4676
  "trial_name": null,
4677
  "trial_params": null
4678
  }
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 9.772932032311756,
5
+ "global_step": 640000,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
 
4668
  "eval_samples_per_second": 836.899,
4669
  "eval_steps_per_second": 13.39,
4670
  "step": 630000
4671
+ },
4672
+ {
4673
+ "epoch": 9.64,
4674
+ "learning_rate": 5.596193787225254e-05,
4675
+ "loss": 0.2514,
4676
+ "step": 631000
4677
+ },
4678
+ {
4679
+ "epoch": 9.65,
4680
+ "learning_rate": 5.574466083181624e-05,
4681
+ "loss": 0.2512,
4682
+ "step": 632000
4683
+ },
4684
+ {
4685
+ "epoch": 9.67,
4686
+ "learning_rate": 5.552764904388305e-05,
4687
+ "loss": 0.2511,
4688
+ "step": 633000
4689
+ },
4690
+ {
4691
+ "epoch": 9.68,
4692
+ "learning_rate": 5.5310904881659116e-05,
4693
+ "loss": 0.2511,
4694
+ "step": 634000
4695
+ },
4696
+ {
4697
+ "epoch": 9.7,
4698
+ "learning_rate": 5.5094430715423835e-05,
4699
+ "loss": 0.2509,
4700
+ "step": 635000
4701
+ },
4702
+ {
4703
+ "epoch": 9.7,
4704
+ "eval_runtime": 1.0102,
4705
+ "eval_samples_per_second": 989.889,
4706
+ "eval_steps_per_second": 15.838,
4707
+ "step": 635000
4708
+ },
4709
+ {
4710
+ "epoch": 9.71,
4711
+ "learning_rate": 5.487822891250406e-05,
4712
+ "loss": 0.2511,
4713
+ "step": 636000
4714
+ },
4715
+ {
4716
+ "epoch": 9.73,
4717
+ "learning_rate": 5.4662301837247985e-05,
4718
+ "loss": 0.2508,
4719
+ "step": 637000
4720
+ },
4721
+ {
4722
+ "epoch": 9.74,
4723
+ "learning_rate": 5.4446651850999604e-05,
4724
+ "loss": 0.2506,
4725
+ "step": 638000
4726
+ },
4727
+ {
4728
+ "epoch": 9.76,
4729
+ "learning_rate": 5.4231281312072544e-05,
4730
+ "loss": 0.2505,
4731
+ "step": 639000
4732
+ },
4733
+ {
4734
+ "epoch": 9.77,
4735
+ "learning_rate": 5.401619257572453e-05,
4736
+ "loss": 0.2502,
4737
+ "step": 640000
4738
+ },
4739
+ {
4740
+ "epoch": 9.77,
4741
+ "eval_runtime": 1.0069,
4742
+ "eval_samples_per_second": 993.184,
4743
+ "eval_steps_per_second": 15.891,
4744
+ "step": 640000
4745
  }
4746
  ],
4747
  "max_steps": 1000000,
4748
  "num_train_epochs": 16,
4749
+ "total_flos": 4.4864107923288785e+22,
4750
  "trial_name": null,
4751
  "trial_params": null
4752
  }
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2aa845416abb07e55de755c0df750468c782329996a5b84f0336b895c9a2baa1
3
  size 449471589
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f5808a95cf4864d9e7dd396fa3d5d75f6fe69b93fbc2376d586a3a7fc3b0fe04
3
  size 449471589