Transformers
PyTorch
English
pixel
pretraining
Inference Endpoints
plip commited on
Commit
95270eb
1 Parent(s): 4a1e3f9

Training in progress, step 510000

Browse files
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4a329db70ea5526ba5e4b910d073864205b498f32a4378b384003610aada51d6
3
  size 893439185
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f9c7cde519c11bec5ed8e21c1c5f7e7a48e4331db9100e67e0f7768dfb456674
3
  size 893439185
last-checkpoint/pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c3a4d73b67517b389449be9b81a6d62f88071ffeb1fb6ad679e4c42b56b14bda
3
  size 449471589
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cd6d7bd0a49b23290ba71dd1b9be309e7cb7e756973affa570765d9e0327dcf1
3
  size 449471589
last-checkpoint/rng_state_0.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d512ffa1b18c6ccc8dac4806c6008b76bb8f78c31b60a4336ad6a2a9fa9bb7a3
3
- size 14439
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6b70dfee257c642602f7c3f1ed43cef4aa5ccfe8fedec32ff54410f192e88eb6
3
+ size 14503
last-checkpoint/rng_state_1.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f66cebabe552d21647073ceeabf71a9c5fddbc9e0c70066a6914d3a038a79677
3
  size 14503
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cc166cba1eb0e6e74e3f3bd2046727896088467fe3b854b45c839137552ff680
3
  size 14503
last-checkpoint/rng_state_2.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:572120ff5e1d57786cb947f3c52e750254c5a4ff2a5c06ef2608f45e6a4e60de
3
  size 14503
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:523dad95eba9c45397e0fcdf0c46383b4719d62bdd88758deb0f327662ac86d0
3
  size 14503
last-checkpoint/rng_state_3.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ed3efb56468deb71f34f2a6667b3f91c0deb4e0556b62db345c7c959c339450d
3
- size 14439
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:de1cff2e14d92828be5901277d3f564e9608bb294b5c00feb6b3bc8739ef4af7
3
+ size 14503
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:61639df917cea6bc1eea9e7a1f48d3f6c9acb9557d8752aa9847613f1b857ad8
3
  size 623
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ce6a9467a251e9cbea13fa7869db249fdcb8d7f75671c56b9051c9e63a855aaa
3
  size 623
last-checkpoint/trainer_state.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 7.63510315024356,
5
- "global_step": 500000,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
@@ -3706,11 +3706,85 @@
3706
  "eval_samples_per_second": 907.298,
3707
  "eval_steps_per_second": 14.517,
3708
  "step": 500000
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
3709
  }
3710
  ],
3711
  "max_steps": 1000000,
3712
  "num_train_epochs": 16,
3713
- "total_flos": 3.505008452040316e+22,
3714
  "trial_name": null,
3715
  "trial_params": null
3716
  }
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 7.787805213248431,
5
+ "global_step": 510000,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
 
3706
  "eval_samples_per_second": 907.298,
3707
  "eval_steps_per_second": 14.517,
3708
  "step": 500000
3709
+ },
3710
+ {
3711
+ "epoch": 7.65,
3712
+ "learning_rate": 8.55498278627369e-05,
3713
+ "loss": 0.2646,
3714
+ "step": 501000
3715
+ },
3716
+ {
3717
+ "epoch": 7.67,
3718
+ "learning_rate": 8.531904085038221e-05,
3719
+ "loss": 0.2646,
3720
+ "step": 502000
3721
+ },
3722
+ {
3723
+ "epoch": 7.68,
3724
+ "learning_rate": 8.508819566984897e-05,
3725
+ "loss": 0.2641,
3726
+ "step": 503000
3727
+ },
3728
+ {
3729
+ "epoch": 7.7,
3730
+ "learning_rate": 8.485729484562307e-05,
3731
+ "loss": 0.2641,
3732
+ "step": 504000
3733
+ },
3734
+ {
3735
+ "epoch": 7.71,
3736
+ "learning_rate": 8.462634090279895e-05,
3737
+ "loss": 0.264,
3738
+ "step": 505000
3739
+ },
3740
+ {
3741
+ "epoch": 7.71,
3742
+ "eval_runtime": 1.0129,
3743
+ "eval_samples_per_second": 987.309,
3744
+ "eval_steps_per_second": 15.797,
3745
+ "step": 505000
3746
+ },
3747
+ {
3748
+ "epoch": 7.73,
3749
+ "learning_rate": 8.439533636705194e-05,
3750
+ "loss": 0.2635,
3751
+ "step": 506000
3752
+ },
3753
+ {
3754
+ "epoch": 7.74,
3755
+ "learning_rate": 8.416428376461061e-05,
3756
+ "loss": 0.2644,
3757
+ "step": 507000
3758
+ },
3759
+ {
3760
+ "epoch": 7.76,
3761
+ "learning_rate": 8.393318562222916e-05,
3762
+ "loss": 0.2642,
3763
+ "step": 508000
3764
+ },
3765
+ {
3766
+ "epoch": 7.77,
3767
+ "learning_rate": 8.370204446715997e-05,
3768
+ "loss": 0.2638,
3769
+ "step": 509000
3770
+ },
3771
+ {
3772
+ "epoch": 7.79,
3773
+ "learning_rate": 8.347086282712556e-05,
3774
+ "loss": 0.2637,
3775
+ "step": 510000
3776
+ },
3777
+ {
3778
+ "epoch": 7.79,
3779
+ "eval_runtime": 1.1071,
3780
+ "eval_samples_per_second": 903.278,
3781
+ "eval_steps_per_second": 14.452,
3782
+ "step": 510000
3783
  }
3784
  ],
3785
  "max_steps": 1000000,
3786
  "num_train_epochs": 16,
3787
+ "total_flos": 3.575108713070663e+22,
3788
  "trial_name": null,
3789
  "trial_params": null
3790
  }
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c3a4d73b67517b389449be9b81a6d62f88071ffeb1fb6ad679e4c42b56b14bda
3
  size 449471589
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cd6d7bd0a49b23290ba71dd1b9be309e7cb7e756973affa570765d9e0327dcf1
3
  size 449471589