Transformers
PyTorch
English
pixel
pretraining
Inference Endpoints
plip commited on
Commit
dfc30ca
1 Parent(s): b72b22a

Training in progress, step 110000

Browse files
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:db2e288361a09b4b7188ac62d2aadda977c3d294af8ad3f73e2b72bd0663ea87
3
  size 893439185
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6c948eebbc33dfa7163a265ead1f1a9361b0c30c12a12de00dcf340d40d2658b
3
  size 893439185
last-checkpoint/pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6dfd008c5411020d58a84a813d4db30ca837b9cce0a2b859586eb276a2928563
3
  size 449471589
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3496297d45c4ecf853137342e06ee76ffd7a454b5f8f23c88381de10d12213d2
3
  size 449471589
last-checkpoint/rng_state_0.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e4f9af544e31603097b82ac1d9757b18d1e77cd9d3f5e0d82ff6f70151a0ec04
3
- size 14503
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:adcae24276cfe7a6f029d01f999621482dc39224a9126d96b9666e8134968416
3
+ size 14439
last-checkpoint/rng_state_1.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:80e543431b9b9286d502e9e435479120e37dfd67af853c03aa4e1515f6425d35
3
  size 14503
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:50b86582c3ae12c705a7005fed2da8884791451301066581e22169aa8046a6bd
3
  size 14503
last-checkpoint/rng_state_2.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:52d6b11ee335cf1f946095db74d4fad452219b5271b7968de8a4d7e06234c4ee
3
  size 14503
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9ea4115312e60b99085371b9865a77942fe890528298791f0e387803437d5ebb
3
  size 14503
last-checkpoint/rng_state_3.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4b705ae3e4d654b3daa3e7cb177baf9ea0f4c55d7b0f6bedb7d163c3dc6d902c
3
- size 14503
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9811453ee080e5df1835ce925467584d500ae5c97c544e104ff63747920507e0
3
+ size 14567
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ab0b752b3079dc9be868ddd61d4a48c6f227ceaa95b4267c4d5e0911b7baba7b
3
  size 623
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4aabac21e516317a7b98a87a94ce8a8b7afae82a6e696839a4840e30fc5507ba
3
  size 623
last-checkpoint/trainer_state.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 1.527020630048712,
5
- "global_step": 100000,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
@@ -746,11 +746,85 @@
746
  "eval_samples_per_second": 995.424,
747
  "eval_steps_per_second": 15.927,
748
  "step": 100000
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
749
  }
750
  ],
751
  "max_steps": 1000000,
752
  "num_train_epochs": 16,
753
- "total_flos": 7.010019532353227e+21,
754
  "trial_name": null,
755
  "trial_params": null
756
  }
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 1.6797226930535831,
5
+ "global_step": 110000,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
 
746
  "eval_samples_per_second": 995.424,
747
  "eval_steps_per_second": 15.927,
748
  "step": 100000
749
+ },
750
+ {
751
+ "epoch": 1.54,
752
+ "learning_rate": 0.00014900681246730852,
753
+ "loss": 0.3643,
754
+ "step": 101000
755
+ },
756
+ {
757
+ "epoch": 1.56,
758
+ "learning_rate": 0.00014896757904898125,
759
+ "loss": 0.3646,
760
+ "step": 102000
761
+ },
762
+ {
763
+ "epoch": 1.57,
764
+ "learning_rate": 0.00014892759141225904,
765
+ "loss": 0.3628,
766
+ "step": 103000
767
+ },
768
+ {
769
+ "epoch": 1.59,
770
+ "learning_rate": 0.00014888684999444035,
771
+ "loss": 0.3616,
772
+ "step": 104000
773
+ },
774
+ {
775
+ "epoch": 1.6,
776
+ "learning_rate": 0.00014884535524106675,
777
+ "loss": 0.3604,
778
+ "step": 105000
779
+ },
780
+ {
781
+ "epoch": 1.6,
782
+ "eval_runtime": 1.0499,
783
+ "eval_samples_per_second": 952.499,
784
+ "eval_steps_per_second": 15.24,
785
+ "step": 105000
786
+ },
787
+ {
788
+ "epoch": 1.62,
789
+ "learning_rate": 0.00014880310760591824,
790
+ "loss": 0.3594,
791
+ "step": 106000
792
+ },
793
+ {
794
+ "epoch": 1.63,
795
+ "learning_rate": 0.0001487601075510082,
796
+ "loss": 0.3597,
797
+ "step": 107000
798
+ },
799
+ {
800
+ "epoch": 1.65,
801
+ "learning_rate": 0.0001487163555465783,
802
+ "loss": 0.3583,
803
+ "step": 108000
804
+ },
805
+ {
806
+ "epoch": 1.66,
807
+ "learning_rate": 0.0001486718520710935,
808
+ "loss": 0.3583,
809
+ "step": 109000
810
+ },
811
+ {
812
+ "epoch": 1.68,
813
+ "learning_rate": 0.00014862659761123663,
814
+ "loss": 0.3558,
815
+ "step": 110000
816
+ },
817
+ {
818
+ "epoch": 1.68,
819
+ "eval_runtime": 1.0153,
820
+ "eval_samples_per_second": 984.91,
821
+ "eval_steps_per_second": 15.759,
822
+ "step": 110000
823
  }
824
  ],
825
  "max_steps": 1000000,
826
  "num_train_epochs": 16,
827
+ "total_flos": 7.711022142656698e+21,
828
  "trial_name": null,
829
  "trial_params": null
830
  }
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6dfd008c5411020d58a84a813d4db30ca837b9cce0a2b859586eb276a2928563
3
  size 449471589
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3496297d45c4ecf853137342e06ee76ffd7a454b5f8f23c88381de10d12213d2
3
  size 449471589