Transformers
PyTorch
English
pixel
pretraining
Inference Endpoints
plip commited on
Commit
7cd08af
1 Parent(s): cdd8c30

Training in progress, step 390000

Browse files
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c700adab32c9c77d19e150bd97404af77c8ea4f249d7d8819f10ecd29a7599aa
3
  size 893439185
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4e4182e3962d3a040ab734b61da56d604a525bd5f2d61cf2e3f5b36f5f0ee5bc
3
  size 893439185
last-checkpoint/pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b70ffcb599d0cbcc5aa0449b31396d7f0aecaf32d47481cf0cbeb78e7394dcdc
3
  size 449471589
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bf099ec439cbdff64f3d3b55ea1f32c5386c40432f4a5418054927a7f60a7a71
3
  size 449471589
last-checkpoint/rng_state_0.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:074f082b7918427797301b29e7c6af54e31efb39ae44b35e4533a95f5b0a9f49
3
- size 14503
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c992fbbd7cb3ac4ba0d93a3c933e4f1384224ccab41105813a52127e0943be99
3
+ size 14439
last-checkpoint/rng_state_1.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:65f237a078b5c1beb61259bf8b7bce0aab72bc1a5221890351cf7a2047a3cdcc
3
- size 14439
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a56d30c04eda66f1451428a4a1783f0e0b3c6401e9dc47a22a9a23c6f9d71d1c
3
+ size 14503
last-checkpoint/rng_state_2.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3427e04a13ecc5863d163d8b4c944bb2837f27676722003cb6abda2606ce2015
3
  size 14503
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:252bfaee072432d2b9efeeb2414b13c69cfea81ef8749ee867aa8e12e0fa2d52
3
  size 14503
last-checkpoint/rng_state_3.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:dab2092ac253f5c93a298eee50fba2933b65f4ea17b7fc517f028648f502ea43
3
  size 14503
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b9e684c71dc83c29adb7891edadb6f809a0f52fc37575c6edaa71e9c79dd0a26
3
  size 14503
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f21b3afd8d405fcd9461eae3cafa8a4894a77b6f36c354aa188329ab6dfe547a
3
  size 623
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1d1c67928001883576d4a56b44f4eee5262f60a7be50b274805186459e2f4ae5
3
  size 623
last-checkpoint/trainer_state.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 5.802678394185105,
5
- "global_step": 380000,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
@@ -2818,11 +2818,85 @@
2818
  "eval_samples_per_second": 808.112,
2819
  "eval_steps_per_second": 12.93,
2820
  "step": 380000
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
2821
  }
2822
  ],
2823
  "max_steps": 1000000,
2824
  "num_train_epochs": 16,
2825
- "total_flos": 2.6638066338124477e+22,
2826
  "trial_name": null,
2827
  "trial_params": null
2828
  }
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 5.955380457189976,
5
+ "global_step": 390000,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
 
2818
  "eval_samples_per_second": 808.112,
2819
  "eval_steps_per_second": 12.93,
2820
  "step": 380000
2821
+ },
2822
+ {
2823
+ "epoch": 5.82,
2824
+ "learning_rate": 0.00011208832574099368,
2825
+ "loss": 0.2788,
2826
+ "step": 381000
2827
+ },
2828
+ {
2829
+ "epoch": 5.83,
2830
+ "learning_rate": 0.00011188241916068993,
2831
+ "loss": 0.2785,
2832
+ "step": 382000
2833
+ },
2834
+ {
2835
+ "epoch": 5.85,
2836
+ "learning_rate": 0.00011167616391935826,
2837
+ "loss": 0.2783,
2838
+ "step": 383000
2839
+ },
2840
+ {
2841
+ "epoch": 5.86,
2842
+ "learning_rate": 0.00011146956227257293,
2843
+ "loss": 0.2785,
2844
+ "step": 384000
2845
+ },
2846
+ {
2847
+ "epoch": 5.88,
2848
+ "learning_rate": 0.00011126261647969645,
2849
+ "loss": 0.2781,
2850
+ "step": 385000
2851
+ },
2852
+ {
2853
+ "epoch": 5.88,
2854
+ "eval_runtime": 1.0191,
2855
+ "eval_samples_per_second": 981.273,
2856
+ "eval_steps_per_second": 15.7,
2857
+ "step": 385000
2858
+ },
2859
+ {
2860
+ "epoch": 5.89,
2861
+ "learning_rate": 0.00011105532880385487,
2862
+ "loss": 0.2782,
2863
+ "step": 386000
2864
+ },
2865
+ {
2866
+ "epoch": 5.91,
2867
+ "learning_rate": 0.00011084770151191299,
2868
+ "loss": 0.2782,
2869
+ "step": 387000
2870
+ },
2871
+ {
2872
+ "epoch": 5.92,
2873
+ "learning_rate": 0.00011063973687444962,
2874
+ "loss": 0.2779,
2875
+ "step": 388000
2876
+ },
2877
+ {
2878
+ "epoch": 5.94,
2879
+ "learning_rate": 0.00011043143716573272,
2880
+ "loss": 0.2774,
2881
+ "step": 389000
2882
+ },
2883
+ {
2884
+ "epoch": 5.96,
2885
+ "learning_rate": 0.00011022280466369448,
2886
+ "loss": 0.2776,
2887
+ "step": 390000
2888
+ },
2889
+ {
2890
+ "epoch": 5.96,
2891
+ "eval_runtime": 1.0236,
2892
+ "eval_samples_per_second": 976.954,
2893
+ "eval_steps_per_second": 15.631,
2894
+ "step": 390000
2895
  }
2896
  ],
2897
  "max_steps": 1000000,
2898
  "num_train_epochs": 16,
2899
+ "total_flos": 2.733906894842795e+22,
2900
  "trial_name": null,
2901
  "trial_params": null
2902
  }
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b70ffcb599d0cbcc5aa0449b31396d7f0aecaf32d47481cf0cbeb78e7394dcdc
3
  size 449471589
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bf099ec439cbdff64f3d3b55ea1f32c5386c40432f4a5418054927a7f60a7a71
3
  size 449471589