Transformers
PyTorch
English
pixel
pretraining
Inference Endpoints
plip commited on
Commit
da61d73
1 Parent(s): e542e3e

Training in progress, step 130000

Browse files
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:dcc09d22e5596eeac7cbb0a1dabfeacc19af29a548e591c9f749208980b7916a
3
  size 893439185
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:eeef6904cfa32f848b9f1346c4e3c74b0fca915a351a8997e9e3c00ba9dcbbc5
3
  size 893439185
last-checkpoint/pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ca3c3ce97bc1c8862c7db669723fd31e2c4926cda5ff7010a6c07f89d409cca1
3
  size 449471589
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dd16d9355565127d935e0581e06272701548caedebf90cbf8e7ec4700d308c92
3
  size 449471589
last-checkpoint/rng_state_0.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:7fc306b40ea32fc4b974d92fa4436f6126d03d93634b99c4944393049e4dd34d
3
  size 14503
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0c3369fb2b68cab39ce1c39a70e82cbae407ebef20a3614cae5eb0b8e29d67bb
3
  size 14503
last-checkpoint/rng_state_1.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:83b1dc502294b82568367d2e77a4231f6fb11b7296d845de6be2991e1953c467
3
  size 14503
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:adc589057b5ab70a677240ea7ff1b31050aa971f7175362abbce011dcf3e27e4
3
  size 14503
last-checkpoint/rng_state_2.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:90c7dcc243e1aa80b2e25ba58bbf11ac2e612d08701ac3bc19fe812cf11394f0
3
  size 14503
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a41a3d1e1a810c6ca0c122b02d703e10618433c01e7c57fdc5c7f1070e2b8072
3
  size 14503
last-checkpoint/rng_state_3.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b63f502697a67e82fe85208c9b5cb87051cc2490893eb283cf394fd4c0f8586c
3
  size 14503
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1078dca16195c4c6a10dd246658bec7f4ef493b51f155eaecbd40e7b74829373
3
  size 14503
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:27556e6e847d06ad2f934e5a134bda54baf3ade1f4eea8c1e651de3a5e1bb425
3
  size 623
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0714a313dd4ce4e99c82bf70e5eccb41f6003fe208bd22b2e683fd5e729c762a
3
  size 623
last-checkpoint/trainer_state.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 1.8324247560584543,
5
- "global_step": 120000,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
@@ -894,11 +894,85 @@
894
  "eval_samples_per_second": 943.744,
895
  "eval_steps_per_second": 15.1,
896
  "step": 120000
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
897
  }
898
  ],
899
  "max_steps": 1000000,
900
  "num_train_epochs": 16,
901
- "total_flos": 8.41202475296017e+21,
902
  "trial_name": null,
903
  "trial_params": null
904
  }
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 1.9851268190633256,
5
+ "global_step": 130000,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
 
894
  "eval_samples_per_second": 943.744,
895
  "eval_steps_per_second": 15.1,
896
  "step": 120000
897
+ },
898
+ {
899
+ "epoch": 1.85,
900
+ "learning_rate": 0.0001480793809853123,
901
+ "loss": 0.3478,
902
+ "step": 121000
903
+ },
904
+ {
905
+ "epoch": 1.86,
906
+ "learning_rate": 0.00014802515565806107,
907
+ "loss": 0.3468,
908
+ "step": 122000
909
+ },
910
+ {
911
+ "epoch": 1.88,
912
+ "learning_rate": 0.00014797018641860612,
913
+ "loss": 0.346,
914
+ "step": 123000
915
+ },
916
+ {
917
+ "epoch": 1.89,
918
+ "learning_rate": 0.0001479144738680823,
919
+ "loss": 0.3474,
920
+ "step": 124000
921
+ },
922
+ {
923
+ "epoch": 1.91,
924
+ "learning_rate": 0.00014785801861575312,
925
+ "loss": 0.3447,
926
+ "step": 125000
927
+ },
928
+ {
929
+ "epoch": 1.91,
930
+ "eval_runtime": 0.9375,
931
+ "eval_samples_per_second": 1066.699,
932
+ "eval_steps_per_second": 17.067,
933
+ "step": 125000
934
+ },
935
+ {
936
+ "epoch": 1.92,
937
+ "learning_rate": 0.00014780082127900416,
938
+ "loss": 0.3439,
939
+ "step": 126000
940
+ },
941
+ {
942
+ "epoch": 1.94,
943
+ "learning_rate": 0.00014774288248333635,
944
+ "loss": 0.3436,
945
+ "step": 127000
946
+ },
947
+ {
948
+ "epoch": 1.95,
949
+ "learning_rate": 0.00014768420286235908,
950
+ "loss": 0.3429,
951
+ "step": 128000
952
+ },
953
+ {
954
+ "epoch": 1.97,
955
+ "learning_rate": 0.00014762478305778328,
956
+ "loss": 0.3422,
957
+ "step": 129000
958
+ },
959
+ {
960
+ "epoch": 1.99,
961
+ "learning_rate": 0.0001475646237194144,
962
+ "loss": 0.3414,
963
+ "step": 130000
964
+ },
965
+ {
966
+ "epoch": 1.99,
967
+ "eval_runtime": 1.0085,
968
+ "eval_samples_per_second": 991.553,
969
+ "eval_steps_per_second": 15.865,
970
+ "step": 130000
971
  }
972
  ],
973
  "max_steps": 1000000,
974
  "num_train_epochs": 16,
975
+ "total_flos": 9.113027363263641e+21,
976
  "trial_name": null,
977
  "trial_params": null
978
  }
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ca3c3ce97bc1c8862c7db669723fd31e2c4926cda5ff7010a6c07f89d409cca1
3
  size 449471589
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dd16d9355565127d935e0581e06272701548caedebf90cbf8e7ec4700d308c92
3
  size 449471589