Transformers
PyTorch
English
pixel
pretraining
Inference Endpoints
plip commited on
Commit
b6a1c3c
1 Parent(s): 4d400fb

Training in progress, step 540000

Browse files
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:00b387d4f9f04e8c9303a92c0ddb4fecebb2d329d1bad50fe16824cce0afa53f
3
  size 893439185
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3cce3705a1c8b8d8d4264e967a6f95acb36457da2099b2e0f10708b7bc8b02f7
3
  size 893439185
last-checkpoint/pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1625f5e23d8f1ad41b87b90859c51a9a7e8e0c2f203d02de268a294a2c0644e2
3
  size 449471589
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:10387ca16d2be862ac39f8a7dd403935e8f63c843663bd6c250c84cc9afccb17
3
  size 449471589
last-checkpoint/rng_state_0.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f39691b2c245489425bdb803bff6f96b52586788af71785b57e3d212e063166a
3
  size 14503
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2d6a05599d68c81d8f28a8a18f0fba06e8b974a2ea269e8529ff0449633b1df0
3
  size 14503
last-checkpoint/rng_state_1.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:af7326fef653b7a70f9f155f4acb1e3ee4232444cd6d9204bc168a2d2e45c727
3
- size 14503
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fa440e15eff2f549811ca7872de21865d48dd11cb8b6542ab71253c6945d2c0d
3
+ size 14567
last-checkpoint/rng_state_2.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ee1218ce9b7108b8255e87b249fdf7f16f07137f90939e9084af13b071ce6ffe
3
- size 14439
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:24051c040fbf1ab84f4d62008b8fd2ab04d63f18b11e30fd62216b89cf665574
3
+ size 14503
last-checkpoint/rng_state_3.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f9c5bbfb1027111f06815f4497b89bb272c0861b51bd6d39c91af85222b32d16
3
- size 14567
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:28fbe9c447e2dbc1b0d90d8fb5fa32bb60a8b179ed5bdf4dc956ff563b72c4fc
3
+ size 14503
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:286366dc95c1888d75c773db3569adfce838dc105f2552542e8252bf7ab19ebf
3
  size 623
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:312a9240a59bfb6f588851dc4640a2bea628ee45c54031017e35bcac8788a581
3
  size 623
last-checkpoint/trainer_state.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 8.093209339258173,
5
- "global_step": 530000,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
@@ -3928,11 +3928,85 @@
3928
  "eval_samples_per_second": 986.75,
3929
  "eval_steps_per_second": 15.788,
3930
  "step": 530000
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
3931
  }
3932
  ],
3933
  "max_steps": 1000000,
3934
  "num_train_epochs": 16,
3935
- "total_flos": 3.7153085780632086e+22,
3936
  "trial_name": null,
3937
  "trial_params": null
3938
  }
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 8.245911402263044,
5
+ "global_step": 540000,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
 
3928
  "eval_samples_per_second": 986.75,
3929
  "eval_steps_per_second": 15.788,
3930
  "step": 530000
3931
+ },
3932
+ {
3933
+ "epoch": 8.11,
3934
+ "learning_rate": 7.861117648512725e-05,
3935
+ "loss": 0.2613,
3936
+ "step": 531000
3937
+ },
3938
+ {
3939
+ "epoch": 8.12,
3940
+ "learning_rate": 7.837974429185103e-05,
3941
+ "loss": 0.2614,
3942
+ "step": 532000
3943
+ },
3944
+ {
3945
+ "epoch": 8.14,
3946
+ "learning_rate": 7.814832981743164e-05,
3947
+ "loss": 0.2614,
3948
+ "step": 533000
3949
+ },
3950
+ {
3951
+ "epoch": 8.15,
3952
+ "learning_rate": 7.791693559258072e-05,
3953
+ "loss": 0.2608,
3954
+ "step": 534000
3955
+ },
3956
+ {
3957
+ "epoch": 8.17,
3958
+ "learning_rate": 7.768556414778842e-05,
3959
+ "loss": 0.2606,
3960
+ "step": 535000
3961
+ },
3962
+ {
3963
+ "epoch": 8.17,
3964
+ "eval_runtime": 1.097,
3965
+ "eval_samples_per_second": 911.552,
3966
+ "eval_steps_per_second": 14.585,
3967
+ "step": 535000
3968
+ },
3969
+ {
3970
+ "epoch": 8.18,
3971
+ "learning_rate": 7.74542180132958e-05,
3972
+ "loss": 0.2606,
3973
+ "step": 536000
3974
+ },
3975
+ {
3976
+ "epoch": 8.2,
3977
+ "learning_rate": 7.72228997190671e-05,
3978
+ "loss": 0.2608,
3979
+ "step": 537000
3980
+ },
3981
+ {
3982
+ "epoch": 8.22,
3983
+ "learning_rate": 7.699161179476217e-05,
3984
+ "loss": 0.2604,
3985
+ "step": 538000
3986
+ },
3987
+ {
3988
+ "epoch": 8.23,
3989
+ "learning_rate": 7.676035676970863e-05,
3990
+ "loss": 0.2606,
3991
+ "step": 539000
3992
+ },
3993
+ {
3994
+ "epoch": 8.25,
3995
+ "learning_rate": 7.652913717287443e-05,
3996
+ "loss": 0.2604,
3997
+ "step": 540000
3998
+ },
3999
+ {
4000
+ "epoch": 8.25,
4001
+ "eval_runtime": 1.1778,
4002
+ "eval_samples_per_second": 849.063,
4003
+ "eval_steps_per_second": 13.585,
4004
+ "step": 540000
4005
  }
4006
  ],
4007
  "max_steps": 1000000,
4008
  "num_train_epochs": 16,
4009
+ "total_flos": 3.785408839093556e+22,
4010
  "trial_name": null,
4011
  "trial_params": null
4012
  }
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1625f5e23d8f1ad41b87b90859c51a9a7e8e0c2f203d02de268a294a2c0644e2
3
  size 449471589
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:10387ca16d2be862ac39f8a7dd403935e8f63c843663bd6c250c84cc9afccb17
3
  size 449471589