Transformers
PyTorch
English
pixel
pretraining
Inference Endpoints
plip commited on
Commit
17dde6c
1 Parent(s): eef34d9

Training in progress, step 560000

Browse files
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6c26dfdb95640433391e289b9d54c29ba637889e22ac54f90b0e4758926e0b34
3
  size 893439185
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d8ab35ed4dfefd8dd33fb26f0ecf541378b45831852a54aeb8f775b92df21738
3
  size 893439185
last-checkpoint/pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:affd4afd21029b52701e8d0046ed5d64853de0037c32a35ed3d7e452fd7c0e84
3
  size 449471589
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5321ac05ebfcc017f8c041dae493ee5ce4f8eaceb97ac0dbd2e5b7ff1909ad9f
3
  size 449471589
last-checkpoint/rng_state_0.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:668a667c0141b3007fbd5f23f3195d50d9a952d3b42af4d471955e90b35901bf
3
- size 14439
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1c595110edd758e9e0a71c6845041a2d22c5cf58679d14f120b5cb63abc84493
3
+ size 14503
last-checkpoint/rng_state_1.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ed9a47d2a307e89814d3463ee5fc48f3b3365083fd9c82a5f581a3087e2941c8
3
  size 14503
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:715147c7486ebd169cb8e58f73bc4aa6a8bc3129e6581c29e50cbdd2f06aae29
3
  size 14503
last-checkpoint/rng_state_2.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3e8a638d577539d28ce2053ec5b75e3eed1d5ad4a147b887facb578c40f25088
3
  size 14503
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2da28d7b7099d5f85e00929347b66a092dbe7cfdb67ae3df05ae5bcb6ee3a235
3
  size 14503
last-checkpoint/rng_state_3.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:30723df40dcd4e911f2e4b8fee07e2767c8ee7ced5c90fa064aabaf279f01230
3
- size 14503
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:18d187c6fad30982ef7c6cac2865f72e7d2e1a26561d9ab8f74149dc0f5b946f
3
+ size 14439
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8de7df7ff53e44669a043f69e39b55baa82d81ac1777f09e2f6159ffcb51dd66
3
  size 623
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:af9a25b33d29c3fd157c79676adec6abbe35f3978d907c7efc857fe0437c64ac
3
  size 623
last-checkpoint/trainer_state.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 8.398613465267916,
5
- "global_step": 550000,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
@@ -4076,11 +4076,85 @@
4076
  "eval_samples_per_second": 1010.184,
4077
  "eval_steps_per_second": 16.163,
4078
  "step": 550000
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
4079
  }
4080
  ],
4081
  "max_steps": 1000000,
4082
  "num_train_epochs": 16,
4083
- "total_flos": 3.855509100123903e+22,
4084
  "trial_name": null,
4085
  "trial_params": null
4086
  }
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 8.551315528272786,
5
+ "global_step": 560000,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
 
4076
  "eval_samples_per_second": 1010.184,
4077
  "eval_steps_per_second": 16.163,
4078
  "step": 550000
4079
+ },
4080
+ {
4081
+ "epoch": 8.41,
4082
+ "learning_rate": 7.39887827118248e-05,
4083
+ "loss": 0.259,
4084
+ "step": 551000
4085
+ },
4086
+ {
4087
+ "epoch": 8.43,
4088
+ "learning_rate": 7.375818534442207e-05,
4089
+ "loss": 0.2588,
4090
+ "step": 552000
4091
+ },
4092
+ {
4093
+ "epoch": 8.44,
4094
+ "learning_rate": 7.352765623650435e-05,
4095
+ "loss": 0.259,
4096
+ "step": 553000
4097
+ },
4098
+ {
4099
+ "epoch": 8.46,
4100
+ "learning_rate": 7.329719790910108e-05,
4101
+ "loss": 0.2587,
4102
+ "step": 554000
4103
+ },
4104
+ {
4105
+ "epoch": 8.47,
4106
+ "learning_rate": 7.30668128824676e-05,
4107
+ "loss": 0.2587,
4108
+ "step": 555000
4109
+ },
4110
+ {
4111
+ "epoch": 8.47,
4112
+ "eval_runtime": 1.1635,
4113
+ "eval_samples_per_second": 859.466,
4114
+ "eval_steps_per_second": 13.751,
4115
+ "step": 555000
4116
+ },
4117
+ {
4118
+ "epoch": 8.49,
4119
+ "learning_rate": 7.283650367605764e-05,
4120
+ "loss": 0.2584,
4121
+ "step": 556000
4122
+ },
4123
+ {
4124
+ "epoch": 8.51,
4125
+ "learning_rate": 7.260627280849581e-05,
4126
+ "loss": 0.2585,
4127
+ "step": 557000
4128
+ },
4129
+ {
4130
+ "epoch": 8.52,
4131
+ "learning_rate": 7.23761227975499e-05,
4132
+ "loss": 0.2584,
4133
+ "step": 558000
4134
+ },
4135
+ {
4136
+ "epoch": 8.54,
4137
+ "learning_rate": 7.21460561601037e-05,
4138
+ "loss": 0.2584,
4139
+ "step": 559000
4140
+ },
4141
+ {
4142
+ "epoch": 8.55,
4143
+ "learning_rate": 7.191607541212897e-05,
4144
+ "loss": 0.2585,
4145
+ "step": 560000
4146
+ },
4147
+ {
4148
+ "epoch": 8.55,
4149
+ "eval_runtime": 1.1711,
4150
+ "eval_samples_per_second": 853.863,
4151
+ "eval_steps_per_second": 13.662,
4152
+ "step": 560000
4153
  }
4154
  ],
4155
  "max_steps": 1000000,
4156
  "num_train_epochs": 16,
4157
+ "total_flos": 3.92560936115425e+22,
4158
  "trial_name": null,
4159
  "trial_params": null
4160
  }
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:affd4afd21029b52701e8d0046ed5d64853de0037c32a35ed3d7e452fd7c0e84
3
  size 449471589
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5321ac05ebfcc017f8c041dae493ee5ce4f8eaceb97ac0dbd2e5b7ff1909ad9f
3
  size 449471589