Transformers
PyTorch
English
pixel
pretraining
Inference Endpoints
plip commited on
Commit
dfdd66e
1 Parent(s): 518b813

Training in progress, step 430000

Browse files
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c2f3d6b44eb31a5904720c6ef9f3e390e0825c4e9bc44d807b8966079fa39c18
3
  size 893439185
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0c4a14a4b300dc1a5da67108d934f51ece4d032d74a5b22ddb6baf522fdb8c1c
3
  size 893439185
last-checkpoint/pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:43bdf8dfd2503753ae90f61b7bb9fe12717af35ea212a47dbf67cd5903f5bff5
3
  size 449471589
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:29a338d7e31f1ebb55d71826f0de824d2a1d8633cac67c074239e146a6c6bf2d
3
  size 449471589
last-checkpoint/rng_state_0.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:cc2e9e51fe4eee7b642ed745674287b01af0553fd6bc1b8f03d1bfb83d45dd88
3
- size 14503
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:10c521743622eed6f2a8ce22651670cd6f7fb24994288ac8323ec1f5d533e8a1
3
+ size 14439
last-checkpoint/rng_state_1.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d7303688061045aa652b3652b66ace516eee8a80cc0cf60b455e243337822a42
3
  size 14503
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6dc65d4d1b61d6b6ec0b07de631a3fc7ef2baef1eecd8b2dd63afdc6d03ed25d
3
  size 14503
last-checkpoint/rng_state_2.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f87a487e7aba37c8dacc6a7f2504b596187c112ee85cf9f5586b459f5ed62ff7
3
  size 14503
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2003a4ffe1876cade3b569b7c4b3d4c928a46e1a7a6a797e8245fc18980679e5
3
  size 14503
last-checkpoint/rng_state_3.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c8eef20e1504bbd40c9a4046a6d63e017b73406d2bc77b0cb51859e2e7910822
3
- size 14503
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8d19681008a4b6b5d37d79f13ad91bb5cfd25c6887d3949264aeea07e7705212
3
+ size 14567
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:5ecb3d640c7c2649b2bba280f1d77ce8c7f1955289fab0ee4959a38aa2646819
3
  size 623
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1c41e7c1f83dca8045fba481a590c3c5a6ca39c080efa3c795ba2e0db9ab191b
3
  size 623
last-checkpoint/trainer_state.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 6.41348664620459,
5
- "global_step": 420000,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
@@ -3114,11 +3114,85 @@
3114
  "eval_samples_per_second": 947.861,
3115
  "eval_steps_per_second": 15.166,
3116
  "step": 420000
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
3117
  }
3118
  ],
3119
  "max_steps": 1000000,
3120
  "num_train_epochs": 16,
3121
- "total_flos": 2.9442070208656875e+22,
3122
  "trial_name": null,
3123
  "trial_params": null
3124
  }
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 6.566188709209461,
5
+ "global_step": 430000,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
 
3114
  "eval_samples_per_second": 947.861,
3115
  "eval_steps_per_second": 15.166,
3116
  "step": 420000
3117
+ },
3118
+ {
3119
+ "epoch": 6.43,
3120
+ "learning_rate": 0.00010360272179666802,
3121
+ "loss": 0.2742,
3122
+ "step": 421000
3123
+ },
3124
+ {
3125
+ "epoch": 6.44,
3126
+ "learning_rate": 0.00010338466326683697,
3127
+ "loss": 0.2733,
3128
+ "step": 422000
3129
+ },
3130
+ {
3131
+ "epoch": 6.46,
3132
+ "learning_rate": 0.00010316634900607497,
3133
+ "loss": 0.2737,
3134
+ "step": 423000
3135
+ },
3136
+ {
3137
+ "epoch": 6.47,
3138
+ "learning_rate": 0.00010294778140183182,
3139
+ "loss": 0.2732,
3140
+ "step": 424000
3141
+ },
3142
+ {
3143
+ "epoch": 6.49,
3144
+ "learning_rate": 0.00010272896284432785,
3145
+ "loss": 0.2733,
3146
+ "step": 425000
3147
+ },
3148
+ {
3149
+ "epoch": 6.49,
3150
+ "eval_runtime": 1.0035,
3151
+ "eval_samples_per_second": 996.544,
3152
+ "eval_steps_per_second": 15.945,
3153
+ "step": 425000
3154
+ },
3155
+ {
3156
+ "epoch": 6.51,
3157
+ "learning_rate": 0.00010250989572652766,
3158
+ "loss": 0.2728,
3159
+ "step": 426000
3160
+ },
3161
+ {
3162
+ "epoch": 6.52,
3163
+ "learning_rate": 0.00010229058244411427,
3164
+ "loss": 0.2729,
3165
+ "step": 427000
3166
+ },
3167
+ {
3168
+ "epoch": 6.54,
3169
+ "learning_rate": 0.00010207102539546251,
3170
+ "loss": 0.2728,
3171
+ "step": 428000
3172
+ },
3173
+ {
3174
+ "epoch": 6.55,
3175
+ "learning_rate": 0.00010185122698161311,
3176
+ "loss": 0.2726,
3177
+ "step": 429000
3178
+ },
3179
+ {
3180
+ "epoch": 6.57,
3181
+ "learning_rate": 0.00010163118960624632,
3182
+ "loss": 0.2725,
3183
+ "step": 430000
3184
+ },
3185
+ {
3186
+ "epoch": 6.57,
3187
+ "eval_runtime": 1.0983,
3188
+ "eval_samples_per_second": 910.508,
3189
+ "eval_steps_per_second": 14.568,
3190
+ "step": 430000
3191
  }
3192
  ],
3193
  "max_steps": 1000000,
3194
  "num_train_epochs": 16,
3195
+ "total_flos": 3.0143072818960347e+22,
3196
  "trial_name": null,
3197
  "trial_params": null
3198
  }
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:43bdf8dfd2503753ae90f61b7bb9fe12717af35ea212a47dbf67cd5903f5bff5
3
  size 449471589
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:29a338d7e31f1ebb55d71826f0de824d2a1d8633cac67c074239e146a6c6bf2d
3
  size 449471589