Transformers
PyTorch
English
pixel
pretraining
Inference Endpoints
plip commited on
Commit
9ccd2d1
1 Parent(s): dcf1daf

Training in progress, step 990000

Browse files
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:90e6f74ca02156084fa05f854168c4cbdee8fc0fa6687cea7dfffc7ceaa970ef
3
  size 893439185
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4cbfc1ed883942984be588c84681fbb0b292e529986dcbab5a1fecaa3f6ad447
3
  size 893439185
last-checkpoint/pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:44a8bb7d1ad03b47ab97301f2bf5aa4416e913d62ffabd09bdd937d55c43233d
3
  size 449471589
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fc73418bd52c0694a19af6083331d7a4a133f36616e77cb56fc9fc0bb18ad264
3
  size 449471589
last-checkpoint/rng_state_0.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2693c812482df2fdf768d0c19e41d192e583b64a43dbe767a2677f629f2520e7
3
  size 14503
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c3cbe84c4b275ece4dfc8b045971a9447b9468599c6de1ac7856d818ab7fcce6
3
  size 14503
last-checkpoint/rng_state_1.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:39770cef90df6052fa5bdc49403a83d0e05cc2d3766019022596476c4a73f3b2
3
  size 14503
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6ca4b049386ceb25b5284b9754462b13ddabb069762bc1b4ce1a9e94d95e348c
3
  size 14503
last-checkpoint/rng_state_2.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:708a00e78f0bdafbd2eb890af573c704006de2c61a1f639e3fb47ce38e039820
3
  size 14503
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:733172b1d4a99d1dcac219cdba47537d2e3c42c728e60a468833c7a7eb409d93
3
  size 14503
last-checkpoint/rng_state_3.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c3d789d948e2afb641edc41de23d3e0ac8454e4ca3cace740853515e0185e05d
3
  size 14503
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e1a20d0d880982442a49c1adeca0b36b7c4aa9ce9768b58e40b03f2358d78bf3
3
  size 14503
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b1f60f9446cba0320cf9ced93c4b14816af8d6988d011f7cc2f5b01e8ada101d
3
  size 623
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b2358905887cd0ce80c53b6e8a0174e039c4c5bd62c6c91c86f0312f9b46fcf7
3
  size 623
last-checkpoint/trainer_state.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 14.964802174477377,
5
- "global_step": 980000,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
@@ -7258,11 +7258,85 @@
7258
  "eval_samples_per_second": 1335.226,
7259
  "eval_steps_per_second": 21.364,
7260
  "step": 980000
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
7261
  }
7262
  ],
7263
  "max_steps": 1000000,
7264
  "num_train_epochs": 16,
7265
- "total_flos": 6.869816382019938e+22,
7266
  "trial_name": null,
7267
  "trial_params": null
7268
  }
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 15.11750423748225,
5
+ "global_step": 990000,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
 
7258
  "eval_samples_per_second": 1335.226,
7259
  "eval_steps_per_second": 21.364,
7260
  "step": 980000
7261
+ },
7262
+ {
7263
+ "epoch": 14.98,
7264
+ "learning_rate": 1.0138129010020992e-05,
7265
+ "loss": 0.2272,
7266
+ "step": 981000
7267
+ },
7268
+ {
7269
+ "epoch": 15.0,
7270
+ "learning_rate": 1.0123975923584488e-05,
7271
+ "loss": 0.2273,
7272
+ "step": 982000
7273
+ },
7274
+ {
7275
+ "epoch": 15.01,
7276
+ "learning_rate": 1.0110586990152152e-05,
7277
+ "loss": 0.227,
7278
+ "step": 983000
7279
+ },
7280
+ {
7281
+ "epoch": 15.03,
7282
+ "learning_rate": 1.0097962356143219e-05,
7283
+ "loss": 0.2273,
7284
+ "step": 984000
7285
+ },
7286
+ {
7287
+ "epoch": 15.04,
7288
+ "learning_rate": 1.0086102159618668e-05,
7289
+ "loss": 0.227,
7290
+ "step": 985000
7291
+ },
7292
+ {
7293
+ "epoch": 15.04,
7294
+ "eval_runtime": 0.7868,
7295
+ "eval_samples_per_second": 1271.022,
7296
+ "eval_steps_per_second": 20.336,
7297
+ "step": 985000
7298
+ },
7299
+ {
7300
+ "epoch": 15.06,
7301
+ "learning_rate": 1.0075006530279694e-05,
7302
+ "loss": 0.2271,
7303
+ "step": 986000
7304
+ },
7305
+ {
7306
+ "epoch": 15.07,
7307
+ "learning_rate": 1.0064675589466339e-05,
7308
+ "loss": 0.2268,
7309
+ "step": 987000
7310
+ },
7311
+ {
7312
+ "epoch": 15.09,
7313
+ "learning_rate": 1.0055109450156098e-05,
7314
+ "loss": 0.2272,
7315
+ "step": 988000
7316
+ },
7317
+ {
7318
+ "epoch": 15.1,
7319
+ "learning_rate": 1.0046308216962759e-05,
7320
+ "loss": 0.2269,
7321
+ "step": 989000
7322
+ },
7323
+ {
7324
+ "epoch": 15.12,
7325
+ "learning_rate": 1.0038271986135177e-05,
7326
+ "loss": 0.2272,
7327
+ "step": 990000
7328
+ },
7329
+ {
7330
+ "epoch": 15.12,
7331
+ "eval_runtime": 0.7713,
7332
+ "eval_samples_per_second": 1296.438,
7333
+ "eval_steps_per_second": 20.743,
7334
+ "step": 990000
7335
  }
7336
  ],
7337
  "max_steps": 1000000,
7338
  "num_train_epochs": 16,
7339
+ "total_flos": 6.939915985982136e+22,
7340
  "trial_name": null,
7341
  "trial_params": null
7342
  }
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:44a8bb7d1ad03b47ab97301f2bf5aa4416e913d62ffabd09bdd937d55c43233d
3
  size 449471589
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fc73418bd52c0694a19af6083331d7a4a133f36616e77cb56fc9fc0bb18ad264
3
  size 449471589