Transformers
PyTorch
English
pixel
pretraining
Inference Endpoints
plip commited on
Commit
d64ffb3
1 Parent(s): 1577352

Training in progress, step 460000

Browse files
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:30290edc8628fd3c3ef18b3c5aeed7f069b37f58cee15ba21ffc0026c01c3730
3
  size 893439185
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e074c33dcba955530635f7c301cc0616d35e94c4d9e25f501a0d9edd512370f3
3
  size 893439185
last-checkpoint/pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:cd9bd4abec55ec3aff5c6a63e004f193b84327f4dea19bd4c7a418c248e58ed7
3
  size 449471589
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8e2e3c76b0bd22486ffeb7f1582064821337785eddce5493639f753ea7af7c21
3
  size 449471589
last-checkpoint/rng_state_0.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:33d4cd7454368d736d737996ed03879986986a143829539c951d1987c1b5985b
3
  size 14503
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f07bf259da4db58c67f5752e41be50bd05dbfaf1912a8b5878788f3ede910eb7
3
  size 14503
last-checkpoint/rng_state_1.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:7336b286bfd4476ee4aa817ed5f237f90f8c52aba8afeb7d24431d41ce3a20dc
3
  size 14503
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1e069aee1aca48a60052a1c66c7d1551fec7d9dcab99912ac030e1863b14f6a1
3
  size 14503
last-checkpoint/rng_state_2.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1d3e44169554700b12ce1323e27998dd02eb610802144e6e40dc2e6668fa701b
3
- size 14503
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:642ba2efc3dad359eda3b33bb6c5d67fffdc0e921c5ed6b47ef80068231cbd4a
3
+ size 14439
last-checkpoint/rng_state_3.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b37e67e1cf58930910192e85abdd9cbaabe8e6e23dc6148e7d6f7fcf570a387a
3
  size 14503
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5475a56a8e58f3a6d30456ecb3d60c907f9c5dd05e43f39a9dbfefa6d303c24c
3
  size 14503
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6ca5b8ec583e6ebb62b2f3066d6bca2c46b8614e9cfbd4e5e7bfdb3a9d7a2d86
3
  size 623
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d470fe106a7d346e8d83a1e5754bc519572ca0d497bb4adce56ffd8f58de945f
3
  size 623
last-checkpoint/trainer_state.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 6.871592835219204,
5
- "global_step": 450000,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
@@ -3336,11 +3336,85 @@
3336
  "eval_samples_per_second": 1006.215,
3337
  "eval_steps_per_second": 16.099,
3338
  "step": 450000
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
3339
  }
3340
  ],
3341
  "max_steps": 1000000,
3342
  "num_train_epochs": 16,
3343
- "total_flos": 3.154507803956729e+22,
3344
  "trial_name": null,
3345
  "trial_params": null
3346
  }
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 7.024294898224075,
5
+ "global_step": 460000,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
 
3336
  "eval_samples_per_second": 1006.215,
3337
  "eval_steps_per_second": 16.099,
3338
  "step": 450000
3339
+ },
3340
+ {
3341
+ "epoch": 6.89,
3342
+ "learning_rate": 9.695948817687504e-05,
3343
+ "loss": 0.2699,
3344
+ "step": 451000
3345
+ },
3346
+ {
3347
+ "epoch": 6.9,
3348
+ "learning_rate": 9.673480678764858e-05,
3349
+ "loss": 0.2698,
3350
+ "step": 452000
3351
+ },
3352
+ {
3353
+ "epoch": 6.92,
3354
+ "learning_rate": 9.650994238925626e-05,
3355
+ "loss": 0.2699,
3356
+ "step": 453000
3357
+ },
3358
+ {
3359
+ "epoch": 6.93,
3360
+ "learning_rate": 9.628489744077911e-05,
3361
+ "loss": 0.2696,
3362
+ "step": 454000
3363
+ },
3364
+ {
3365
+ "epoch": 6.95,
3366
+ "learning_rate": 9.60596744032726e-05,
3367
+ "loss": 0.2699,
3368
+ "step": 455000
3369
+ },
3370
+ {
3371
+ "epoch": 6.95,
3372
+ "eval_runtime": 1.0008,
3373
+ "eval_samples_per_second": 999.165,
3374
+ "eval_steps_per_second": 15.987,
3375
+ "step": 455000
3376
+ },
3377
+ {
3378
+ "epoch": 6.96,
3379
+ "learning_rate": 9.583427573973982e-05,
3380
+ "loss": 0.2696,
3381
+ "step": 456000
3382
+ },
3383
+ {
3384
+ "epoch": 6.98,
3385
+ "learning_rate": 9.560870391510441e-05,
3386
+ "loss": 0.2695,
3387
+ "step": 457000
3388
+ },
3389
+ {
3390
+ "epoch": 6.99,
3391
+ "learning_rate": 9.538296139618371e-05,
3392
+ "loss": 0.2691,
3393
+ "step": 458000
3394
+ },
3395
+ {
3396
+ "epoch": 7.01,
3397
+ "learning_rate": 9.515705065166178e-05,
3398
+ "loss": 0.2693,
3399
+ "step": 459000
3400
+ },
3401
+ {
3402
+ "epoch": 7.02,
3403
+ "learning_rate": 9.493097415206228e-05,
3404
+ "loss": 0.2688,
3405
+ "step": 460000
3406
+ },
3407
+ {
3408
+ "epoch": 7.02,
3409
+ "eval_runtime": 1.0225,
3410
+ "eval_samples_per_second": 978.034,
3411
+ "eval_steps_per_second": 15.649,
3412
+ "step": 460000
3413
  }
3414
  ],
3415
  "max_steps": 1000000,
3416
  "num_train_epochs": 16,
3417
+ "total_flos": 3.2246074079189274e+22,
3418
  "trial_name": null,
3419
  "trial_params": null
3420
  }
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:cd9bd4abec55ec3aff5c6a63e004f193b84327f4dea19bd4c7a418c248e58ed7
3
  size 449471589
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8e2e3c76b0bd22486ffeb7f1582064821337785eddce5493639f753ea7af7c21
3
  size 449471589