Training in progress, step 460000
Browse files- last-checkpoint/optimizer.pt +1 -1
- last-checkpoint/pytorch_model.bin +1 -1
- last-checkpoint/rng_state_0.pth +1 -1
- last-checkpoint/rng_state_1.pth +1 -1
- last-checkpoint/rng_state_2.pth +2 -2
- last-checkpoint/rng_state_3.pth +1 -1
- last-checkpoint/scheduler.pt +1 -1
- last-checkpoint/trainer_state.json +77 -3
- pytorch_model.bin +1 -1
last-checkpoint/optimizer.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 893439185
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e074c33dcba955530635f7c301cc0616d35e94c4d9e25f501a0d9edd512370f3
|
3 |
size 893439185
|
last-checkpoint/pytorch_model.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 449471589
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8e2e3c76b0bd22486ffeb7f1582064821337785eddce5493639f753ea7af7c21
|
3 |
size 449471589
|
last-checkpoint/rng_state_0.pth
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 14503
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f07bf259da4db58c67f5752e41be50bd05dbfaf1912a8b5878788f3ede910eb7
|
3 |
size 14503
|
last-checkpoint/rng_state_1.pth
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 14503
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1e069aee1aca48a60052a1c66c7d1551fec7d9dcab99912ac030e1863b14f6a1
|
3 |
size 14503
|
last-checkpoint/rng_state_2.pth
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:642ba2efc3dad359eda3b33bb6c5d67fffdc0e921c5ed6b47ef80068231cbd4a
|
3 |
+
size 14439
|
last-checkpoint/rng_state_3.pth
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 14503
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5475a56a8e58f3a6d30456ecb3d60c907f9c5dd05e43f39a9dbfefa6d303c24c
|
3 |
size 14503
|
last-checkpoint/scheduler.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 623
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d470fe106a7d346e8d83a1e5754bc519572ca0d497bb4adce56ffd8f58de945f
|
3 |
size 623
|
last-checkpoint/trainer_state.json
CHANGED
@@ -1,8 +1,8 @@
|
|
1 |
{
|
2 |
"best_metric": null,
|
3 |
"best_model_checkpoint": null,
|
4 |
-
"epoch":
|
5 |
-
"global_step":
|
6 |
"is_hyper_param_search": false,
|
7 |
"is_local_process_zero": true,
|
8 |
"is_world_process_zero": true,
|
@@ -3336,11 +3336,85 @@
|
|
3336 |
"eval_samples_per_second": 1006.215,
|
3337 |
"eval_steps_per_second": 16.099,
|
3338 |
"step": 450000
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
3339 |
}
|
3340 |
],
|
3341 |
"max_steps": 1000000,
|
3342 |
"num_train_epochs": 16,
|
3343 |
-
"total_flos": 3.
|
3344 |
"trial_name": null,
|
3345 |
"trial_params": null
|
3346 |
}
|
|
|
1 |
{
|
2 |
"best_metric": null,
|
3 |
"best_model_checkpoint": null,
|
4 |
+
"epoch": 7.024294898224075,
|
5 |
+
"global_step": 460000,
|
6 |
"is_hyper_param_search": false,
|
7 |
"is_local_process_zero": true,
|
8 |
"is_world_process_zero": true,
|
|
|
3336 |
"eval_samples_per_second": 1006.215,
|
3337 |
"eval_steps_per_second": 16.099,
|
3338 |
"step": 450000
|
3339 |
+
},
|
3340 |
+
{
|
3341 |
+
"epoch": 6.89,
|
3342 |
+
"learning_rate": 9.695948817687504e-05,
|
3343 |
+
"loss": 0.2699,
|
3344 |
+
"step": 451000
|
3345 |
+
},
|
3346 |
+
{
|
3347 |
+
"epoch": 6.9,
|
3348 |
+
"learning_rate": 9.673480678764858e-05,
|
3349 |
+
"loss": 0.2698,
|
3350 |
+
"step": 452000
|
3351 |
+
},
|
3352 |
+
{
|
3353 |
+
"epoch": 6.92,
|
3354 |
+
"learning_rate": 9.650994238925626e-05,
|
3355 |
+
"loss": 0.2699,
|
3356 |
+
"step": 453000
|
3357 |
+
},
|
3358 |
+
{
|
3359 |
+
"epoch": 6.93,
|
3360 |
+
"learning_rate": 9.628489744077911e-05,
|
3361 |
+
"loss": 0.2696,
|
3362 |
+
"step": 454000
|
3363 |
+
},
|
3364 |
+
{
|
3365 |
+
"epoch": 6.95,
|
3366 |
+
"learning_rate": 9.60596744032726e-05,
|
3367 |
+
"loss": 0.2699,
|
3368 |
+
"step": 455000
|
3369 |
+
},
|
3370 |
+
{
|
3371 |
+
"epoch": 6.95,
|
3372 |
+
"eval_runtime": 1.0008,
|
3373 |
+
"eval_samples_per_second": 999.165,
|
3374 |
+
"eval_steps_per_second": 15.987,
|
3375 |
+
"step": 455000
|
3376 |
+
},
|
3377 |
+
{
|
3378 |
+
"epoch": 6.96,
|
3379 |
+
"learning_rate": 9.583427573973982e-05,
|
3380 |
+
"loss": 0.2696,
|
3381 |
+
"step": 456000
|
3382 |
+
},
|
3383 |
+
{
|
3384 |
+
"epoch": 6.98,
|
3385 |
+
"learning_rate": 9.560870391510441e-05,
|
3386 |
+
"loss": 0.2695,
|
3387 |
+
"step": 457000
|
3388 |
+
},
|
3389 |
+
{
|
3390 |
+
"epoch": 6.99,
|
3391 |
+
"learning_rate": 9.538296139618371e-05,
|
3392 |
+
"loss": 0.2691,
|
3393 |
+
"step": 458000
|
3394 |
+
},
|
3395 |
+
{
|
3396 |
+
"epoch": 7.01,
|
3397 |
+
"learning_rate": 9.515705065166178e-05,
|
3398 |
+
"loss": 0.2693,
|
3399 |
+
"step": 459000
|
3400 |
+
},
|
3401 |
+
{
|
3402 |
+
"epoch": 7.02,
|
3403 |
+
"learning_rate": 9.493097415206228e-05,
|
3404 |
+
"loss": 0.2688,
|
3405 |
+
"step": 460000
|
3406 |
+
},
|
3407 |
+
{
|
3408 |
+
"epoch": 7.02,
|
3409 |
+
"eval_runtime": 1.0225,
|
3410 |
+
"eval_samples_per_second": 978.034,
|
3411 |
+
"eval_steps_per_second": 15.649,
|
3412 |
+
"step": 460000
|
3413 |
}
|
3414 |
],
|
3415 |
"max_steps": 1000000,
|
3416 |
"num_train_epochs": 16,
|
3417 |
+
"total_flos": 3.2246074079189274e+22,
|
3418 |
"trial_name": null,
|
3419 |
"trial_params": null
|
3420 |
}
|
pytorch_model.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 449471589
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8e2e3c76b0bd22486ffeb7f1582064821337785eddce5493639f753ea7af7c21
|
3 |
size 449471589
|