Training in progress, step 624000
Browse files- last-checkpoint/optimizer.pt +1 -1
- last-checkpoint/pytorch_model.bin +1 -1
- last-checkpoint/rng_state.pth +1 -1
- last-checkpoint/scaler.pt +1 -1
- last-checkpoint/scheduler.pt +1 -1
- last-checkpoint/trainer_state.json +39 -3
- pytorch_model.bin +1 -1
- runs/Jun02_06-43-44_462ae3634d0f/events.out.tfevents.1685689892.462ae3634d0f.537.0 +2 -2
last-checkpoint/optimizer.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 3871544599
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:bcee279599082c8a68650ad1c53f4bb657d2b897dd2c1d0868612319cde75796
|
3 |
size 3871544599
|
last-checkpoint/pytorch_model.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 1944201353
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:53521c1c8772490b5cb2d5d8c6ab3b91167890d8c72a13f392f76a89b461989c
|
3 |
size 1944201353
|
last-checkpoint/rng_state.pth
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 14575
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ee9af1d58327f3b98fb90089b5c903df49f6da59b9a59983147498acfbd86d89
|
3 |
size 14575
|
last-checkpoint/scaler.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 557
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2192f49211bf58ce883df0e7bd405a373cbbb533174fb4185824eab5f8061fbe
|
3 |
size 557
|
last-checkpoint/scheduler.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 627
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:498edb01af42115a97b5c07402b6b7000b65b218d39062b591a164029c7f419c
|
3 |
size 627
|
last-checkpoint/trainer_state.json
CHANGED
@@ -1,8 +1,8 @@
|
|
1 |
{
|
2 |
"best_metric": null,
|
3 |
"best_model_checkpoint": null,
|
4 |
-
"epoch": 16.
|
5 |
-
"global_step":
|
6 |
"is_hyper_param_search": false,
|
7 |
"is_local_process_zero": true,
|
8 |
"is_world_process_zero": true,
|
@@ -7458,11 +7458,47 @@
|
|
7458 |
"learning_rate": 4.1644903774592405e-07,
|
7459 |
"loss": 1.024,
|
7460 |
"step": 621000
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
7461 |
}
|
7462 |
],
|
7463 |
"max_steps": 762960,
|
7464 |
"num_train_epochs": 20,
|
7465 |
-
"total_flos": 7.
|
7466 |
"trial_name": null,
|
7467 |
"trial_params": null
|
7468 |
}
|
|
|
1 |
{
|
2 |
"best_metric": null,
|
3 |
"best_model_checkpoint": null,
|
4 |
+
"epoch": 16.35733084480607,
|
5 |
+
"global_step": 624000,
|
6 |
"is_hyper_param_search": false,
|
7 |
"is_local_process_zero": true,
|
8 |
"is_world_process_zero": true,
|
|
|
7458 |
"learning_rate": 4.1644903774592405e-07,
|
7459 |
"loss": 1.024,
|
7460 |
"step": 621000
|
7461 |
+
},
|
7462 |
+
{
|
7463 |
+
"epoch": 16.29,
|
7464 |
+
"learning_rate": 4.1361466525607436e-07,
|
7465 |
+
"loss": 1.0129,
|
7466 |
+
"step": 621500
|
7467 |
+
},
|
7468 |
+
{
|
7469 |
+
"epoch": 16.3,
|
7470 |
+
"learning_rate": 4.107834474557934e-07,
|
7471 |
+
"loss": 1.017,
|
7472 |
+
"step": 622000
|
7473 |
+
},
|
7474 |
+
{
|
7475 |
+
"epoch": 16.32,
|
7476 |
+
"learning_rate": 4.079610852866661e-07,
|
7477 |
+
"loss": 1.0148,
|
7478 |
+
"step": 622500
|
7479 |
+
},
|
7480 |
+
{
|
7481 |
+
"epoch": 16.33,
|
7482 |
+
"learning_rate": 4.0514759071193235e-07,
|
7483 |
+
"loss": 1.0082,
|
7484 |
+
"step": 623000
|
7485 |
+
},
|
7486 |
+
{
|
7487 |
+
"epoch": 16.34,
|
7488 |
+
"learning_rate": 4.0234297565724334e-07,
|
7489 |
+
"loss": 1.0035,
|
7490 |
+
"step": 623500
|
7491 |
+
},
|
7492 |
+
{
|
7493 |
+
"epoch": 16.36,
|
7494 |
+
"learning_rate": 3.995472520106156e-07,
|
7495 |
+
"loss": 1.0092,
|
7496 |
+
"step": 624000
|
7497 |
}
|
7498 |
],
|
7499 |
"max_steps": 762960,
|
7500 |
"num_train_epochs": 20,
|
7501 |
+
"total_flos": 7.43349897241215e+17,
|
7502 |
"trial_name": null,
|
7503 |
"trial_params": null
|
7504 |
}
|
pytorch_model.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 1944201353
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:53521c1c8772490b5cb2d5d8c6ab3b91167890d8c72a13f392f76a89b461989c
|
3 |
size 1944201353
|
runs/Jun02_06-43-44_462ae3634d0f/events.out.tfevents.1685689892.462ae3634d0f.537.0
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1d7b987b3a06c1cc0ab77c064205df298771d5c61a72a19389b26c22a6e5a180
|
3 |
+
size 11181
|