Kasper7953
commited on
Commit
•
7f41c81
1
Parent(s):
c964019
Training in progress, step 19000
Browse files- last-checkpoint/optimizer.pt +1 -1
- last-checkpoint/pytorch_model.bin +1 -1
- last-checkpoint/rng_state.pth +1 -1
- last-checkpoint/scheduler.pt +1 -1
- last-checkpoint/trainer_state.json +31 -3
- pytorch_model.bin +1 -1
- runs/Mar11_11-28-52_b25631785753/events.out.tfevents.1678534153.b25631785753.957.0 +2 -2
last-checkpoint/optimizer.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 2847145157
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:18542fb0f0ca8c5209e2b93103f1880c50a53c82c7835aa17cc9be5a52878bde
|
3 |
size 2847145157
|
last-checkpoint/pytorch_model.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 1524261149
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a55bd617d7f0551be9aa43e265f8d49f618cdf19eed0897711e26055a6662e99
|
3 |
size 1524261149
|
last-checkpoint/rng_state.pth
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 14575
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5ec49eaf93dbcc4a7020eab69f82e4825b6de00732c3380cc93bef441b24d358
|
3 |
size 14575
|
last-checkpoint/scheduler.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 627
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3ebdd7eec22dd0eaa942c09b9d66a5b538c98524805051b53c9cae7c97f8241a
|
3 |
size 627
|
last-checkpoint/trainer_state.json
CHANGED
@@ -1,8 +1,8 @@
|
|
1 |
{
|
2 |
"best_metric": null,
|
3 |
"best_model_checkpoint": null,
|
4 |
-
"epoch": 2.
|
5 |
-
"global_step":
|
6 |
"is_hyper_param_search": false,
|
7 |
"is_local_process_zero": true,
|
8 |
"is_world_process_zero": true,
|
@@ -422,11 +422,39 @@
|
|
422 |
"learning_rate": 3.6508769299955035e-05,
|
423 |
"loss": 2.1897,
|
424 |
"step": 18000
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
425 |
}
|
426 |
],
|
427 |
"max_steps": 66710,
|
428 |
"num_train_epochs": 10,
|
429 |
-
"total_flos": 2.
|
430 |
"trial_name": null,
|
431 |
"trial_params": null
|
432 |
}
|
|
|
1 |
{
|
2 |
"best_metric": null,
|
3 |
"best_model_checkpoint": null,
|
4 |
+
"epoch": 2.848148703342827,
|
5 |
+
"global_step": 19000,
|
6 |
"is_hyper_param_search": false,
|
7 |
"is_local_process_zero": true,
|
8 |
"is_world_process_zero": true,
|
|
|
422 |
"learning_rate": 3.6508769299955035e-05,
|
423 |
"loss": 2.1897,
|
424 |
"step": 18000
|
425 |
+
},
|
426 |
+
{
|
427 |
+
"epoch": 2.73,
|
428 |
+
"eval_loss": 2.646106719970703,
|
429 |
+
"eval_runtime": 209.741,
|
430 |
+
"eval_samples_per_second": 16.84,
|
431 |
+
"eval_steps_per_second": 5.616,
|
432 |
+
"step": 18200
|
433 |
+
},
|
434 |
+
{
|
435 |
+
"epoch": 2.77,
|
436 |
+
"learning_rate": 3.613401289162045e-05,
|
437 |
+
"loss": 2.181,
|
438 |
+
"step": 18500
|
439 |
+
},
|
440 |
+
{
|
441 |
+
"epoch": 2.83,
|
442 |
+
"eval_loss": 2.6370952129364014,
|
443 |
+
"eval_runtime": 210.1426,
|
444 |
+
"eval_samples_per_second": 16.808,
|
445 |
+
"eval_steps_per_second": 5.606,
|
446 |
+
"step": 18900
|
447 |
+
},
|
448 |
+
{
|
449 |
+
"epoch": 2.85,
|
450 |
+
"learning_rate": 3.5759256483285864e-05,
|
451 |
+
"loss": 2.2077,
|
452 |
+
"step": 19000
|
453 |
}
|
454 |
],
|
455 |
"max_steps": 66710,
|
456 |
"num_train_epochs": 10,
|
457 |
+
"total_flos": 2.5846719817728e+16,
|
458 |
"trial_name": null,
|
459 |
"trial_params": null
|
460 |
}
|
pytorch_model.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 1524261149
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a55bd617d7f0551be9aa43e265f8d49f618cdf19eed0897711e26055a6662e99
|
3 |
size 1524261149
|
runs/Mar11_11-28-52_b25631785753/events.out.tfevents.1678534153.b25631785753.957.0
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f2c6ce822c57a865d868ca2b1ccf414559c129b6fe06a79313875782f814b876
|
3 |
+
size 7964
|