NightMachinery
committed on
Commit
·
a85ca50
1
Parent(s):
44f59c2
Training in progress, step 10500
Browse files
- last-checkpoint/mlm/pytorch_adapter.bin +1 -1
- last-checkpoint/mlm/pytorch_model_head.bin +1 -1
- last-checkpoint/optimizer.pt +1 -1
- last-checkpoint/rng_state.pth +1 -1
- last-checkpoint/scheduler.pt +1 -1
- last-checkpoint/trainer_state.json +20 -5
- runs/Mar03_09-29-00_375a4f73e1b6/events.out.tfevents.1677835778.375a4f73e1b6.4551.0 +2 -2
last-checkpoint/mlm/pytorch_adapter.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4782029
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ab31d3c1e44d96d6aa7dc385bb2a374bb3650411b1f2bbf3a5632cf6d8a364dd
|
3 |
size 4782029
|
last-checkpoint/mlm/pytorch_model_head.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 771377007
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c5a68f21c96d1017414c75ab9cb39667b15070c234626b171849d4374c8815f2
|
3 |
size 771377007
|
last-checkpoint/optimizer.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 16297733
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c879fb2ff43e64a5330a90d7721d2020e0ba4b2bfa608256284bd1443f844131
|
3 |
size 16297733
|
last-checkpoint/rng_state.pth
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 14575
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b9699ad8a13d39e0088b256bc19bede304b6e109e99940bf7c075c82acfc186a
|
3 |
size 14575
|
last-checkpoint/scheduler.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 627
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:13f27483992a93e2d0e00be6d9edd9ab2fa3162b3b09ab3826e3fa33ba45c5fe
|
3 |
size 627
|
last-checkpoint/trainer_state.json
CHANGED
@@ -1,8 +1,8 @@
|
|
1 |
{
|
2 |
-
"best_metric": 1.
|
3 |
-
"best_model_checkpoint": "./test-mlm/checkpoint-
|
4 |
-
"epoch": 7.
|
5 |
-
"global_step":
|
6 |
"is_hyper_param_search": false,
|
7 |
"is_local_process_zero": true,
|
8 |
"is_world_process_zero": true,
|
@@ -306,11 +306,26 @@
|
|
306 |
"eval_samples_per_second": 10.62,
|
307 |
"eval_steps_per_second": 2.127,
|
308 |
"step": 10000
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
309 |
}
|
310 |
],
|
311 |
"max_steps": 13520,
|
312 |
"num_train_epochs": 10,
|
313 |
-
"total_flos": 1.
|
314 |
"trial_name": null,
|
315 |
"trial_params": null
|
316 |
}
|
|
|
1 |
{
|
2 |
+
"best_metric": 1.9753360748291016,
|
3 |
+
"best_model_checkpoint": "./test-mlm/checkpoint-10500",
|
4 |
+
"epoch": 7.766272189349112,
|
5 |
+
"global_step": 10500,
|
6 |
"is_hyper_param_search": false,
|
7 |
"is_local_process_zero": true,
|
8 |
"is_world_process_zero": true,
|
|
|
306 |
"eval_samples_per_second": 10.62,
|
307 |
"eval_steps_per_second": 2.127,
|
308 |
"step": 10000
|
309 |
+
},
|
310 |
+
{
|
311 |
+
"epoch": 7.77,
|
312 |
+
"learning_rate": 2.2337278106508877e-05,
|
313 |
+
"loss": 2.0887,
|
314 |
+
"step": 10500
|
315 |
+
},
|
316 |
+
{
|
317 |
+
"epoch": 7.77,
|
318 |
+
"eval_accuracy": 0.5924927994053703,
|
319 |
+
"eval_loss": 1.9753360748291016,
|
320 |
+
"eval_runtime": 81.7861,
|
321 |
+
"eval_samples_per_second": 10.625,
|
322 |
+
"eval_steps_per_second": 2.128,
|
323 |
+
"step": 10500
|
324 |
}
|
325 |
],
|
326 |
"max_steps": 13520,
|
327 |
"num_train_epochs": 10,
|
328 |
+
"total_flos": 1.4038178060648448e+16,
|
329 |
"trial_name": null,
|
330 |
"trial_params": null
|
331 |
}
|
runs/Mar03_09-29-00_375a4f73e1b6/events.out.tfevents.1677835778.375a4f73e1b6.4551.0
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b869a8447d8ff33826cbddda19026ca1771b64cc0c9fba4809c94e5c091d71e3
|
3 |
+
size 15095
|