Training in progress, step 31800, checkpoint
Browse files
last-checkpoint/README.md
CHANGED
|
@@ -1295,6 +1295,10 @@ You can finetune this model on your own dataset.
|
|
| 1295 |
| 0.5566 | 31500 | 0.3329 |
|
| 1296 |
| 0.5575 | 31550 | 0.2794 |
|
| 1297 |
| 0.5584 | 31600 | 0.4189 |
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1298 |
|
| 1299 |
</details>
|
| 1300 |
|
|
|
|
| 1295 |
| 0.5566 | 31500 | 0.3329 |
|
| 1296 |
| 0.5575 | 31550 | 0.2794 |
|
| 1297 |
| 0.5584 | 31600 | 0.4189 |
|
| 1298 |
+
| 0.5593 | 31650 | 0.3643 |
|
| 1299 |
+
| 0.5602 | 31700 | 0.3578 |
|
| 1300 |
+
| 0.5610 | 31750 | 0.3193 |
|
| 1301 |
+
| 0.5619 | 31800 | 0.327 |
|
| 1302 |
|
| 1303 |
</details>
|
| 1304 |
|
last-checkpoint/model.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 90864192
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:2aefeca268258dbfb0695a5597c522e31aac7733474d6d58a376815037205ed7
|
| 3 |
size 90864192
|
last-checkpoint/optimizer.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 180609210
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:30a1ec12177bf3e7a3bcf0d2304d2b35cf56ea3e8b41cc3e1af93291a40fc7ca
|
| 3 |
size 180609210
|
last-checkpoint/rng_state.pth
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 14244
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:d21026606b47fb76259886267bb47d18484b5815e94d5a5656506546687ec739
|
| 3 |
size 14244
|
last-checkpoint/scaler.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 988
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:3efc050901e150a59e85c2ab742c4d82ce79ba854a2e4dcd71f14091e10af7e2
|
| 3 |
size 988
|
last-checkpoint/scheduler.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 1064
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:79ef76f1bbf004f2132ce3725824bf2705832e8a1ea3351be51debbf13b28b7d
|
| 3 |
size 1064
|
last-checkpoint/trainer_state.json
CHANGED
|
@@ -2,9 +2,9 @@
|
|
| 2 |
"best_global_step": null,
|
| 3 |
"best_metric": null,
|
| 4 |
"best_model_checkpoint": null,
|
| 5 |
-
"epoch": 0.
|
| 6 |
"eval_steps": 500,
|
| 7 |
-
"global_step":
|
| 8 |
"is_hyper_param_search": false,
|
| 9 |
"is_local_process_zero": true,
|
| 10 |
"is_world_process_zero": true,
|
|
@@ -4432,6 +4432,34 @@
|
|
| 4432 |
"learning_rate": 2.4544972610001768e-05,
|
| 4433 |
"loss": 0.4189,
|
| 4434 |
"step": 31600
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 4435 |
}
|
| 4436 |
],
|
| 4437 |
"logging_steps": 50,
|
|
|
|
| 2 |
"best_global_step": null,
|
| 3 |
"best_metric": null,
|
| 4 |
"best_model_checkpoint": null,
|
| 5 |
+
"epoch": 0.5619268081497057,
|
| 6 |
"eval_steps": 500,
|
| 7 |
+
"global_step": 31800,
|
| 8 |
"is_hyper_param_search": false,
|
| 9 |
"is_local_process_zero": true,
|
| 10 |
"is_world_process_zero": true,
|
|
|
|
| 4432 |
"learning_rate": 2.4544972610001768e-05,
|
| 4433 |
"loss": 0.4189,
|
| 4434 |
"step": 31600
|
| 4435 |
+
},
|
| 4436 |
+
{
|
| 4437 |
+
"epoch": 0.5592762099980563,
|
| 4438 |
+
"grad_norm": 1.5030118227005005,
|
| 4439 |
+
"learning_rate": 2.4495886591663232e-05,
|
| 4440 |
+
"loss": 0.3643,
|
| 4441 |
+
"step": 31650
|
| 4442 |
+
},
|
| 4443 |
+
{
|
| 4444 |
+
"epoch": 0.5601597427152728,
|
| 4445 |
+
"grad_norm": 1.3483951091766357,
|
| 4446 |
+
"learning_rate": 2.4446800573324697e-05,
|
| 4447 |
+
"loss": 0.3578,
|
| 4448 |
+
"step": 31700
|
| 4449 |
+
},
|
| 4450 |
+
{
|
| 4451 |
+
"epoch": 0.5610432754324892,
|
| 4452 |
+
"grad_norm": 1.5314035415649414,
|
| 4453 |
+
"learning_rate": 2.439771455498616e-05,
|
| 4454 |
+
"loss": 0.3193,
|
| 4455 |
+
"step": 31750
|
| 4456 |
+
},
|
| 4457 |
+
{
|
| 4458 |
+
"epoch": 0.5619268081497057,
|
| 4459 |
+
"grad_norm": 1.1020389795303345,
|
| 4460 |
+
"learning_rate": 2.4348628536647623e-05,
|
| 4461 |
+
"loss": 0.327,
|
| 4462 |
+
"step": 31800
|
| 4463 |
}
|
| 4464 |
],
|
| 4465 |
"logging_steps": 50,
|