Training in progress, step 38600, checkpoint
Browse files
last-checkpoint/README.md
CHANGED
|
@@ -1285,6 +1285,10 @@ You can finetune this model on your own dataset.
|
|
| 1285 |
| 0.6768 | 38300 | 0.3098 |
|
| 1286 |
| 0.6777 | 38350 | 0.2837 |
|
| 1287 |
| 0.6786 | 38400 | 0.2998 |
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1288 |
|
| 1289 |
|
| 1290 |
### Framework Versions
|
|
|
|
| 1285 |
| 0.6768 | 38300 | 0.3098 |
|
| 1286 |
| 0.6777 | 38350 | 0.2837 |
|
| 1287 |
| 0.6786 | 38400 | 0.2998 |
|
| 1288 |
+
| 0.6794 | 38450 | 0.2477 |
|
| 1289 |
+
| 0.6803 | 38500 | 0.3343 |
|
| 1290 |
+
| 0.6812 | 38550 | 0.2411 |
|
| 1291 |
+
| 0.6821 | 38600 | 0.2641 |
|
| 1292 |
|
| 1293 |
|
| 1294 |
### Framework Versions
|
last-checkpoint/model.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 90864192
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:9411645577be70106bcbbb74c24716149dda56d2f3e7a581b79fdcdc3ed41249
|
| 3 |
size 90864192
|
last-checkpoint/optimizer.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 180609210
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:b3e25051f1943dbef57f8ebb6e352941619afea10b29f67080e5c0e931b5bcec
|
| 3 |
size 180609210
|
last-checkpoint/rng_state.pth
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 14244
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:383863d97b21487295b0694693e6eddac2a40d27317755b362907c5201542167
|
| 3 |
size 14244
|
last-checkpoint/scaler.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 988
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:1c584d258d651b75cc67fda371e341a5dcb6a64a5f3ef27cdd2725022fe4132e
|
| 3 |
size 988
|
last-checkpoint/scheduler.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 1064
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:10f4be9189e6431a4a4fa709ab0080899a72a8630fa75a31259beca939bff08e
|
| 3 |
size 1064
|
last-checkpoint/trainer_state.json
CHANGED
|
@@ -2,9 +2,9 @@
|
|
| 2 |
"best_global_step": null,
|
| 3 |
"best_metric": null,
|
| 4 |
"best_model_checkpoint": null,
|
| 5 |
-
"epoch": 0.
|
| 6 |
"eval_steps": 500,
|
| 7 |
-
"global_step":
|
| 8 |
"is_hyper_param_search": false,
|
| 9 |
"is_local_process_zero": true,
|
| 10 |
"is_world_process_zero": true,
|
|
@@ -5384,6 +5384,34 @@
|
|
| 5384 |
"learning_rate": 1.7872219277061123e-05,
|
| 5385 |
"loss": 0.2998,
|
| 5386 |
"step": 38400
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 5387 |
}
|
| 5388 |
],
|
| 5389 |
"logging_steps": 50,
|
|
|
|
| 2 |
"best_global_step": null,
|
| 3 |
"best_metric": null,
|
| 4 |
"best_model_checkpoint": null,
|
| 5 |
+
"epoch": 0.6820872576911523,
|
| 6 |
"eval_steps": 500,
|
| 7 |
+
"global_step": 38600,
|
| 8 |
"is_hyper_param_search": false,
|
| 9 |
"is_local_process_zero": true,
|
| 10 |
"is_world_process_zero": true,
|
|
|
|
| 5384 |
"learning_rate": 1.7872219277061123e-05,
|
| 5385 |
"loss": 0.2998,
|
| 5386 |
"step": 38400
|
| 5387 |
+
},
|
| 5388 |
+
{
|
| 5389 |
+
"epoch": 0.6794366595395027,
|
| 5390 |
+
"grad_norm": 1.5092830657958984,
|
| 5391 |
+
"learning_rate": 1.7823133258722584e-05,
|
| 5392 |
+
"loss": 0.2477,
|
| 5393 |
+
"step": 38450
|
| 5394 |
+
},
|
| 5395 |
+
{
|
| 5396 |
+
"epoch": 0.6803201922567192,
|
| 5397 |
+
"grad_norm": 1.4017945528030396,
|
| 5398 |
+
"learning_rate": 1.7774047240384052e-05,
|
| 5399 |
+
"loss": 0.3343,
|
| 5400 |
+
"step": 38500
|
| 5401 |
+
},
|
| 5402 |
+
{
|
| 5403 |
+
"epoch": 0.6812037249739358,
|
| 5404 |
+
"grad_norm": 1.5817060470581055,
|
| 5405 |
+
"learning_rate": 1.7724961222045513e-05,
|
| 5406 |
+
"loss": 0.2411,
|
| 5407 |
+
"step": 38550
|
| 5408 |
+
},
|
| 5409 |
+
{
|
| 5410 |
+
"epoch": 0.6820872576911523,
|
| 5411 |
+
"grad_norm": 1.4471608400344849,
|
| 5412 |
+
"learning_rate": 1.7675875203706975e-05,
|
| 5413 |
+
"loss": 0.2641,
|
| 5414 |
+
"step": 38600
|
| 5415 |
}
|
| 5416 |
],
|
| 5417 |
"logging_steps": 50,
|