Training in progress, step 35200, checkpoint
Browse files
last-checkpoint/README.md
CHANGED
|
@@ -1217,6 +1217,10 @@ You can finetune this model on your own dataset.
|
|
| 1217 |
| 0.6167 | 34900 | 0.3015 |
|
| 1218 |
| 0.6176 | 34950 | 0.3291 |
|
| 1219 |
| 0.6185 | 35000 | 0.2634 |
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1220 |
|
| 1221 |
|
| 1222 |
### Framework Versions
|
|
|
|
| 1217 |
| 0.6167 | 34900 | 0.3015 |
|
| 1218 |
| 0.6176 | 34950 | 0.3291 |
|
| 1219 |
| 0.6185 | 35000 | 0.2634 |
|
| 1220 |
+
| 0.6194 | 35050 | 0.3212 |
|
| 1221 |
+
| 0.6202 | 35100 | 0.2965 |
|
| 1222 |
+
| 0.6211 | 35150 | 0.3557 |
|
| 1223 |
+
| 0.6220 | 35200 | 0.3535 |
|
| 1224 |
|
| 1225 |
|
| 1226 |
### Framework Versions
|
last-checkpoint/model.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 90864192
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a73726096d96dbbbaa9a481dfff6e52b1ea1d694b55f2edc2f1405af8895110b
|
| 3 |
size 90864192
|
last-checkpoint/optimizer.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 180609210
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:d8b3f57d97ffd57e518f40f15d12ad037a0066d481b15f01ac0c5cd7db8dcb47
|
| 3 |
size 180609210
|
last-checkpoint/rng_state.pth
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 14244
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ca63325ac742a792a3bcdc1dc21baa9c1c96f6a59934e63bc8a87c6b8f66e093
|
| 3 |
size 14244
|
last-checkpoint/scaler.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 988
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:6f6bf385710f1d1a6f64e5b03c0c6f98497de21222ff381a7961ac0b45b93ddc
|
| 3 |
size 988
|
last-checkpoint/scheduler.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 1064
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:f345579e836e5dec04f17da3b053acb614c611f3b7c11559a8cdc45e09194e58
|
| 3 |
size 1064
|
last-checkpoint/trainer_state.json
CHANGED
|
@@ -2,9 +2,9 @@
|
|
| 2 |
"best_global_step": null,
|
| 3 |
"best_metric": null,
|
| 4 |
"best_model_checkpoint": null,
|
| 5 |
-
"epoch": 0.
|
| 6 |
"eval_steps": 500,
|
| 7 |
-
"global_step":
|
| 8 |
"is_hyper_param_search": false,
|
| 9 |
"is_local_process_zero": true,
|
| 10 |
"is_world_process_zero": true,
|
|
@@ -4908,6 +4908,34 @@
|
|
| 4908 |
"learning_rate": 2.120908680371483e-05,
|
| 4909 |
"loss": 0.2634,
|
| 4910 |
"step": 35000
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 4911 |
}
|
| 4912 |
],
|
| 4913 |
"logging_steps": 50,
|
|
|
|
| 2 |
"best_global_step": null,
|
| 3 |
"best_metric": null,
|
| 4 |
"best_model_checkpoint": null,
|
| 5 |
+
"epoch": 0.622007032920429,
|
| 6 |
"eval_steps": 500,
|
| 7 |
+
"global_step": 35200,
|
| 8 |
"is_hyper_param_search": false,
|
| 9 |
"is_local_process_zero": true,
|
| 10 |
"is_world_process_zero": true,
|
|
|
|
| 4908 |
"learning_rate": 2.120908680371483e-05,
|
| 4909 |
"loss": 0.2634,
|
| 4910 |
"step": 35000
|
| 4911 |
+
},
|
| 4912 |
+
{
|
| 4913 |
+
"epoch": 0.6193564347687794,
|
| 4914 |
+
"grad_norm": 1.4780889749526978,
|
| 4915 |
+
"learning_rate": 2.1160000785376295e-05,
|
| 4916 |
+
"loss": 0.3212,
|
| 4917 |
+
"step": 35050
|
| 4918 |
+
},
|
| 4919 |
+
{
|
| 4920 |
+
"epoch": 0.620239967485996,
|
| 4921 |
+
"grad_norm": 1.699916124343872,
|
| 4922 |
+
"learning_rate": 2.1110914767037756e-05,
|
| 4923 |
+
"loss": 0.2965,
|
| 4924 |
+
"step": 35100
|
| 4925 |
+
},
|
| 4926 |
+
{
|
| 4927 |
+
"epoch": 0.6211235002032125,
|
| 4928 |
+
"grad_norm": 1.6198956966400146,
|
| 4929 |
+
"learning_rate": 2.106182874869922e-05,
|
| 4930 |
+
"loss": 0.3557,
|
| 4931 |
+
"step": 35150
|
| 4932 |
+
},
|
| 4933 |
+
{
|
| 4934 |
+
"epoch": 0.622007032920429,
|
| 4935 |
+
"grad_norm": 1.2697581052780151,
|
| 4936 |
+
"learning_rate": 2.1012742730360685e-05,
|
| 4937 |
+
"loss": 0.3535,
|
| 4938 |
+
"step": 35200
|
| 4939 |
}
|
| 4940 |
],
|
| 4941 |
"logging_steps": 50,
|