Training in progress, step 990000
Browse files- last-checkpoint/optimizer.pt +1 -1
- last-checkpoint/pytorch_model.bin +1 -1
- last-checkpoint/rng_state_0.pth +1 -1
- last-checkpoint/rng_state_1.pth +1 -1
- last-checkpoint/rng_state_2.pth +1 -1
- last-checkpoint/rng_state_3.pth +1 -1
- last-checkpoint/scheduler.pt +1 -1
- last-checkpoint/trainer_state.json +77 -3
- pytorch_model.bin +1 -1
last-checkpoint/optimizer.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 893439185
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4cbfc1ed883942984be588c84681fbb0b292e529986dcbab5a1fecaa3f6ad447
|
3 |
size 893439185
|
last-checkpoint/pytorch_model.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 449471589
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fc73418bd52c0694a19af6083331d7a4a133f36616e77cb56fc9fc0bb18ad264
|
3 |
size 449471589
|
last-checkpoint/rng_state_0.pth
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 14503
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c3cbe84c4b275ece4dfc8b045971a9447b9468599c6de1ac7856d818ab7fcce6
|
3 |
size 14503
|
last-checkpoint/rng_state_1.pth
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 14503
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6ca4b049386ceb25b5284b9754462b13ddabb069762bc1b4ce1a9e94d95e348c
|
3 |
size 14503
|
last-checkpoint/rng_state_2.pth
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 14503
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:733172b1d4a99d1dcac219cdba47537d2e3c42c728e60a468833c7a7eb409d93
|
3 |
size 14503
|
last-checkpoint/rng_state_3.pth
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 14503
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e1a20d0d880982442a49c1adeca0b36b7c4aa9ce9768b58e40b03f2358d78bf3
|
3 |
size 14503
|
last-checkpoint/scheduler.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 623
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b2358905887cd0ce80c53b6e8a0174e039c4c5bd62c6c91c86f0312f9b46fcf7
|
3 |
size 623
|
last-checkpoint/trainer_state.json
CHANGED
@@ -1,8 +1,8 @@
|
|
1 |
{
|
2 |
"best_metric": null,
|
3 |
"best_model_checkpoint": null,
|
4 |
-
"epoch":
|
5 |
-
"global_step":
|
6 |
"is_hyper_param_search": false,
|
7 |
"is_local_process_zero": true,
|
8 |
"is_world_process_zero": true,
|
@@ -7258,11 +7258,85 @@
|
|
7258 |
"eval_samples_per_second": 1335.226,
|
7259 |
"eval_steps_per_second": 21.364,
|
7260 |
"step": 980000
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
7261 |
}
|
7262 |
],
|
7263 |
"max_steps": 1000000,
|
7264 |
"num_train_epochs": 16,
|
7265 |
-
"total_flos": 6.
|
7266 |
"trial_name": null,
|
7267 |
"trial_params": null
|
7268 |
}
|
|
|
1 |
{
|
2 |
"best_metric": null,
|
3 |
"best_model_checkpoint": null,
|
4 |
+
"epoch": 15.11750423748225,
|
5 |
+
"global_step": 990000,
|
6 |
"is_hyper_param_search": false,
|
7 |
"is_local_process_zero": true,
|
8 |
"is_world_process_zero": true,
|
|
|
7258 |
"eval_samples_per_second": 1335.226,
|
7259 |
"eval_steps_per_second": 21.364,
|
7260 |
"step": 980000
|
7261 |
+
},
|
7262 |
+
{
|
7263 |
+
"epoch": 14.98,
|
7264 |
+
"learning_rate": 1.0138129010020992e-05,
|
7265 |
+
"loss": 0.2272,
|
7266 |
+
"step": 981000
|
7267 |
+
},
|
7268 |
+
{
|
7269 |
+
"epoch": 15.0,
|
7270 |
+
"learning_rate": 1.0123975923584488e-05,
|
7271 |
+
"loss": 0.2273,
|
7272 |
+
"step": 982000
|
7273 |
+
},
|
7274 |
+
{
|
7275 |
+
"epoch": 15.01,
|
7276 |
+
"learning_rate": 1.0110586990152152e-05,
|
7277 |
+
"loss": 0.227,
|
7278 |
+
"step": 983000
|
7279 |
+
},
|
7280 |
+
{
|
7281 |
+
"epoch": 15.03,
|
7282 |
+
"learning_rate": 1.0097962356143219e-05,
|
7283 |
+
"loss": 0.2273,
|
7284 |
+
"step": 984000
|
7285 |
+
},
|
7286 |
+
{
|
7287 |
+
"epoch": 15.04,
|
7288 |
+
"learning_rate": 1.0086102159618668e-05,
|
7289 |
+
"loss": 0.227,
|
7290 |
+
"step": 985000
|
7291 |
+
},
|
7292 |
+
{
|
7293 |
+
"epoch": 15.04,
|
7294 |
+
"eval_runtime": 0.7868,
|
7295 |
+
"eval_samples_per_second": 1271.022,
|
7296 |
+
"eval_steps_per_second": 20.336,
|
7297 |
+
"step": 985000
|
7298 |
+
},
|
7299 |
+
{
|
7300 |
+
"epoch": 15.06,
|
7301 |
+
"learning_rate": 1.0075006530279694e-05,
|
7302 |
+
"loss": 0.2271,
|
7303 |
+
"step": 986000
|
7304 |
+
},
|
7305 |
+
{
|
7306 |
+
"epoch": 15.07,
|
7307 |
+
"learning_rate": 1.0064675589466339e-05,
|
7308 |
+
"loss": 0.2268,
|
7309 |
+
"step": 987000
|
7310 |
+
},
|
7311 |
+
{
|
7312 |
+
"epoch": 15.09,
|
7313 |
+
"learning_rate": 1.0055109450156098e-05,
|
7314 |
+
"loss": 0.2272,
|
7315 |
+
"step": 988000
|
7316 |
+
},
|
7317 |
+
{
|
7318 |
+
"epoch": 15.1,
|
7319 |
+
"learning_rate": 1.0046308216962759e-05,
|
7320 |
+
"loss": 0.2269,
|
7321 |
+
"step": 989000
|
7322 |
+
},
|
7323 |
+
{
|
7324 |
+
"epoch": 15.12,
|
7325 |
+
"learning_rate": 1.0038271986135177e-05,
|
7326 |
+
"loss": 0.2272,
|
7327 |
+
"step": 990000
|
7328 |
+
},
|
7329 |
+
{
|
7330 |
+
"epoch": 15.12,
|
7331 |
+
"eval_runtime": 0.7713,
|
7332 |
+
"eval_samples_per_second": 1296.438,
|
7333 |
+
"eval_steps_per_second": 20.743,
|
7334 |
+
"step": 990000
|
7335 |
}
|
7336 |
],
|
7337 |
"max_steps": 1000000,
|
7338 |
"num_train_epochs": 16,
|
7339 |
+
"total_flos": 6.939915985982136e+22,
|
7340 |
"trial_name": null,
|
7341 |
"trial_params": null
|
7342 |
}
|
pytorch_model.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 449471589
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fc73418bd52c0694a19af6083331d7a4a133f36616e77cb56fc9fc0bb18ad264
|
3 |
size 449471589
|