Dmitriy007
committed on
Commit
•
0dfc9d5
1
Parent(s):
1a4dd9c
Training in progress, step 13000
Browse files
- last-checkpoint/optimizer.pt +1 -1
- last-checkpoint/pytorch_model.bin +1 -1
- last-checkpoint/rng_state.pth +1 -1
- last-checkpoint/scheduler.pt +1 -1
- last-checkpoint/trainer_state.json +23 -3
- pytorch_model.bin +1 -1
- runs/Mar21_22-11-09_493485ec0ec3/events.out.tfevents.1679436700.493485ec0ec3.312.0 +2 -2
last-checkpoint/optimizer.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 2847145157
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3b6a3d9e33c34ea1d3391821742ea024ee94084b1d553075d406903dd52423c4
|
3 |
size 2847145157
|
last-checkpoint/pytorch_model.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 1524261149
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9b977a1a74eff72c359c9b47436838d20528fe3e592056476cee45bbd479b6e0
|
3 |
size 1524261149
|
last-checkpoint/rng_state.pth
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 14575
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1ee339a4fc3a8b6ac6ae41adbcc1dd718e6ba617469347b728b801f63f50c9ba
|
3 |
size 14575
|
last-checkpoint/scheduler.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 627
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1718b0559d4dd537c5c85c5595b1dc69c046d65cf532260c2e15ed363c16b827
|
3 |
size 627
|
last-checkpoint/trainer_state.json
CHANGED
@@ -1,8 +1,8 @@
|
|
1 |
{
|
2 |
"best_metric": null,
|
3 |
"best_model_checkpoint": null,
|
4 |
-
"epoch": 3.
|
5 |
-
"global_step":
|
6 |
"is_hyper_param_search": false,
|
7 |
"is_local_process_zero": true,
|
8 |
"is_world_process_zero": true,
|
@@ -246,11 +246,31 @@
|
|
246 |
"eval_samples_per_second": 14.754,
|
247 |
"eval_steps_per_second": 4.92,
|
248 |
"step": 12000
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
249 |
}
|
250 |
],
|
251 |
"max_steps": 19990,
|
252 |
"num_train_epochs": 5,
|
253 |
-
"total_flos": 1.
|
254 |
"trial_name": null,
|
255 |
"trial_params": null
|
256 |
}
|
|
|
1 |
{
|
2 |
"best_metric": null,
|
3 |
"best_model_checkpoint": null,
|
4 |
+
"epoch": 3.251625812906453,
|
5 |
+
"global_step": 13000,
|
6 |
"is_hyper_param_search": false,
|
7 |
"is_local_process_zero": true,
|
8 |
"is_world_process_zero": true,
|
|
|
246 |
"eval_samples_per_second": 14.754,
|
247 |
"eval_steps_per_second": 4.92,
|
248 |
"step": 12000
|
249 |
+
},
|
250 |
+
{
|
251 |
+
"epoch": 3.13,
|
252 |
+
"learning_rate": 7.493746873436719e-06,
|
253 |
+
"loss": 2.5308,
|
254 |
+
"step": 12500
|
255 |
+
},
|
256 |
+
{
|
257 |
+
"epoch": 3.25,
|
258 |
+
"learning_rate": 6.9934967483741875e-06,
|
259 |
+
"loss": 2.5445,
|
260 |
+
"step": 13000
|
261 |
+
},
|
262 |
+
{
|
263 |
+
"epoch": 3.25,
|
264 |
+
"eval_loss": 3.1546671390533447,
|
265 |
+
"eval_runtime": 143.5837,
|
266 |
+
"eval_samples_per_second": 14.744,
|
267 |
+
"eval_steps_per_second": 4.917,
|
268 |
+
"step": 13000
|
269 |
}
|
270 |
],
|
271 |
"max_steps": 19990,
|
272 |
"num_train_epochs": 5,
|
273 |
+
"total_flos": 1.839262703616e+16,
|
274 |
"trial_name": null,
|
275 |
"trial_params": null
|
276 |
}
|
pytorch_model.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 1524261149
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9b977a1a74eff72c359c9b47436838d20528fe3e592056476cee45bbd479b6e0
|
3 |
size 1524261149
|
runs/Mar21_22-11-09_493485ec0ec3/events.out.tfevents.1679436700.493485ec0ec3.312.0
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ffeb798ef1b85fc50504ccec82bf30cfc29038e4cb4c5d4520bb78ea8da6c739
|
3 |
+
size 5967
|