Training in progress, step 6000
Browse files- last-checkpoint/optimizer.pt +1 -1
- last-checkpoint/pytorch_model.bin +1 -1
- last-checkpoint/rng_state.pth +1 -1
- last-checkpoint/scheduler.pt +1 -1
- last-checkpoint/trainer_state.json +39 -3
- pytorch_model.bin +1 -1
- runs/Jun01_08-15-55_7b8f3300e052/events.out.tfevents.1685608114.7b8f3300e052.20157.0 +2 -2
last-checkpoint/optimizer.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 2023671531
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fbba5bbb1b84435fdf4b936453e1a9a1c7392c1a15c1565a0f55dad61b600519
|
3 |
size 2023671531
|
last-checkpoint/pytorch_model.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 1014236857
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a0cca5310b3c6412f68c93da53730bce4f0499a92d2e73c914d211907ca203c6
|
3 |
size 1014236857
|
last-checkpoint/rng_state.pth
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 14575
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:66d523033a195fd4e9b50639cc4c9fbcdcc6bcaffcba88c0b16f9c68a632d384
|
3 |
size 14575
|
last-checkpoint/scheduler.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 627
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a7b1d42097f30e62e33d325ebb7425a02f7706c3c1da9e8f212c30114570be17
|
3 |
size 627
|
last-checkpoint/trainer_state.json
CHANGED
@@ -1,8 +1,8 @@
|
|
1 |
{
|
2 |
"best_metric": null,
|
3 |
"best_model_checkpoint": null,
|
4 |
-
"epoch":
|
5 |
-
"global_step":
|
6 |
"is_hyper_param_search": false,
|
7 |
"is_local_process_zero": true,
|
8 |
"is_world_process_zero": true,
|
@@ -186,11 +186,47 @@
|
|
186 |
"eval_samples_per_second": 2.924,
|
187 |
"eval_steps_per_second": 0.372,
|
188 |
"step": 5000
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
189 |
}
|
190 |
],
|
191 |
"max_steps": 11700,
|
192 |
"num_train_epochs": 300,
|
193 |
-
"total_flos":
|
194 |
"trial_name": null,
|
195 |
"trial_params": null
|
196 |
}
|
|
|
1 |
{
|
2 |
"best_metric": null,
|
3 |
"best_model_checkpoint": null,
|
4 |
+
"epoch": 153.84615384615384,
|
5 |
+
"global_step": 6000,
|
6 |
"is_hyper_param_search": false,
|
7 |
"is_local_process_zero": true,
|
8 |
"is_world_process_zero": true,
|
|
|
186 |
"eval_samples_per_second": 2.924,
|
187 |
"eval_steps_per_second": 0.372,
|
188 |
"step": 5000
|
189 |
+
},
|
190 |
+
{
|
191 |
+
"epoch": 141.03,
|
192 |
+
"learning_rate": 3.197938144329897e-05,
|
193 |
+
"loss": 0.0904,
|
194 |
+
"step": 5500
|
195 |
+
},
|
196 |
+
{
|
197 |
+
"epoch": 141.03,
|
198 |
+
"eval_bleu": 94.4101,
|
199 |
+
"eval_em": 0.0719,
|
200 |
+
"eval_gen_len": 58.2518,
|
201 |
+
"eval_loss": 0.34235823154449463,
|
202 |
+
"eval_rm": 0.1439,
|
203 |
+
"eval_runtime": 139.5842,
|
204 |
+
"eval_samples_per_second": 2.987,
|
205 |
+
"eval_steps_per_second": 0.38,
|
206 |
+
"step": 5500
|
207 |
+
},
|
208 |
+
{
|
209 |
+
"epoch": 153.85,
|
210 |
+
"learning_rate": 2.9402061855670106e-05,
|
211 |
+
"loss": 0.0833,
|
212 |
+
"step": 6000
|
213 |
+
},
|
214 |
+
{
|
215 |
+
"epoch": 153.85,
|
216 |
+
"eval_bleu": 94.7141,
|
217 |
+
"eval_em": 0.0887,
|
218 |
+
"eval_gen_len": 59.0312,
|
219 |
+
"eval_loss": 0.3461511433124542,
|
220 |
+
"eval_rm": 0.1775,
|
221 |
+
"eval_runtime": 137.4141,
|
222 |
+
"eval_samples_per_second": 3.035,
|
223 |
+
"eval_steps_per_second": 0.386,
|
224 |
+
"step": 6000
|
225 |
}
|
226 |
],
|
227 |
"max_steps": 11700,
|
228 |
"num_train_epochs": 300,
|
229 |
+
"total_flos": 4840863271495680.0,
|
230 |
"trial_name": null,
|
231 |
"trial_params": null
|
232 |
}
|
pytorch_model.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 1014236857
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a0cca5310b3c6412f68c93da53730bce4f0499a92d2e73c914d211907ca203c6
|
3 |
size 1014236857
|
runs/Jun01_08-15-55_7b8f3300e052/events.out.tfevents.1685608114.7b8f3300e052.20157.0
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d8e380f641e60e47416c9ef8be040e10b17e40ec679df6b8213d182a3e4238dc
|
3 |
+
size 15985
|