Training in progress, step 5000
Browse files
- last-checkpoint/optimizer.pt +1 -1
- last-checkpoint/pytorch_model.bin +1 -1
- last-checkpoint/rng_state.pth +1 -1
- last-checkpoint/scheduler.pt +1 -1
- last-checkpoint/trainer_state.json +39 -3
- pytorch_model.bin +1 -1
- runs/Jun01_08-15-55_7b8f3300e052/events.out.tfevents.1685608114.7b8f3300e052.20157.0 +2 -2
last-checkpoint/optimizer.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 2023671531
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c7442f9b1b8eaedb28a307ad821bc17333be1ec1db40df16dcb29c589292dd9a
|
3 |
size 2023671531
|
last-checkpoint/pytorch_model.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 1014236857
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6c0dd95c892f20845c651adeb1edb1313f086fd7c6433880a52de996981d6d12
|
3 |
size 1014236857
|
last-checkpoint/rng_state.pth
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 14575
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fc379462a95446b799f519a1789df0c033332e48886b605cc7e0e41e902ed5eb
|
3 |
size 14575
|
last-checkpoint/scheduler.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 627
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4ea22e1e3d580a233174f36b8254237ec9b07496557b5d4d59b4b19497a3dbac
|
3 |
size 627
|
last-checkpoint/trainer_state.json
CHANGED
@@ -1,8 +1,8 @@
|
|
1 |
{
|
2 |
"best_metric": null,
|
3 |
"best_model_checkpoint": null,
|
4 |
-
"epoch":
|
5 |
-
"global_step":
|
6 |
"is_hyper_param_search": false,
|
7 |
"is_local_process_zero": true,
|
8 |
"is_world_process_zero": true,
|
@@ -150,11 +150,47 @@
|
|
150 |
"eval_samples_per_second": 3.061,
|
151 |
"eval_steps_per_second": 0.389,
|
152 |
"step": 4000
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
153 |
}
|
154 |
],
|
155 |
"max_steps": 11700,
|
156 |
"num_train_epochs": 300,
|
157 |
-
"total_flos":
|
158 |
"trial_name": null,
|
159 |
"trial_params": null
|
160 |
}
|
|
|
1 |
{
|
2 |
"best_metric": null,
|
3 |
"best_model_checkpoint": null,
|
4 |
+
"epoch": 128.2051282051282,
|
5 |
+
"global_step": 5000,
|
6 |
"is_hyper_param_search": false,
|
7 |
"is_local_process_zero": true,
|
8 |
"is_world_process_zero": true,
|
|
|
150 |
"eval_samples_per_second": 3.061,
|
151 |
"eval_steps_per_second": 0.389,
|
152 |
"step": 4000
|
153 |
+
},
|
154 |
+
{
|
155 |
+
"epoch": 115.38,
|
156 |
+
"learning_rate": 3.71340206185567e-05,
|
157 |
+
"loss": 0.0999,
|
158 |
+
"step": 4500
|
159 |
+
},
|
160 |
+
{
|
161 |
+
"epoch": 115.38,
|
162 |
+
"eval_bleu": 94.6291,
|
163 |
+
"eval_em": 0.0336,
|
164 |
+
"eval_gen_len": 58.6283,
|
165 |
+
"eval_loss": 0.3437003791332245,
|
166 |
+
"eval_rm": 0.0624,
|
167 |
+
"eval_runtime": 139.8829,
|
168 |
+
"eval_samples_per_second": 2.981,
|
169 |
+
"eval_steps_per_second": 0.379,
|
170 |
+
"step": 4500
|
171 |
+
},
|
172 |
+
{
|
173 |
+
"epoch": 128.21,
|
174 |
+
"learning_rate": 3.455670103092783e-05,
|
175 |
+
"loss": 0.0941,
|
176 |
+
"step": 5000
|
177 |
+
},
|
178 |
+
{
|
179 |
+
"epoch": 128.21,
|
180 |
+
"eval_bleu": 94.7896,
|
181 |
+
"eval_em": 0.0695,
|
182 |
+
"eval_gen_len": 58.4149,
|
183 |
+
"eval_loss": 0.351246178150177,
|
184 |
+
"eval_rm": 0.1271,
|
185 |
+
"eval_runtime": 142.599,
|
186 |
+
"eval_samples_per_second": 2.924,
|
187 |
+
"eval_steps_per_second": 0.372,
|
188 |
+
"step": 5000
|
189 |
}
|
190 |
],
|
191 |
"max_steps": 11700,
|
192 |
"num_train_epochs": 300,
|
193 |
+
"total_flos": 4028902164693120.0,
|
194 |
"trial_name": null,
|
195 |
"trial_params": null
|
196 |
}
|
pytorch_model.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 1014236857
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6c0dd95c892f20845c651adeb1edb1313f086fd7c6433880a52de996981d6d12
|
3 |
size 1014236857
|
runs/Jun01_08-15-55_7b8f3300e052/events.out.tfevents.1685608114.7b8f3300e052.20157.0
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:396b3690fc05dd7fbcefb662e6a7101d7c99cf81c6f3ec3bf6980791cb736b80
|
3 |
+
size 14747
|