Training in progress, step 14000
Browse files
last-checkpoint/optimizer.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 1135685
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a5a960b17798c7b8995ef1dc68fef82584cd48423ce850bd588f46544131a3c2
|
3 |
size 1135685
|
last-checkpoint/pytorch_model.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 307910149
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ff885e6aadd3d270b0e549f68ea1bd5fb91a649e29371ed75f3a8d66d517cf10
|
3 |
size 307910149
|
last-checkpoint/rng_state.pth
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 14575
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:98b1a0e8363bd62d636fdf22f594afac04c65df8c87bec6bc026af1848ed19a5
|
3 |
size 14575
|
last-checkpoint/scheduler.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 627
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9a9379299cb036bee8563adb6a6941350bd1a2187d737827bca0ce7b889d9885
|
3 |
size 627
|
last-checkpoint/trainer_state.json
CHANGED
@@ -1,8 +1,8 @@
|
|
1 |
{
|
2 |
"best_metric": 1.7871696949005127,
|
3 |
"best_model_checkpoint": "/home3/s5431786/nlp-final-project/results/google-flan-t5-small-e-snli-generation-label_and_explanation-selected-b64/checkpoint-2000",
|
4 |
-
"epoch": 1.
|
5 |
-
"global_step":
|
6 |
"is_hyper_param_search": false,
|
7 |
"is_local_process_zero": true,
|
8 |
"is_world_process_zero": true,
|
@@ -138,11 +138,33 @@
|
|
138 |
"eval_samples_per_second": 64.983,
|
139 |
"eval_steps_per_second": 1.017,
|
140 |
"step": 12000
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
141 |
}
|
142 |
],
|
143 |
"max_steps": 85840,
|
144 |
"num_train_epochs": 10,
|
145 |
-
"total_flos": 1.
|
146 |
"trial_name": null,
|
147 |
"trial_params": null
|
148 |
}
|
|
|
1 |
{
|
2 |
"best_metric": 1.7871696949005127,
|
3 |
"best_model_checkpoint": "/home3/s5431786/nlp-final-project/results/google-flan-t5-small-e-snli-generation-label_and_explanation-selected-b64/checkpoint-2000",
|
4 |
+
"epoch": 1.6309412861136998,
|
5 |
+
"global_step": 14000,
|
6 |
"is_hyper_param_search": false,
|
7 |
"is_local_process_zero": true,
|
8 |
"is_world_process_zero": true,
|
|
|
138 |
"eval_samples_per_second": 64.983,
|
139 |
"eval_steps_per_second": 1.017,
|
140 |
"step": 12000
|
141 |
+
},
|
142 |
+
{
|
143 |
+
"epoch": 1.63,
|
144 |
+
"learning_rate": 0.0008809535488301369,
|
145 |
+
"loss": 1.0846,
|
146 |
+
"step": 14000
|
147 |
+
},
|
148 |
+
{
|
149 |
+
"epoch": 1.63,
|
150 |
+
"eval_accuracy": 0.8750254013411908,
|
151 |
+
"eval_bertscore_f1": 0.9330909099915095,
|
152 |
+
"eval_bleu": 0.39881326611406565,
|
153 |
+
"eval_f1": 0.875070205358106,
|
154 |
+
"eval_loss": 1.832938551902771,
|
155 |
+
"eval_rouge1": 0.6061633599628911,
|
156 |
+
"eval_rouge2": 0.39694115489567416,
|
157 |
+
"eval_rougeL": 0.550297473532996,
|
158 |
+
"eval_rougeLsum": 0.5523036866159814,
|
159 |
+
"eval_runtime": 154.4147,
|
160 |
+
"eval_samples_per_second": 63.737,
|
161 |
+
"eval_steps_per_second": 0.997,
|
162 |
+
"step": 14000
|
163 |
}
|
164 |
],
|
165 |
"max_steps": 85840,
|
166 |
"num_train_epochs": 10,
|
167 |
+
"total_flos": 1.918701302527181e+16,
|
168 |
"trial_name": null,
|
169 |
"trial_params": null
|
170 |
}
|
pytorch_model.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 307910149
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ff885e6aadd3d270b0e549f68ea1bd5fb91a649e29371ed75f3a8d66d517cf10
|
3 |
size 307910149
|