Training in progress, step 5000
Browse files
- last-checkpoint/generation_config.json +6 -1
- last-checkpoint/rng_state.pth +1 -1
- last-checkpoint/tokenizer.json +6 -1
- last-checkpoint/trainer_state.json +24 -0
- last-checkpoint/training_args.bin +1 -1
- runs/May23_07-36-34_dca52c8e2827/events.out.tfevents.1684827413.dca52c8e2827.7053.0 +2 -2
- runs/May23_08-30-43_dca52c8e2827/1684830663.0701513/events.out.tfevents.1684830663.dca52c8e2827.20947.1 +3 -0
- runs/May23_08-30-43_dca52c8e2827/events.out.tfevents.1684830663.dca52c8e2827.20947.0 +3 -0
- runs/May23_08-52-00_dca52c8e2827/1684831937.796584/events.out.tfevents.1684831937.dca52c8e2827.26281.1 +3 -0
- runs/May23_08-52-00_dca52c8e2827/events.out.tfevents.1684831937.dca52c8e2827.26281.0 +3 -0
- runs/May23_09-05-35_dca52c8e2827/1684832750.9667075/events.out.tfevents.1684832750.dca52c8e2827.29730.1 +3 -0
- runs/May23_09-05-35_dca52c8e2827/events.out.tfevents.1684832750.dca52c8e2827.29730.0 +3 -0
- tokenizer.json +6 -1
- training_args.bin +1 -1
last-checkpoint/generation_config.json
CHANGED
@@ -1,5 +1,10 @@
|
|
1 |
{
|
2 |
-
"
|
|
|
|
|
|
|
|
|
|
|
3 |
"pad_token_id": 0,
|
4 |
"transformers_version": "4.30.0.dev0"
|
5 |
}
|
|
|
1 |
{
|
2 |
+
"decoder_start_token_id": 101,
|
3 |
+
"early_stopping": true,
|
4 |
+
"eos_token_id": 102,
|
5 |
+
"max_length": 256,
|
6 |
+
"min_length": 16,
|
7 |
+
"num_beams": 10,
|
8 |
"pad_token_id": 0,
|
9 |
"transformers_version": "4.30.0.dev0"
|
10 |
}
|
last-checkpoint/rng_state.pth
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 14575
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6b06473226c5124a3c55575628e48413a733d11d58cede4589852b479bbad85a
|
3 |
size 14575
|
last-checkpoint/tokenizer.json
CHANGED
@@ -1,6 +1,11 @@
|
|
1 |
{
|
2 |
"version": "1.0",
|
3 |
-
"truncation": null,
|
|
|
|
|
|
|
|
|
|
|
4 |
"padding": null,
|
5 |
"added_tokens": [
|
6 |
{
|
|
|
1 |
{
|
2 |
"version": "1.0",
|
3 |
+
"truncation": {
|
4 |
+
"direction": "Right",
|
5 |
+
"max_length": 256,
|
6 |
+
"strategy": "LongestFirst",
|
7 |
+
"stride": 0
|
8 |
+
},
|
9 |
"padding": null,
|
10 |
"added_tokens": [
|
11 |
{
|
last-checkpoint/trainer_state.json
CHANGED
@@ -127,6 +127,18 @@
|
|
127 |
"loss": 7.2445,
|
128 |
"step": 2000
|
129 |
},
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
130 |
{
|
131 |
"epoch": 0.87,
|
132 |
"learning_rate": 4.2e-05,
|
@@ -247,6 +259,18 @@
|
|
247 |
"loss": 3.4458,
|
248 |
"step": 4000
|
249 |
},
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
250 |
{
|
251 |
"epoch": 1.7,
|
252 |
"learning_rate": 4.62962962962963e-05,
|
|
|
127 |
"loss": 7.2445,
|
128 |
"step": 2000
|
129 |
},
|
130 |
+
{
|
131 |
+
"epoch": 0.83,
|
132 |
+
"eval_bleu": 1.523,
|
133 |
+
"eval_em": 0.0,
|
134 |
+
"eval_gen_len": 204.48,
|
135 |
+
"eval_loss": 7.561939239501953,
|
136 |
+
"eval_rm": NaN,
|
137 |
+
"eval_runtime": 100.5427,
|
138 |
+
"eval_samples_per_second": 0.497,
|
139 |
+
"eval_steps_per_second": 0.07,
|
140 |
+
"step": 2000
|
141 |
+
},
|
142 |
{
|
143 |
"epoch": 0.87,
|
144 |
"learning_rate": 4.2e-05,
|
|
|
259 |
"loss": 3.4458,
|
260 |
"step": 4000
|
261 |
},
|
262 |
+
{
|
263 |
+
"epoch": 1.66,
|
264 |
+
"eval_bleu": 16.0372,
|
265 |
+
"eval_em": 0.0,
|
266 |
+
"eval_gen_len": 76.36,
|
267 |
+
"eval_loss": 3.4201648235321045,
|
268 |
+
"eval_rm": NaN,
|
269 |
+
"eval_runtime": 91.7678,
|
270 |
+
"eval_samples_per_second": 0.545,
|
271 |
+
"eval_steps_per_second": 0.076,
|
272 |
+
"step": 4000
|
273 |
+
},
|
274 |
{
|
275 |
"epoch": 1.7,
|
276 |
"learning_rate": 4.62962962962963e-05,
|
last-checkpoint/training_args.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4155
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b1b9f4030acc1b98cd8fc39d52688ca9a4f11fa176fbaa30e9b52baf417f88e0
|
3 |
size 4155
|
runs/May23_07-36-34_dca52c8e2827/events.out.tfevents.1684827413.dca52c8e2827.7053.0
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c3f83a66e95d5f33817f9ee4be32d84953f019adbeb0377410813c55d0def778
|
3 |
+
size 21103
|
runs/May23_08-30-43_dca52c8e2827/1684830663.0701513/events.out.tfevents.1684830663.dca52c8e2827.20947.1
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c6959a247c1585714935f4eb8ee763f03ad6c96be5754256b88193487b4bc99c
|
3 |
+
size 6302
|
runs/May23_08-30-43_dca52c8e2827/events.out.tfevents.1684830663.dca52c8e2827.20947.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:311767715bc109a71e2eb7f9d3cd7c74c99660f14c361719c0462fa940b1ab60
|
3 |
+
size 9326
|
runs/May23_08-52-00_dca52c8e2827/1684831937.796584/events.out.tfevents.1684831937.dca52c8e2827.26281.1
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3cc25e01d7b09af47ad117dadb996bf4e428d5d68efba721d74cae83ae50d1f0
|
3 |
+
size 6302
|
runs/May23_08-52-00_dca52c8e2827/events.out.tfevents.1684831937.dca52c8e2827.26281.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:42247893c8ef327ac95ad581fb6a123528e91d89aaef89640a5acd0fa747419d
|
3 |
+
size 11682
|
runs/May23_09-05-35_dca52c8e2827/1684832750.9667075/events.out.tfevents.1684832750.dca52c8e2827.29730.1
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f90cc25bae2b073583e4730b049c59eef6fcbd0dd6fca70cdf1e54e443049e36
|
3 |
+
size 6302
|
runs/May23_09-05-35_dca52c8e2827/events.out.tfevents.1684832750.dca52c8e2827.29730.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:efe972f716c107f17b5f0450067f792b88cf1332f5ee653ec460d6839296fd6f
|
3 |
+
size 17316
|
tokenizer.json
CHANGED
@@ -1,6 +1,11 @@
|
|
1 |
{
|
2 |
"version": "1.0",
|
3 |
-
"truncation": null,
|
|
|
|
|
|
|
|
|
|
|
4 |
"padding": null,
|
5 |
"added_tokens": [
|
6 |
{
|
|
|
1 |
{
|
2 |
"version": "1.0",
|
3 |
+
"truncation": {
|
4 |
+
"direction": "Right",
|
5 |
+
"max_length": 256,
|
6 |
+
"strategy": "LongestFirst",
|
7 |
+
"stride": 0
|
8 |
+
},
|
9 |
"padding": null,
|
10 |
"added_tokens": [
|
11 |
{
|
training_args.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4155
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b1b9f4030acc1b98cd8fc39d52688ca9a4f11fa176fbaa30e9b52baf417f88e0
|
3 |
size 4155
|