Training in progress, step 10
Browse files
config.json
CHANGED
@@ -24,7 +24,6 @@
|
|
24 |
"decoder_layers": 6,
|
25 |
"decoder_start_token_id": 2,
|
26 |
"dropout": 0.1,
|
27 |
-
"early_stopping": true,
|
28 |
"encoder_attention_heads": 12,
|
29 |
"encoder_ffn_dim": 3072,
|
30 |
"encoder_layerdrop": 0.0,
|
@@ -45,8 +44,8 @@
|
|
45 |
"length_penalty": 2.0,
|
46 |
"max_decoder_position_embeddings": 1024,
|
47 |
"max_encoder_position_embeddings": 16384,
|
48 |
-
"max_length":
|
49 |
-
"min_length":
|
50 |
"model_type": "led",
|
51 |
"no_repeat_ngram_size": 3,
|
52 |
"num_beams": 2,
|
|
|
24 |
"decoder_layers": 6,
|
25 |
"decoder_start_token_id": 2,
|
26 |
"dropout": 0.1,
|
|
|
27 |
"encoder_attention_heads": 12,
|
28 |
"encoder_ffn_dim": 3072,
|
29 |
"encoder_layerdrop": 0.0,
|
|
|
44 |
"length_penalty": 2.0,
|
45 |
"max_decoder_position_embeddings": 1024,
|
46 |
"max_encoder_position_embeddings": 16384,
|
47 |
+
"max_length": 256,
|
48 |
+
"min_length": 128,
|
49 |
"model_type": "led",
|
50 |
"no_repeat_ngram_size": 3,
|
51 |
"num_beams": 2,
|
model.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 647614116
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b7455581ba41b997039883a26eeeed258740e22133fe84af4edd90780e1497de
|
3 |
size 647614116
|
runs/Jul07_02-45-31_56a5d84e66da/events.out.tfevents.1720320345.56a5d84e66da.34.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4cca0dbc4871f3166c27d952f6129dd15ca6236d4a8c44097c9be0522aa85f6e
|
3 |
+
size 5797
|
tokenizer.json
CHANGED
@@ -2,13 +2,13 @@
|
|
2 |
"version": "1.0",
|
3 |
"truncation": {
|
4 |
"direction": "Right",
|
5 |
-
"max_length":
|
6 |
"strategy": "LongestFirst",
|
7 |
"stride": 0
|
8 |
},
|
9 |
"padding": {
|
10 |
"strategy": {
|
11 |
-
"Fixed":
|
12 |
},
|
13 |
"direction": "Right",
|
14 |
"pad_to_multiple_of": null,
|
|
|
2 |
"version": "1.0",
|
3 |
"truncation": {
|
4 |
"direction": "Right",
|
5 |
+
"max_length": 256,
|
6 |
"strategy": "LongestFirst",
|
7 |
"stride": 0
|
8 |
},
|
9 |
"padding": {
|
10 |
"strategy": {
|
11 |
+
"Fixed": 256
|
12 |
},
|
13 |
"direction": "Right",
|
14 |
"pad_to_multiple_of": null,
|
training_args.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 5240
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:518e3ea9bbfadf8f6f9a2e00e8c2f104262a2aea08ed9eb73247c938438ff5b6
|
3 |
size 5240
|