silmi224 committed on
Commit
4131c04
1 Parent(s): 30aed59

Training in progress, step 10

Browse files
config.json CHANGED
@@ -24,7 +24,6 @@
24
  "decoder_layers": 6,
25
  "decoder_start_token_id": 2,
26
  "dropout": 0.1,
27
- "early_stopping": true,
28
  "encoder_attention_heads": 12,
29
  "encoder_ffn_dim": 3072,
30
  "encoder_layerdrop": 0.0,
@@ -45,8 +44,8 @@
45
  "length_penalty": 2.0,
46
  "max_decoder_position_embeddings": 1024,
47
  "max_encoder_position_embeddings": 16384,
48
- "max_length": 512,
49
- "min_length": 256,
50
  "model_type": "led",
51
  "no_repeat_ngram_size": 3,
52
  "num_beams": 2,
 
24
  "decoder_layers": 6,
25
  "decoder_start_token_id": 2,
26
  "dropout": 0.1,
 
27
  "encoder_attention_heads": 12,
28
  "encoder_ffn_dim": 3072,
29
  "encoder_layerdrop": 0.0,
 
44
  "length_penalty": 2.0,
45
  "max_decoder_position_embeddings": 1024,
46
  "max_encoder_position_embeddings": 16384,
47
+ "max_length": 256,
48
+ "min_length": 128,
49
  "model_type": "led",
50
  "no_repeat_ngram_size": 3,
51
  "num_beams": 2,
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a105de7a2dcc684878dea5e6b0ed2b65207019f8d813f0bd3e1bae08d56fba54
3
  size 647614116
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b7455581ba41b997039883a26eeeed258740e22133fe84af4edd90780e1497de
3
  size 647614116
runs/Jul07_02-45-31_56a5d84e66da/events.out.tfevents.1720320345.56a5d84e66da.34.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4cca0dbc4871f3166c27d952f6129dd15ca6236d4a8c44097c9be0522aa85f6e
3
+ size 5797
tokenizer.json CHANGED
@@ -2,13 +2,13 @@
2
  "version": "1.0",
3
  "truncation": {
4
  "direction": "Right",
5
- "max_length": 512,
6
  "strategy": "LongestFirst",
7
  "stride": 0
8
  },
9
  "padding": {
10
  "strategy": {
11
- "Fixed": 512
12
  },
13
  "direction": "Right",
14
  "pad_to_multiple_of": null,
 
2
  "version": "1.0",
3
  "truncation": {
4
  "direction": "Right",
5
+ "max_length": 256,
6
  "strategy": "LongestFirst",
7
  "stride": 0
8
  },
9
  "padding": {
10
  "strategy": {
11
+ "Fixed": 256
12
  },
13
  "direction": "Right",
14
  "pad_to_multiple_of": null,
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:5916a8649818649a2a5f89d99b862d6173b7cc4bd8c9d8819eb325d8604b6f55
3
  size 5240
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:518e3ea9bbfadf8f6f9a2e00e8c2f104262a2aea08ed9eb73247c938438ff5b6
3
  size 5240