Patrick von Platen committed on
Commit
36e5036
1 Parent(s): f7f0882

correct models

Browse files
Files changed (3) hide show
  1. config.json +30 -2
  2. pytorch_model.bin +2 -2
  3. tf_model.h5 +2 -2
config.json CHANGED
@@ -14,13 +14,41 @@
14
  "is_encoder_decoder": true,
15
  "layer_norm_epsilon": 1e-06,
16
  "model_type": "t5",
 
17
  "num_decoder_layers": 24,
18
  "num_heads": 32,
19
  "num_layers": 24,
20
  "output_past": true,
21
  "pad_token_id": 0,
22
  "relative_attention_num_buckets": 32,
23
- "tie_word_embeddings": false,
24
- "tokenizer_class": "T5Tokenizer",
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
25
  "vocab_size": 32128
26
  }
14
  "is_encoder_decoder": true,
15
  "layer_norm_epsilon": 1e-06,
16
  "model_type": "t5",
17
+ "n_positions": 512,
18
  "num_decoder_layers": 24,
19
  "num_heads": 32,
20
  "num_layers": 24,
21
  "output_past": true,
22
  "pad_token_id": 0,
23
  "relative_attention_num_buckets": 32,
24
+ "task_specific_params": {
25
+ "summarization": {
26
+ "early_stopping": true,
27
+ "length_penalty": 2.0,
28
+ "max_length": 200,
29
+ "min_length": 30,
30
+ "no_repeat_ngram_size": 3,
31
+ "num_beams": 4,
32
+ "prefix": "summarize: "
33
+ },
34
+ "translation_en_to_de": {
35
+ "early_stopping": true,
36
+ "max_length": 300,
37
+ "num_beams": 4,
38
+ "prefix": "translate English to German: "
39
+ },
40
+ "translation_en_to_fr": {
41
+ "early_stopping": true,
42
+ "max_length": 300,
43
+ "num_beams": 4,
44
+ "prefix": "translate English to French: "
45
+ },
46
+ "translation_en_to_ro": {
47
+ "early_stopping": true,
48
+ "max_length": 300,
49
+ "num_beams": 4,
50
+ "prefix": "translate English to Romanian: "
51
+ }
52
+ },
53
  "vocab_size": 32128
54
  }
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6334a3a1c71d8272fea59e25b95d7d98765d2407f49deca24f01bc6fb7d992e9
3
- size 11406629341
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cb805163c662345cb7298519125bd6606544f63a6f63e94d7960f26a824f4de4
3
+ size 11406629461
tf_model.h5 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6c3ab80377b37004b176e56820534832e7c18af0c391756dbf0ef224d25b5a2d
3
- size 11539032000
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5945a34124f8c7aef538b37abaff0faf6bc56bd96b1cd13acdbca184ad6a9baf
3
+ size 11407431672