Gunulhona committed on
Commit
c51c512
1 Parent(s): d7a37ad

Upload BartForConditionalGeneration

Browse files
Files changed (3) hide show
  1. config.json +4 -4
  2. generation_config.json +9 -0
  3. pytorch_model.bin +2 -2
config.json CHANGED
@@ -5,16 +5,16 @@
5
  "BartForConditionalGeneration"
6
  ],
7
  "attention_dropout": 0.0,
8
- "bos_token_id": 0,
9
  "classifier_dropout": 0.0,
10
  "d_model": 768,
11
  "decoder_attention_heads": 12,
12
  "decoder_ffn_dim": 4096,
13
  "decoder_layerdrop": 0.0,
14
- "decoder_layers": 9,
15
  "decoder_start_token_id": 2,
16
  "dropout": 0.1,
17
- "encoder_attention_heads": 12,
18
  "encoder_ffn_dim": 4096,
19
  "encoder_layerdrop": 0.0,
20
  "encoder_layers": 3,
@@ -38,7 +38,7 @@
38
  "pad_token_id": 3,
39
  "scale_embedding": false,
40
  "torch_dtype": "float32",
41
- "transformers_version": "4.18.0",
42
  "use_cache": true,
43
  "vocab_size": 30000
44
  }
 
5
  "BartForConditionalGeneration"
6
  ],
7
  "attention_dropout": 0.0,
8
+ "bos_token_id": 2,
9
  "classifier_dropout": 0.0,
10
  "d_model": 768,
11
  "decoder_attention_heads": 12,
12
  "decoder_ffn_dim": 4096,
13
  "decoder_layerdrop": 0.0,
14
+ "decoder_layers": 6,
15
  "decoder_start_token_id": 2,
16
  "dropout": 0.1,
17
+ "encoder_attention_heads": 24,
18
  "encoder_ffn_dim": 4096,
19
  "encoder_layerdrop": 0.0,
20
  "encoder_layers": 3,
 
38
  "pad_token_id": 3,
39
  "scale_embedding": false,
40
  "torch_dtype": "float32",
41
+ "transformers_version": "4.26.0",
42
  "use_cache": true,
43
  "vocab_size": 30000
44
  }
generation_config.json ADDED
@@ -0,0 +1,9 @@
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_from_model_config": true,
3
+ "bos_token_id": 2,
4
+ "decoder_start_token_id": 2,
5
+ "eos_token_id": 2,
6
+ "forced_eos_token_id": 2,
7
+ "pad_token_id": 3,
8
+ "transformers_version": "4.26.0"
9
+ }
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:46f6dcae927523dda05b201230e5b6988995d7df72c5ea6472c4a3a13b427fc1
3
- size 599565821
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:35e591d7889119520065668adbf93c59e79181f31c2e0a6d455b4524a01a9cb1
3
+ size 467234589