nicoladecao committed on
Commit
fb91897
1 Parent(s): 35971bd

Update config.json

Browse files
Files changed (1) hide show
  1. config.json +9 -3
config.json CHANGED
@@ -1,14 +1,16 @@
1
  {
2
  "_name_or_path": "facebook/genre-kilt",
3
- "activation_dropout": 0.1,
4
  "activation_function": "gelu",
5
  "add_bias_logits": false,
6
  "add_final_layer_norm": false,
7
  "architectures": [
8
  "BartForConditionalGeneration"
9
  ],
10
- "attention_dropout": 0.1,
11
  "bos_token_id": 0,
 
 
12
  "d_model": 1024,
13
  "decoder_attention_heads": 16,
14
  "decoder_ffn_dim": 4096,
@@ -16,6 +18,7 @@
16
  "decoder_layers": 12,
17
  "decoder_start_token_id": 2,
18
  "dropout": 0.1,
 
19
  "encoder_attention_heads": 16,
20
  "encoder_ffn_dim": 4096,
21
  "encoder_layerdrop": 0.0,
@@ -33,9 +36,12 @@
33
  "min_length": 0,
34
  "model_type": "bart",
35
  "normalize_before": false,
36
- "normalize_embedding": true,
 
37
  "num_hidden_layers": 12,
 
38
  "pad_token_id": 1,
 
39
  "scale_embedding": false,
40
  "static_position_embeddings": false,
41
  "student_decoder_layers": null,
 
1
  {
2
  "_name_or_path": "facebook/genre-kilt",
3
+ "activation_dropout": 0.0,
4
  "activation_function": "gelu",
5
  "add_bias_logits": false,
6
  "add_final_layer_norm": false,
7
  "architectures": [
8
  "BartForConditionalGeneration"
9
  ],
10
+ "attention_dropout": 0.0,
11
  "bos_token_id": 0,
12
+ "classif_dropout": 0.0,
13
+ "classifier_dropout": 0.0,
14
  "d_model": 1024,
15
  "decoder_attention_heads": 16,
16
  "decoder_ffn_dim": 4096,
 
18
  "decoder_layers": 12,
19
  "decoder_start_token_id": 2,
20
  "dropout": 0.1,
21
+ "early_stopping": true,
22
  "encoder_attention_heads": 16,
23
  "encoder_ffn_dim": 4096,
24
  "encoder_layerdrop": 0.0,
 
36
  "min_length": 0,
37
  "model_type": "bart",
38
  "normalize_before": false,
39
+ "normalize_embedding": false,
40
+ "num_beams": 6,
41
  "num_hidden_layers": 12,
42
+ "output_past": true,
43
  "pad_token_id": 1,
44
+ "replacing_rate": 0,
45
  "scale_embedding": false,
46
  "static_position_embeddings": false,
47
  "student_decoder_layers": null,