fuliucansheng committed on
Commit
1611438
1 Parent(s): 17fef65

mass base config update

Browse files
Files changed (1) hide show
  1. mass-base-uncased-config.json +27 -5
mass-base-uncased-config.json CHANGED
@@ -3,13 +3,35 @@
3
  "encoder_ffn_embed_dim": 3072,
4
  "encoder_attention_heads": 12,
5
  "encoder_layers": 6,
6
- "dropout": 0.1,
7
- "attention_dropout": 0.1,
8
- "activation_dropout": 0.1,
9
- "activation_fn": "gelu",
10
  "decoder_embed_dim": 768,
11
  "decoder_ffn_embed_dim": 3072,
12
- "decoder_attention_heads": 6,
13
  "decoder_layers": 6,
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
14
  "vocab_size": 30522
15
  }
3
  "encoder_ffn_embed_dim": 3072,
4
  "encoder_attention_heads": 12,
5
  "encoder_layers": 6,
6
+ "encoder_normalize_before": 0,
7
+ "encoder_learned_pos": 0,
8
+ "decoder_learned_pos": 0,
 
9
  "decoder_embed_dim": 768,
10
  "decoder_ffn_embed_dim": 3072,
 
11
  "decoder_layers": 6,
12
+ "decoder_attention_heads": 6,
13
+ "decoder_normalize_before": 0,
14
+ "attention_dropout": 0.1,
15
+ "activation_dropout": 0.1,
16
+ "activation_fn": "gelu",
17
+ "dropout": 0.1,
18
+ "adaptive_softmax_dropout": 0,
19
+ "share_decoder_input_output_embed": 1,
20
+ "share_all_embeddings": 1,
21
+ "no_token_positional_embeddings": 0,
22
+ "no_cross_attention": 0,
23
+ "cross_self_attention": 0,
24
+ "decoder_output_dim": 768,
25
+ "decoder_input_dim": 768,
26
+ "no_scale_embedding": 0,
27
+ "adaptive_input": 1,
28
+ "tie_adaptive_weights": 0,
29
+ "layernorm_embedding": 0,
30
+ "encoder_layerdrop": 0,
31
+ "decoder_layerdrop": 0,
32
+ "quant_noise_pq": 0,
33
+ "quant_noise_pq_block_size": 8,
34
+ "quant_noise_scalar": 0,
35
+ "is_encoder_decoder": 1,
36
  "vocab_size": 30522
37
  }