Tongjilibo committed on
Commit
5ad53e1
1 Parent(s): c58ebc4

add roformer_chinese_sim_char_small

Browse files
roformer_chinese_sim_char_ft_small/bert4torch_config.json ADDED
@@ -0,0 +1,20 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "attention_probs_dropout_prob": 0.1,
3
+ "hidden_act": "gelu",
4
+ "hidden_dropout_prob": 0.1,
5
+ "max_position_embeddings": 512,
6
+ "hidden_size": 384,
7
+ "initializer_range": 0.02,
8
+ "intermediate_size": 1536,
9
+ "layer_norm_eps": 1e-12,
10
+ "model": "roformer",
11
+ "num_attention_heads": 6,
12
+ "num_hidden_layers": 6,
13
+ "pad_token_id": 0,
14
+ "type_vocab_size": 2,
15
+ "vocab_size": 12000,
16
+ "is_decoder": true,
17
+ "eos_token_id": 102,
18
+ "with_pool": "linear",
19
+ "pool_strategy": "pooler"
20
+ }
roformer_chinese_sim_char_small/bert4torch_config.json ADDED
@@ -0,0 +1,20 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "attention_probs_dropout_prob": 0.1,
3
+ "hidden_act": "gelu",
4
+ "hidden_dropout_prob": 0.1,
5
+ "max_position_embeddings": 512,
6
+ "hidden_size": 384,
7
+ "initializer_range": 0.02,
8
+ "intermediate_size": 1536,
9
+ "layer_norm_eps": 1e-12,
10
+ "model": "roformer",
11
+ "num_attention_heads": 6,
12
+ "num_hidden_layers": 6,
13
+ "pad_token_id": 0,
14
+ "type_vocab_size": 2,
15
+ "vocab_size": 12000,
16
+ "is_decoder": true,
17
+ "eos_token_id": 102,
18
+ "with_pool": "linear",
19
+ "pool_strategy": "pooler"
20
+ }