Tongjilibo committed on
Commit
1dfa574
1 Parent(s): 77ef707

增加transformer-xl

Browse files
transfo-xl-wt103/bert4torch_config.json ADDED
@@ -0,0 +1,51 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "model": "transformer_xl",
3
+ "segment_vocab_size": 0,
4
+ "adaptive": true,
5
+ "attn_type": 0,
6
+ "clamp_len": 1000,
7
+ "cutoffs": [
8
+ 20000,
9
+ 40000,
10
+ 200000
11
+ ],
12
+ "d_embed": 1024,
13
+ "d_head": 64,
14
+ "intermediate_size": 4096,
15
+ "hidden_size": 1024,
16
+ "div_val": 4,
17
+ "is_dropout": true,
18
+ "adaptive_embedding": true,
19
+ "attention_probs_dropout_prob": 0.0,
20
+ "hidden_dropout_prob": 0.1,
21
+ "hidden_act": "relu",
22
+ "eos_token_id": 0,
23
+ "ext_len": 0,
24
+ "init": "normal",
25
+ "init_range": 0.01,
26
+ "init_std": 0.02,
27
+ "layer_norm_epsilon": 1e-05,
28
+ "mem_len": 1600,
29
+ "num_attention_heads": 16,
30
+ "num_hidden_layers": 18,
31
+ "pre_layernorm": false,
32
+ "proj_init_std": 0.01,
33
+ "same_length": true,
34
+ "sample_softmax": -1,
35
+ "task_specific_params": {
36
+ "text-generation": {
37
+ "do_sample": true,
38
+ "max_length": 250
39
+ }
40
+ },
41
+ "tgt_len": 128,
42
+ "tie_projs": [
43
+ false,
44
+ true,
45
+ true,
46
+ true
47
+ ],
48
+ "tie_weight": true,
49
+ "untie_r": true,
50
+ "vocab_size": 267735
51
+ }