Edward Gow-Smith
added model f2dba93
1 {
2 "_name_or_path": "results/xlnet-base-cased-FalseTrue0-1",
3 "architectures": [
4 "XLNetForSequenceClassification"
5 ],
6 "attn_type": "bi",
7 "bi_data": false,
8 "bos_token_id": 1,
9 "clamp_len": -1,
10 "d_head": 64,
11 "d_inner": 3072,
12 "d_model": 768,
13 "dropout": 0.1,
14 "end_n_top": 5,
15 "eos_token_id": 2,
16 "ff_activation": "gelu",
17 "initializer_range": 0.02,
18 "layer_norm_eps": 1e-12,
19 "mem_len": null,
20 "model_type": "xlnet",
21 "n_head": 12,
22 "n_layer": 12,
23 "pad_token_id": 5,
24 "reuse_len": null,
25 "same_length": false,
26 "start_n_top": 5,
27 "summary_activation": "tanh",
28 "summary_last_dropout": 0.1,
29 "summary_type": "last",
30 "summary_use_proj": true,
31 "task_specific_params": {
32 "text-generation": {
33 "do_sample": true,
34 "max_length": 250
35 }
36 },
37 "transformers_version": "4.6.0.dev0",
38 "untie_r": true,
39 "use_mems_eval": true,
40 "use_mems_train": false,
41 "vocab_size": 32000
42 }
43