{
  "activation": "gelu",
  "attention_dropout": 0.1,
  "dim": 768,
  "dropout": 0.1,
  "hidden_dim": 3072,
  "initializer_range": 0.02,
  "max_position_embeddings": 512,
  "model_type": "distilbert",
  "n_heads": 12,
  "n_layers": 6,
  "output_past": true,
  "pad_token_id": 0,
  "qa_dropout": 0.1,
  "seq_classif_dropout": 0.2,
  "sinusoidal_pos_embds": false,
  "tie_weights_": true,
  "vocab_size": 28996
}
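
A minimal sketch of how this configuration could be loaded with the Hugging Face transformers library, assuming the JSON above is saved as config.json; the file name and the choice of DistilBertModel are illustrative, not dictated by the config itself:

from transformers import DistilBertConfig, DistilBertModel

# Assumed file name: the JSON above saved locally as config.json.
config = DistilBertConfig.from_json_file("config.json")

# Build a randomly initialized (not pretrained) model matching these
# hyperparameters: 6 layers, 12 heads, hidden size 768, FFN size 3072,
# GELU activations.
model = DistilBertModel(config)
print(config.n_layers, config.n_heads, config.dim)  # 6 12 768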