arxyzan committed on
Commit
035cb20
1 Parent(s): 92672e9

Hezar: Upload model and config

Browse files
Files changed (1) hide show
  1. config.yaml +17 -0
config.yaml ADDED
@@ -0,0 +1,17 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ name: distilbert_lm
2
+ task: language_modeling
3
+ activation: gelu
4
+ attention_dropout: 0.1
5
+ dim: 768
6
+ dropout: 0.1
7
+ hidden_dim: 3072
8
+ initializer_range: 0.02
9
+ max_position_embeddings: 512
10
+ model_type: distilbert
11
+ n_heads: 12
12
+ n_layers: 6
13
+ output_past: true
14
+ pad_token_id: 0
15
+ qa_dropout: 0.1
16
+ tie_weights_: true
17
+ vocab_size: 42000