Muennighoff committed on
Commit
5c3059f
1 Parent(s): 1e22ca5

Update config.json

Files changed (1): config.json +7 −2
config.json CHANGED
@@ -1,8 +1,14 @@
 {
-  "_name_or_path": "/data/niklas/sgpt2/sgpt2_m8x7_bs256_1253_token03",
+  "_name_or_path": "GritLM/GritLM-8x7B",
+  "model_type": "mixtral",
   "architectures": [
     "MixtralForCausalLM"
   ],
+  "auto_map": {
+    "AutoModel": "modeling_gritlm8x7b.MixtralModel",
+    "AutoModelForCausalLM": "modeling_gritlm8x7b.MixtralForCausalLM",
+    "AutoModelForSequenceClassification": "modeling_gritlm8x7b.MixtralForSequenceClassification"
+  },
   "attention_dropout": 0.0,
   "bos_token_id": 1,
   "eos_token_id": 2,
@@ -11,7 +17,6 @@
   "initializer_range": 0.02,
   "intermediate_size": 14336,
   "max_position_embeddings": 32768,
-  "model_type": "mixtral",
   "num_attention_heads": 32,
   "num_experts_per_tok": 2,
   "num_hidden_layers": 32,