matthewkenney committed on
Commit
ad882a1
1 Parent(s): 85fa03a

Update config.json

Browse files
Files changed (1) hide show
  1. config.json +5 -6
config.json CHANGED
@@ -2,20 +2,19 @@
2
  "_name_or_path": "microsoft/phi-1_5",
3
  "activation_function": "gelu_new",
4
  "architectures": [
5
- "PhiForCausalLM"
6
  ],
7
  "attn_pdrop": 0.0,
8
  "auto_map": {
9
- "AutoConfig": "microsoft/phi-1_5--configuration_phi.PhiConfig",
10
- "AutoModelForCausalLM": "microsoft/phi-1_5--modeling_phi.PhiForCausalLM"
11
  },
12
  "embd_pdrop": 0.0,
13
- "flash_attn": false,
14
  "flash_rotary": false,
15
  "fused_dense": false,
16
  "initializer_range": 0.02,
17
  "layer_norm_epsilon": 1e-05,
18
- "model_type": "phi",
19
  "n_embd": 2048,
20
  "n_head": 32,
21
  "n_head_kv": null,
@@ -26,6 +25,6 @@
26
  "rotary_dim": 32,
27
  "tie_word_embeddings": false,
28
  "torch_dtype": "float16",
29
- "transformers_version": "4.35.2",
30
  "vocab_size": 51200
31
  }
 
2
  "_name_or_path": "microsoft/phi-1_5",
3
  "activation_function": "gelu_new",
4
  "architectures": [
5
+ "MixFormerSequentialForCausalLM"
6
  ],
7
  "attn_pdrop": 0.0,
8
  "auto_map": {
9
+ "AutoConfig": "microsoft/phi-1_5--configuration_mixformer_sequential.MixFormerSequentialConfig",
10
+ "AutoModelForCausalLM": "microsoft/phi-1_5--modeling_mixformer_sequential.MixFormerSequentialForCausalLM"
11
  },
12
  "embd_pdrop": 0.0,
 
13
  "flash_rotary": false,
14
  "fused_dense": false,
15
  "initializer_range": 0.02,
16
  "layer_norm_epsilon": 1e-05,
17
+ "model_type": "mixformer-sequential",
18
  "n_embd": 2048,
19
  "n_head": 32,
20
  "n_head_kv": null,
 
25
  "rotary_dim": 32,
26
  "tie_word_embeddings": false,
27
  "torch_dtype": "float16",
28
+ "transformers_version": "4.35.1",
29
  "vocab_size": 51200
30
  }