Cxxs committed on
Commit
220b99e
1 Parent(s): c288fed

Upload 3 files

Browse files
finetune/mm/SPHINX/SPHINX-MoE/config.json ADDED
@@ -0,0 +1,20 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "dim": 4096,
3
+ "hidden_dim": 14336,
4
+ "head_dim": 128,
5
+ "n_layers": 32,
6
+ "n_heads": 32,
7
+ "n_kv_heads": 8,
8
+ "vocab_size": 32000,
9
+ "norm_eps": 1e-05,
10
+ "rope_theta": 1000000,
11
+ "max_batch_size": 32,
12
+ "max_seq_len": 4096,
13
+ "moe": {
14
+ "num_experts_per_tok": 2,
15
+ "num_experts": 8
16
+ },
17
+ "load_balancing_weight": 0.1,
18
+ "rope_scaling": null,
19
+ "load_pretrained_visual_encoder": false
20
+ }
finetune/mm/SPHINX/SPHINX-MoE/meta.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ {
2
+ "llama_type": "mistral_sparse_ens"
3
+ }
finetune/mm/SPHINX/SPHINX-MoE/tokenizer.model ADDED
Binary file (493 kB). View file