Upload config.json
config.json CHANGED (+7 -1)
@@ -1,4 +1,5 @@
 {
+  "_name_or_path": "Zyphra/Zamba2-2.7B",
   "add_bias_linear": false,
   "architectures": [
     "Zamba2ForCausalLM"
@@ -69,8 +70,12 @@
     "m",
     "m"
   ],
+  "num_mem_blocks": 2,
+  "max_position_embeddings": 4096,
   "lora_rank": 128,
   "mamba_headdim": 64,
+  "use_mem_rope": false,
+  "rope_theta": 10000,
   "model_type": "zamba2",
   "num_attention_heads": 32,
   "num_hidden_layers": 54,
@@ -86,5 +91,6 @@
   "use_cache": true,
   "use_mamba_kernels": true,
   "use_shared_block_lora": true,
-  "
+  "use_shared_attention_lora": false,
+  "vocab_size": 32001
 }
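Below is a minimal verification sketch, not part of the commit: assuming huggingface_hub is installed and Zyphra/Zamba2-2.7B (the repo id shown in _name_or_path) is reachable, it downloads the current config.json and checks that the keys added in this diff carry the values shown above.

import json

from huggingface_hub import hf_hub_download

# Keys added in this commit, with the values taken from the diff above.
ADDED_KEYS = {
    "_name_or_path": "Zyphra/Zamba2-2.7B",
    "num_mem_blocks": 2,
    "max_position_embeddings": 4096,
    "use_mem_rope": False,
    "rope_theta": 10000,
    "use_shared_attention_lora": False,
    "vocab_size": 32001,
}

# Fetch config.json from the hub (assumes network access and that the
# repo id matches the _name_or_path value in the diff).
config_path = hf_hub_download(repo_id="Zyphra/Zamba2-2.7B", filename="config.json")
with open(config_path) as f:
    config = json.load(f)

# Report whether each added key is present and matches the diff.
for key, expected in ADDED_KEYS.items():
    actual = config.get(key, "<missing>")
    status = "OK" if actual == expected else "MISMATCH"
    print(f"{status}: {key} = {actual!r} (expected {expected!r})")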