mamba2-130m / config.json
km
Model release
3a5aea0
raw
history blame
No virus
330 Bytes
{
"d_model": 768,
"d_intermediate": 0,
"n_layer": 24,
"vocab_size": 50277,
"ssm_cfg": {
"layer": "Mamba2"
},
"attn_layer_idx": [],
"attn_cfg": {},
"rms_norm": true,
"residual_in_fp32": true,
"fused_add_norm": true,
"pad_vocab_size_multiple": 16,
"tie_embeddings": true
}