mamba-370m / config.json
{
"architectures": [
"MambaModelForCausalLM"
],
"auto_map": {
"AutoConfig": "configuration_mamba.MambaConfig",
"AutoModel": "modeling_mamba.MambaModel",
"AutoModelForCausalLM": "modeling_mamba.MambaModelForCausalLM"
},
"d_model": 1024,
"fused_add_norm": true,
"model_type": "mamba",
"n_layer": 48,
"pad_vocab_size_multiple": 8,
"residual_in_fp32": true,
"rms_norm": true,
"ssm_cfg": {},
"torch_dtype": "float16",
"transformers_version": "4.37.2",
"vocab_size": 50277
}
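Because auto_map points at custom modules shipped with the checkpoint (configuration_mamba.MambaConfig, modeling_mamba.MambaModelForCausalLM), loading it through transformers requires trust_remote_code=True. Below is a minimal loading sketch; the repository id "mjschock/mamba-370m" and the availability of a tokenizer in that repo are assumptions inferred from the file path, not confirmed by the config itself.

```python
# Minimal loading sketch. The repo id is an assumption based on the file path
# "mamba-370m / config.json"; adjust it to the actual Hub repository.
import torch
from transformers import AutoModelForCausalLM, AutoTokenizer

model_id = "mjschock/mamba-370m"  # assumed repository id

# trust_remote_code=True is required because the config's auto_map routes
# AutoConfig / AutoModelForCausalLM to custom configuration_mamba and
# modeling_mamba modules stored alongside the weights.
model = AutoModelForCausalLM.from_pretrained(
    model_id,
    trust_remote_code=True,
    torch_dtype=torch.float16,  # matches "torch_dtype": "float16" in the config
)
tokenizer = AutoTokenizer.from_pretrained(model_id, trust_remote_code=True)

inputs = tokenizer("Mamba is a state space model that", return_tensors="pt")
outputs = model.generate(**inputs, max_new_tokens=32)
print(tokenizer.decode(outputs[0], skip_special_tokens=True))
```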