voiceclap-small / config.json
gijs's picture
Initial release: VoiceCLAP-Small (BUD-E-Whisper + MiniLM, dual-tower CLAP, 1 epoch on voiceclap_10)
f5fcbcd verified
raw
history blame contribute delete
645 Bytes
{
"architectures": [
"VoiceCLAPSmall"
],
"dtype": "float32",
"embed_dim": 768,
"model_type": "voiceclap-small",
"n_ctx": 1500,
"n_head": 12,
"n_layer": 12,
"n_mels": 80,
"n_state": 768,
"text_hidden_dim": 384,
"text_intermediate_size": 1536,
"text_layer_norm_eps": 1e-12,
"text_max_position_embeddings": 512,
"text_num_heads": 12,
"text_num_layers": 6,
"text_pad_token_id": 0,
"text_proj_hidden": 576,
"text_vocab_size": 30522,
"transformers_version": "5.7.0",
"auto_map": {
"AutoConfig": "configuration_voiceclap.VoiceCLAPSmallConfig",
"AutoModel": "modeling_voiceclap.VoiceCLAPSmall"
}
}