{
  "architecture": "WhisperEncoder",
  "dtype": "float16",
  "num_hidden_layers": 6,
  "num_attention_heads": 8,
  "hidden_size": 512,
  "max_position_embeddings": 1500,
  "has_position_embedding": true,
  "n_mels": 80,
  "vocab_size": 51864,
  "hidden_act": "gelu",
  "num_languages": 99,
  "quantization": {
    "quant_algo": null
  }
}