{ "architecture": "WhisperEncoder", "dtype": "float16", "num_hidden_layers": 6, "num_attention_heads": 8, "hidden_size": 512, "max_position_embeddings": 1500, "has_position_embedding": true, "n_mels": 80, "vocab_size": 51864, "hidden_act": "gelu", "num_languages": 99, "quantization": { "quant_algo": null } }