{ "architecture": "WhisperEncoder", "dtype": "float16", "num_hidden_layers": 32, "num_attention_heads": 20, "hidden_size": 1280, "max_position_embeddings": 1500, "has_position_embedding": true, "n_mels": 128, "vocab_size": 51866, "hidden_act": "gelu", "num_languages": 100, "quantization": { "quant_algo": null } }