{
  "architectures": [
    "XvectorModel"
  ],
  "auto_map": {
    "AutoConfig": "configuration_xvector.XvectorConfig",
    "AutoModel": "modeling_xvector.XvectorModel",
    "AutoModelForAudioClassification": "modeling_xvector.XvectorModelForSequenceClassification"
  },
  "hidden_size": 512,
  "hop_length": 10,
  "initializer_range": 0.02,
  "loss_fn": "aam",
  "mean_norm": true,
  "model_type": "xvector",
  "n_mels": 40,
  "norm_type": "sentence",
  "num_classes": 5994,
  "sample_rate": 16000,
  "std_norm": false,
  "tdnn_blocks": 5,
  "tdnn_channels": [
    512,
    512,
    512,
    512,
    1500
  ],
  "tdnn_dilations": [
    1,
    2,
    3,
    1,
    1
  ],
  "tdnn_kernel_sizes": [
    5,
    3,
    3,
    1,
    1
  ],
  "torch_dtype": "float32",
  "transformers_version": "4.31.0",
  "win_length": 25
}