{ "architectures": [ "XvectorModel" ], "auto_map": { "AutoConfig": "configuration_xvector.XvectorConfig", "AutoModel": "modeling_xvector.XvectorModel", "AutoModelForAudioClassification": "modeling_xvector.XvectorModelForSequenceClassification" }, "hidden_size": 512, "hop_length": 10, "initializer_range": 0.02, "loss_fn": "aam", "mean_norm": true, "model_type": "xvector", "n_mels": 40, "norm_type": "sentence", "num_classes": 5994, "sample_rate": 16000, "std_norm": false, "tdnn_blocks": 5, "tdnn_channels": [ 512, 512, 512, 512, 1500 ], "tdnn_dilations": [ 1, 2, 3, 1, 1 ], "tdnn_kernel_sizes": [ 5, 3, 3, 1, 1 ], "torch_dtype": "float32", "transformers_version": "4.31.0", "win_length": 25 }