# ############################################################################ # Model: ECAPA-TDNN for Accent Identification # ############################################################################ # Pretrain folder (HuggingFace) pretrained_path: Jzuluaga/accent-id-commonaccent_ecapa # Feature parameters n_mels: 80 # Output parameters n_languages: 16 # Possible languages in the dataset emb_dim: 192 # dimensionality of the embeddings # Model params compute_features: !new:speechbrain.lobes.features.Fbank n_mels: !ref mean_var_norm: !new:speechbrain.processing.features.InputNormalization norm_type: sentence std_norm: False # Embedding Model embedding_model: !new:speechbrain.lobes.models.ECAPA_TDNN.ECAPA_TDNN input_size: !ref activation: !name:torch.nn.LeakyReLU channels: [1024, 1024, 1024, 1024, 3072] kernel_sizes: [5, 3, 3, 3, 1] dilations: [1, 2, 3, 4, 1] attention_channels: 128 lin_neurons: !ref # Classifier based on cosine distance classifier: !new:speechbrain.lobes.models.ECAPA_TDNN.Classifier input_size: !ref out_neurons: !ref modules: compute_features: !ref mean_var_norm: !ref embedding_model: !ref classifier: !ref label_encoder: !new:speechbrain.dataio.encoder.CategoricalEncoder pretrainer: !new:speechbrain.utils.parameter_transfer.Pretrainer loadables: embedding_model: !ref classifier: !ref label_encoder: !ref paths: embedding_model: !ref /embedding_model.ckpt classifier: !ref /classifier.ckpt label_encoder: !ref /accent_encoder.txt