Tanel committed on
Commit
a5a2e80
1 Parent(s): 5665f33

First model version

Browse files
.gitattributes CHANGED
@@ -25,3 +25,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
25
  *.zip filter=lfs diff=lfs merge=lfs -text
26
  *.zstandard filter=lfs diff=lfs merge=lfs -text
27
  *tfevents* filter=lfs diff=lfs merge=lfs -text
 
25
  *.zip filter=lfs diff=lfs merge=lfs -text
26
  *.zstandard filter=lfs diff=lfs merge=lfs -text
27
  *tfevents* filter=lfs diff=lfs merge=lfs -text
28
+ *.ckpt filter=lfs diff=lfs merge=lfs -text
classifier.ckpt ADDED
@@ -0,0 +1,3 @@
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a50d9024ff58d317031c9787d4c6c614d454a87a8ef32f9d36338cd3ff57adbc
3
+ size 762555
embedding_model.ckpt ADDED
@@ -0,0 +1,3 @@
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ab750d5c06d713477045fa798fab5d33e959dbc0dfe4de510a9a47844c79a19a
3
+ size 84474355
hyperparams.yaml ADDED
@@ -0,0 +1,57 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ pretrained_path: TalTechNLP/voxlingua107-epaca-tdnn-ce
2
+
3
+
4
+ # Feature parameters
5
+ n_mels: 60
6
+ left_frames: 0
7
+ right_frames: 0
8
+ deltas: false
9
+
10
+ # Number of output classes (languages; must match the entries in label_encoder.txt)
11
+ out_n_neurons: 107
12
+
13
+ # Functions
14
+ compute_features: !new:speechbrain.lobes.features.Fbank
15
+ n_mels: 60
16
+ left_frames: 0
17
+ right_frames: 0
18
+ deltas: false
19
+
20
+ embedding_model: !new:speechbrain.lobes.models.ECAPA_TDNN.ECAPA_TDNN
21
+ input_size: 60
22
+ channels: [1024, 1024, 1024, 1024, 3072]
23
+ kernel_sizes: [5, 3, 3, 3, 1]
24
+ dilations: [1, 2, 3, 4, 1]
25
+ attention_channels: 128
26
+ lin_neurons: 256
27
+
28
+
29
+ classifier: !new:speechbrain.lobes.models.Xvector.Classifier
30
+ input_shape: [null, null, 256]
31
+ activation: !name:torch.nn.LeakyReLU
32
+ lin_blocks: 1
33
+ lin_neurons: 512
34
+ out_neurons: !ref <out_n_neurons>
35
+
36
+
37
+ mean_var_norm: !new:speechbrain.processing.features.InputNormalization
38
+ norm_type: sentence
39
+ std_norm: false
40
+
41
+ modules:
42
+ compute_features: !ref <compute_features>
43
+ mean_var_norm: !ref <mean_var_norm>
44
+ embedding_model: !ref <embedding_model>
45
+ classifier: !ref <classifier>
46
+
47
+ label_encoder: !new:speechbrain.dataio.encoder.CategoricalEncoder
48
+
49
+ pretrainer: !new:speechbrain.utils.parameter_transfer.Pretrainer
50
+ loadables:
51
+ embedding_model: !ref <embedding_model>
52
+ classifier: !ref <classifier>
53
+ label_encoder: !ref <label_encoder>
54
+ paths:
55
+ embedding_model: !ref <pretrained_path>/embedding_model.ckpt
56
+ classifier: !ref <pretrained_path>/classifier.ckpt
57
+ label_encoder: !ref <pretrained_path>/label_encoder.txt
label_encoder.txt ADDED
@@ -0,0 +1,109 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ 'ab' => 0
2
+ 'af' => 1
3
+ 'am' => 2
4
+ 'ar' => 3
5
+ 'as' => 4
6
+ 'az' => 5
7
+ 'ba' => 6
8
+ 'be' => 7
9
+ 'bg' => 8
10
+ 'bn' => 9
11
+ 'bo' => 10
12
+ 'br' => 11
13
+ 'bs' => 12
14
+ 'ca' => 13
15
+ 'ceb' => 14
16
+ 'cs' => 15
17
+ 'cy' => 16
18
+ 'da' => 17
19
+ 'de' => 18
20
+ 'el' => 19
21
+ 'en' => 20
22
+ 'eo' => 21
23
+ 'es' => 22
24
+ 'et' => 23
25
+ 'eu' => 24
26
+ 'fa' => 25
27
+ 'fi' => 26
28
+ 'fo' => 27
29
+ 'fr' => 28
30
+ 'gl' => 29
31
+ 'gn' => 30
32
+ 'gu' => 31
33
+ 'gv' => 32
34
+ 'ha' => 33
35
+ 'haw' => 34
36
+ 'hi' => 35
37
+ 'hr' => 36
38
+ 'ht' => 37
39
+ 'hu' => 38
40
+ 'hy' => 39
41
+ 'ia' => 40
42
+ 'id' => 41
43
+ 'is' => 42
44
+ 'it' => 43
45
+ 'iw' => 44
46
+ 'ja' => 45
47
+ 'jw' => 46
48
+ 'ka' => 47
49
+ 'kk' => 48
50
+ 'km' => 49
51
+ 'kn' => 50
52
+ 'ko' => 51
53
+ 'la' => 52
54
+ 'lb' => 53
55
+ 'ln' => 54
56
+ 'lo' => 55
57
+ 'lt' => 56
58
+ 'lv' => 57
59
+ 'mg' => 58
60
+ 'mi' => 59
61
+ 'mk' => 60
62
+ 'ml' => 61
63
+ 'mn' => 62
64
+ 'mr' => 63
65
+ 'ms' => 64
66
+ 'mt' => 65
67
+ 'my' => 66
68
+ 'ne' => 67
69
+ 'nl' => 68
70
+ 'nn' => 69
71
+ 'no' => 70
72
+ 'oc' => 71
73
+ 'pa' => 72
74
+ 'pl' => 73
75
+ 'ps' => 74
76
+ 'pt' => 75
77
+ 'ro' => 76
78
+ 'ru' => 77
79
+ 'sa' => 78
80
+ 'sco' => 79
81
+ 'sd' => 80
82
+ 'si' => 81
83
+ 'sk' => 82
84
+ 'sl' => 83
85
+ 'sn' => 84
86
+ 'so' => 85
87
+ 'sq' => 86
88
+ 'sr' => 87
89
+ 'su' => 88
90
+ 'sv' => 89
91
+ 'sw' => 90
92
+ 'ta' => 91
93
+ 'te' => 92
94
+ 'tg' => 93
95
+ 'th' => 94
96
+ 'tk' => 95
97
+ 'tl' => 96
98
+ 'tr' => 97
99
+ 'tt' => 98
100
+ 'uk' => 99
101
+ 'ur' => 100
102
+ 'uz' => 101
103
+ 'vi' => 102
104
+ 'war' => 103
105
+ 'yi' => 104
106
+ 'yo' => 105
107
+ 'zh' => 106
108
+ ================
109
+ 'starting_index' => 0
normalizer.ckpt ADDED
@@ -0,0 +1,3 @@
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c369e01dfa2e0d84c6b116f33c7b94f1fe28c061642086538e93cde3d97c26ef
3
+ size 1063