bayartsogt committed on
Commit
2587880
1 Parent(s): f8da4c9
Files changed (8) hide show
  1. README.md +17 -0
  2. config.yaml +24 -0
  3. gcmvn_stats.npz +0 -0
  4. pytorch_model.pt +3 -0
  5. speakers.txt +1 -0
  6. spm_char.model +3 -0
  7. spm_char.txt +40 -0
  8. spm_char.vocab +44 -0
README.md ADDED
@@ -0,0 +1,17 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ---
2
+ library_name: fairseq
3
+ task: text-to-speech
4
+ tags:
5
+ - fairseq
6
+ - audio
7
+ - text-to-speech
8
+ language: mn
9
+ datasets:
10
+ - mbspeech
11
+ ---
12
+ # tts_transformer-mn-mbspeech
13
+ [Transformer](https://arxiv.org/abs/1809.08895) text-to-speech model from fairseq S^2 ([paper](https://arxiv.org/abs/2109.06912)/[code](https://github.com/pytorch/fairseq/tree/main/examples/speech_synthesis)):
14
+ - Mongolian
15
+ - Single-speaker male voice
16
+ - Trained on [MBSpeech](https://github.com/tugstugi/mongolian-nlp/blob/master/datasets/MBSpeech-1.0-csv.zip)
17
+
config.yaml ADDED
@@ -0,0 +1,24 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ bpe_tokenizer:
2
+ bpe: sentencepiece
3
+ sentencepiece_model: spm_char.model
4
+ features:
5
+ eps: 1.0e-05
6
+ f_max: 8000
7
+ f_min: 20
8
+ hop_len_t: 0.011609977324263039
9
+ hop_length: 256
10
+ n_fft: 1024
11
+ n_mels: 80
12
+ n_stft: 513
13
+ sample_rate: 22050
14
+ type: spectrogram+melscale+log
15
+ win_len_t: 0.046439909297052155
16
+ win_length: 1024
17
+ window_fn: hann
18
+ global_cmvn:
19
+ stats_npz_path: gcmvn_stats.npz
20
+ sample_rate: 22050
21
+ transforms:
22
+ '*':
23
+ - global_cmvn
24
+ vocab_filename: spm_char.txt
gcmvn_stats.npz ADDED
Binary file (1.14 kB). View file
 
pytorch_model.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cb65454af66ec96eef3825fab2a9fd66ed604282eba7c0c4b34e7306ce0b8730
3
+ size 652966179
speakers.txt ADDED
@@ -0,0 +1 @@
 
 
1
+ mbspeech
spm_char.model ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8c3ac7e7fcce150657c687f1bb3d5980bd7ce97d632540b4c1334064426d4e47
3
+ size 238217
spm_char.txt ADDED
@@ -0,0 +1,40 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ▁ 1
2
+ а 1
3
+ н 1
4
+ э 1
5
+ г 1
6
+ р 1
7
+ и 1
8
+ д 1
9
+ х 1
10
+ л 1
11
+ ү 1
12
+ т 1
13
+ о 1
14
+ й 1
15
+ у 1
16
+ ө 1
17
+ с 1
18
+ б 1
19
+ м 1
20
+ в 1
21
+ . 1
22
+ ч 1
23
+ з 1
24
+ ж 1
25
+ ы 1
26
+ е 1
27
+ , 1
28
+ ь 1
29
+ ш 1
30
+ ц 1
31
+ я 1
32
+ ю 1
33
+ ё 1
34
+ к 1
35
+ ф 1
36
+ п 1
37
+ ! 1
38
+ ? 1
39
+ ъ 1
40
+ щ 1
spm_char.vocab ADDED
@@ -0,0 +1,44 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ <s> 0
2
+ <pad> 0
3
+ </s> 0
4
+ <unk> 0
5
+ ▁ -1.87835
6
+ а -2.3376
7
+ н -2.66474
8
+ э -2.67631
9
+ г -3.00228
10
+ р -3.081
11
+ и -3.1159
12
+ д -3.1658
13
+ х -3.2745
14
+ л -3.31839
15
+ ү -3.36249
16
+ т -3.43907
17
+ о -3.4786
18
+ й -3.4863
19
+ у -3.49546
20
+ ө -3.78138
21
+ с -3.79323
22
+ б -3.79863
23
+ м -4.01439
24
+ в -4.19775
25
+ . -4.37665
26
+ ч -4.46334
27
+ з -4.52161
28
+ ж -4.64295
29
+ ы -4.76725
30
+ е -4.81287
31
+ , -4.81325
32
+ ь -4.84147
33
+ ш -5.19829
34
+ ц -5.46254
35
+ я -5.75058
36
+ ю -6.61326
37
+ ё -6.61552
38
+ к -6.68832
39
+ ф -6.75376
40
+ п -7.32121
41
+ ! -8.05174
42
+ ? -8.05174
43
+ ъ -9.32131
44
+ щ -13.3988