Roh committed on
Commit
7724395
1 Parent(s): 70f828b

add model files

Browse files
exp/tts_stats_raw_phn_tacotron_g2p_en_no_space/train/feats_stats.npz ADDED
Binary file (1.4 kB). View file
exp/tts_train_raw_phn_tacotron_g2p_en_no_space/200epoch.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a9ee619851c566303464627625421917999ea9f6ea9fa0e229cb6cea7f8869ae
3
+ size 106844004
exp/tts_train_raw_phn_tacotron_g2p_en_no_space/checkpoint.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:32f3aab15b36c7c7fc78b6134408ebc28d2292b9297ae556e2a2647b926e062d
3
+ size 320276378
exp/tts_train_raw_phn_tacotron_g2p_en_no_space/config.yaml ADDED
@@ -0,0 +1,242 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ config: conf/train.yaml
2
+ print_config: false
3
+ log_level: INFO
4
+ dry_run: false
5
+ iterator_type: sequence
6
+ output_dir: exp/tts_train_raw_phn_tacotron_g2p_en_no_space
7
+ ngpu: 1
8
+ seed: 0
9
+ num_workers: 1
10
+ num_att_plot: 3
11
+ dist_backend: nccl
12
+ dist_init_method: env://
13
+ dist_world_size: null
14
+ dist_rank: null
15
+ local_rank: 0
16
+ dist_master_addr: null
17
+ dist_master_port: null
18
+ dist_launcher: null
19
+ multiprocessing_distributed: false
20
+ cudnn_enabled: true
21
+ cudnn_benchmark: false
22
+ cudnn_deterministic: true
23
+ collect_stats: false
24
+ write_collected_feats: false
25
+ max_epoch: 200
26
+ patience: null
27
+ val_scheduler_criterion:
28
+ - valid
29
+ - loss
30
+ early_stopping_criterion:
31
+ - valid
32
+ - loss
33
+ - min
34
+ best_model_criterion:
35
+ - - valid
36
+ - loss
37
+ - min
38
+ - - train
39
+ - loss
40
+ - min
41
+ keep_nbest_models: 5
42
+ grad_clip: 1.0
43
+ grad_clip_type: 2.0
44
+ grad_noise: false
45
+ accum_grad: 1
46
+ no_forward_run: false
47
+ resume: true
48
+ train_dtype: float32
49
+ use_amp: false
50
+ log_interval: null
51
+ pretrain_path: []
52
+ pretrain_key: []
53
+ num_iters_per_epoch: 500
54
+ batch_size: 20
55
+ valid_batch_size: null
56
+ batch_bins: 5120000
57
+ valid_batch_bins: null
58
+ train_shape_file:
59
+ - exp/tts_stats_raw_phn_tacotron_g2p_en_no_space/train/text_shape.phn
60
+ - exp/tts_stats_raw_phn_tacotron_g2p_en_no_space/train/speech_shape
61
+ valid_shape_file:
62
+ - exp/tts_stats_raw_phn_tacotron_g2p_en_no_space/valid/text_shape.phn
63
+ - exp/tts_stats_raw_phn_tacotron_g2p_en_no_space/valid/speech_shape
64
+ batch_type: numel
65
+ valid_batch_type: null
66
+ fold_length:
67
+ - 150
68
+ - 204800
69
+ sort_in_batch: descending
70
+ sort_batch: descending
71
+ multiple_iterator: false
72
+ chunk_length: 500
73
+ chunk_shift_ratio: 0.5
74
+ num_cache_chunks: 1024
75
+ train_data_path_and_name_and_type:
76
+ - - dump/raw/tr_no_dev/text
77
+ - text
78
+ - text
79
+ - - dump/raw/tr_no_dev/wav.scp
80
+ - speech
81
+ - sound
82
+ valid_data_path_and_name_and_type:
83
+ - - dump/raw/dev/text
84
+ - text
85
+ - text
86
+ - - dump/raw/dev/wav.scp
87
+ - speech
88
+ - sound
89
+ allow_variable_data_keys: false
90
+ max_cache_size: 0.0
91
+ max_cache_fd: 32
92
+ valid_max_cache_size: null
93
+ optim: adam
94
+ optim_conf:
95
+ lr: 0.001
96
+ eps: 1.0e-06
97
+ weight_decay: 0.0
98
+ scheduler: null
99
+ scheduler_conf: {}
100
+ token_list:
101
+ - <blank>
102
+ - <unk>
103
+ - AH0
104
+ - T
105
+ - N
106
+ - S
107
+ - R
108
+ - D
109
+ - L
110
+ - K
111
+ - IH1
112
+ - M
113
+ - EH1
114
+ - Z
115
+ - DH
116
+ - UW1
117
+ - AE1
118
+ - IH0
119
+ - AY1
120
+ - AH1
121
+ - W
122
+ - .
123
+ - P
124
+ - F
125
+ - IY1
126
+ - V
127
+ - ER0
128
+ - AA1
129
+ - B
130
+ - AO1
131
+ - HH
132
+ - EY1
133
+ - IY0
134
+ - ','
135
+ - Y
136
+ - NG
137
+ - OW1
138
+ - G
139
+ - AW1
140
+ - TH
141
+ - SH
142
+ - UH1
143
+ - '?'
144
+ - ER1
145
+ - JH
146
+ - CH
147
+ - OW0
148
+ - OW2
149
+ - EH2
150
+ - IH2
151
+ - EY2
152
+ - AA2
153
+ - AE2
154
+ - AY2
155
+ - ''''
156
+ - OY1
157
+ - UW0
158
+ - '!'
159
+ - AO2
160
+ - EH0
161
+ - ZH
162
+ - AH2
163
+ - AE0
164
+ - UW2
165
+ - AA0
166
+ - AY0
167
+ - IY2
168
+ - AW2
169
+ - AO0
170
+ - EY0
171
+ - ER2
172
+ - UH2
173
+ - '...'
174
+ - AW0
175
+ - UH0
176
+ - OY2
177
+ - <sos/eos>
178
+ odim: null
179
+ model_conf: {}
180
+ use_preprocessor: true
181
+ token_type: phn
182
+ bpemodel: null
183
+ non_linguistic_symbols: null
184
+ cleaner: tacotron
185
+ g2p: g2p_en_no_space
186
+ feats_extract: fbank
187
+ feats_extract_conf:
188
+ fs: 22050
189
+ fmin: 80
190
+ fmax: 7600
191
+ n_mels: 80
192
+ hop_length: 256
193
+ n_fft: 1024
194
+ win_length: null
195
+ normalize: global_mvn
196
+ normalize_conf:
197
+ stats_file: exp/tts_stats_raw_phn_tacotron_g2p_en_no_space/train/feats_stats.npz
198
+ tts: tacotron2
199
+ tts_conf:
200
+ embed_dim: 512
201
+ elayers: 1
202
+ eunits: 512
203
+ econv_layers: 3
204
+ econv_chans: 512
205
+ econv_filts: 5
206
+ atype: location
207
+ adim: 512
208
+ aconv_chans: 32
209
+ aconv_filts: 15
210
+ cumulate_att_w: true
211
+ dlayers: 2
212
+ dunits: 1024
213
+ prenet_layers: 2
214
+ prenet_units: 256
215
+ postnet_layers: 5
216
+ postnet_chans: 512
217
+ postnet_filts: 5
218
+ output_activation: null
219
+ use_batch_norm: true
220
+ use_concate: true
221
+ use_residual: false
222
+ dropout_rate: 0.5
223
+ zoneout_rate: 0.1
224
+ reduction_factor: 1
225
+ spk_embed_dim: null
226
+ use_masking: true
227
+ bce_pos_weight: 5.0
228
+ use_guided_attn_loss: true
229
+ guided_attn_loss_sigma: 0.4
230
+ guided_attn_loss_lambda: 1.0
231
+ pitch_extract: null
232
+ pitch_extract_conf: {}
233
+ pitch_normalize: null
234
+ pitch_normalize_conf: {}
235
+ energy_extract: null
236
+ energy_extract_conf: {}
237
+ energy_normalize: null
238
+ energy_normalize_conf: {}
239
+ required:
240
+ - output_dir
241
+ - token_list
242
+ distributed: false