swordi committed on
Commit
b9cdd17
1 Parent(s): add9a0f

Upload 32 files

Browse files
Files changed (32) hide show
  1. dump/22k/xvector/dev/spk_xvector.ark +0 -0
  2. dump/22k/xvector/dev/spk_xvector.scp +8 -0
  3. dump/22k/xvector/test/spk_xvector.ark +0 -0
  4. dump/22k/xvector/test/spk_xvector.scp +8 -0
  5. dump/22k/xvector/train/spk_xvector.ark +0 -0
  6. dump/22k/xvector/train/spk_xvector.scp +8 -0
  7. exp/22k/tts_stats_raw_linear_spectrogram_char/train/feats_stats.npz +3 -0
  8. exp/22k/tts_train+xvector_vits_raw_char_use_wandbtrue_resumetrue_wandb_idvits-ch-ch-char-swissDial/531epoch.pth +3 -0
  9. exp/22k/tts_train+xvector_vits_raw_char_use_wandbtrue_resumetrue_wandb_idvits-ch-ch-char-swissDial/config.yaml +421 -0
  10. exp/22k/tts_train+xvector_vits_raw_char_use_wandbtrue_resumetrue_wandb_idvits-ch-ch-char-swissDial/images/discriminator_backward_time.png +0 -0
  11. exp/22k/tts_train+xvector_vits_raw_char_use_wandbtrue_resumetrue_wandb_idvits-ch-ch-char-swissDial/images/discriminator_fake_loss.png +0 -0
  12. exp/22k/tts_train+xvector_vits_raw_char_use_wandbtrue_resumetrue_wandb_idvits-ch-ch-char-swissDial/images/discriminator_forward_time.png +0 -0
  13. exp/22k/tts_train+xvector_vits_raw_char_use_wandbtrue_resumetrue_wandb_idvits-ch-ch-char-swissDial/images/discriminator_loss.png +0 -0
  14. exp/22k/tts_train+xvector_vits_raw_char_use_wandbtrue_resumetrue_wandb_idvits-ch-ch-char-swissDial/images/discriminator_optim_step_time.png +0 -0
  15. exp/22k/tts_train+xvector_vits_raw_char_use_wandbtrue_resumetrue_wandb_idvits-ch-ch-char-swissDial/images/discriminator_real_loss.png +0 -0
  16. exp/22k/tts_train+xvector_vits_raw_char_use_wandbtrue_resumetrue_wandb_idvits-ch-ch-char-swissDial/images/discriminator_train_time.png +0 -0
  17. exp/22k/tts_train+xvector_vits_raw_char_use_wandbtrue_resumetrue_wandb_idvits-ch-ch-char-swissDial/images/generator_adv_loss.png +0 -0
  18. exp/22k/tts_train+xvector_vits_raw_char_use_wandbtrue_resumetrue_wandb_idvits-ch-ch-char-swissDial/images/generator_backward_time.png +0 -0
  19. exp/22k/tts_train+xvector_vits_raw_char_use_wandbtrue_resumetrue_wandb_idvits-ch-ch-char-swissDial/images/generator_dur_loss.png +0 -0
  20. exp/22k/tts_train+xvector_vits_raw_char_use_wandbtrue_resumetrue_wandb_idvits-ch-ch-char-swissDial/images/generator_feat_match_loss.png +0 -0
  21. exp/22k/tts_train+xvector_vits_raw_char_use_wandbtrue_resumetrue_wandb_idvits-ch-ch-char-swissDial/images/generator_forward_time.png +0 -0
  22. exp/22k/tts_train+xvector_vits_raw_char_use_wandbtrue_resumetrue_wandb_idvits-ch-ch-char-swissDial/images/generator_kl_loss.png +0 -0
  23. exp/22k/tts_train+xvector_vits_raw_char_use_wandbtrue_resumetrue_wandb_idvits-ch-ch-char-swissDial/images/generator_loss.png +0 -0
  24. exp/22k/tts_train+xvector_vits_raw_char_use_wandbtrue_resumetrue_wandb_idvits-ch-ch-char-swissDial/images/generator_mel_loss.png +0 -0
  25. exp/22k/tts_train+xvector_vits_raw_char_use_wandbtrue_resumetrue_wandb_idvits-ch-ch-char-swissDial/images/generator_optim_step_time.png +0 -0
  26. exp/22k/tts_train+xvector_vits_raw_char_use_wandbtrue_resumetrue_wandb_idvits-ch-ch-char-swissDial/images/generator_train_time.png +0 -0
  27. exp/22k/tts_train+xvector_vits_raw_char_use_wandbtrue_resumetrue_wandb_idvits-ch-ch-char-swissDial/images/gpu_max_cached_mem_GB.png +0 -0
  28. exp/22k/tts_train+xvector_vits_raw_char_use_wandbtrue_resumetrue_wandb_idvits-ch-ch-char-swissDial/images/iter_time.png +0 -0
  29. exp/22k/tts_train+xvector_vits_raw_char_use_wandbtrue_resumetrue_wandb_idvits-ch-ch-char-swissDial/images/optim0_lr0.png +0 -0
  30. exp/22k/tts_train+xvector_vits_raw_char_use_wandbtrue_resumetrue_wandb_idvits-ch-ch-char-swissDial/images/optim1_lr0.png +0 -0
  31. exp/22k/tts_train+xvector_vits_raw_char_use_wandbtrue_resumetrue_wandb_idvits-ch-ch-char-swissDial/images/train_time.png +0 -0
  32. meta.yaml +8 -0
dump/22k/xvector/dev/spk_xvector.ark ADDED
Binary file (16.5 kB). View file
 
dump/22k/xvector/dev/spk_xvector.scp ADDED
@@ -0,0 +1,8 @@
 
 
 
 
 
 
 
 
 
1
+ ag dump/22k/xvector/dev/spk_xvector.ark:3
2
+ be dump/22k/xvector/dev/spk_xvector.ark:2064
3
+ bs dump/22k/xvector/dev/spk_xvector.ark:4125
4
+ gr dump/22k/xvector/dev/spk_xvector.ark:6186
5
+ lu dump/22k/xvector/dev/spk_xvector.ark:8247
6
+ sg dump/22k/xvector/dev/spk_xvector.ark:10308
7
+ vs dump/22k/xvector/dev/spk_xvector.ark:12369
8
+ zh dump/22k/xvector/dev/spk_xvector.ark:14430
dump/22k/xvector/test/spk_xvector.ark ADDED
Binary file (16.5 kB). View file
 
dump/22k/xvector/test/spk_xvector.scp ADDED
@@ -0,0 +1,8 @@
 
 
 
 
 
 
 
 
 
1
+ ag dump/22k/xvector/test/spk_xvector.ark:3
2
+ be dump/22k/xvector/test/spk_xvector.ark:2064
3
+ bs dump/22k/xvector/test/spk_xvector.ark:4125
4
+ gr dump/22k/xvector/test/spk_xvector.ark:6186
5
+ lu dump/22k/xvector/test/spk_xvector.ark:8247
6
+ sg dump/22k/xvector/test/spk_xvector.ark:10308
7
+ vs dump/22k/xvector/test/spk_xvector.ark:12369
8
+ zh dump/22k/xvector/test/spk_xvector.ark:14430
dump/22k/xvector/train/spk_xvector.ark ADDED
Binary file (16.5 kB). View file
 
dump/22k/xvector/train/spk_xvector.scp ADDED
@@ -0,0 +1,8 @@
 
 
 
 
 
 
 
 
 
1
+ ag dump/22k/xvector/train/spk_xvector.ark:3
2
+ be dump/22k/xvector/train/spk_xvector.ark:2064
3
+ bs dump/22k/xvector/train/spk_xvector.ark:4125
4
+ gr dump/22k/xvector/train/spk_xvector.ark:6186
5
+ lu dump/22k/xvector/train/spk_xvector.ark:8247
6
+ sg dump/22k/xvector/train/spk_xvector.ark:10308
7
+ vs dump/22k/xvector/train/spk_xvector.ark:12369
8
+ zh dump/22k/xvector/train/spk_xvector.ark:14430
exp/22k/tts_stats_raw_linear_spectrogram_char/train/feats_stats.npz ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:32505e8615c5b8d0714fae280e0f87f4c1167ce606fb8974d8107e37b2819435
3
+ size 4866
exp/22k/tts_train+xvector_vits_raw_char_use_wandbtrue_resumetrue_wandb_idvits-ch-ch-char-swissDial/531epoch.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d4f95732c07f1d6072f34a50cbab463b59720736f03b0612458a8fa9544477e4
3
+ size 386482802
exp/22k/tts_train+xvector_vits_raw_char_use_wandbtrue_resumetrue_wandb_idvits-ch-ch-char-swissDial/config.yaml ADDED
@@ -0,0 +1,421 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ config: ./conf/tuning/train+xvector_vits.yaml
2
+ print_config: false
3
+ log_level: INFO
4
+ dry_run: false
5
+ iterator_type: sequence
6
+ output_dir: exp/22k/tts_train+xvector_vits_raw_char_use_wandbtrue_resumetrue_wandb_idvits-ch-ch-char-swissDial
7
+ ngpu: 1
8
+ seed: 777
9
+ num_workers: 4
10
+ num_att_plot: 3
11
+ dist_backend: nccl
12
+ dist_init_method: env://
13
+ dist_world_size: 4
14
+ dist_rank: 0
15
+ local_rank: 0
16
+ dist_master_addr: localhost
17
+ dist_master_port: 50305
18
+ dist_launcher: null
19
+ multiprocessing_distributed: true
20
+ unused_parameters: true
21
+ sharded_ddp: false
22
+ cudnn_enabled: true
23
+ cudnn_benchmark: false
24
+ cudnn_deterministic: false
25
+ collect_stats: false
26
+ write_collected_feats: false
27
+ max_epoch: 1000
28
+ patience: null
29
+ val_scheduler_criterion:
30
+ - valid
31
+ - loss
32
+ early_stopping_criterion:
33
+ - valid
34
+ - loss
35
+ - min
36
+ best_model_criterion:
37
+ - - train
38
+ - total_count
39
+ - max
40
+ keep_nbest_models: 10
41
+ nbest_averaging_interval: 0
42
+ grad_clip: -1
43
+ grad_clip_type: 2.0
44
+ grad_noise: false
45
+ accum_grad: 1
46
+ no_forward_run: false
47
+ resume: true
48
+ train_dtype: float32
49
+ use_amp: false
50
+ log_interval: 50
51
+ use_matplotlib: true
52
+ use_tensorboard: true
53
+ use_wandb: true
54
+ wandb_project: null
55
+ wandb_id: vits-ch-ch-char-swissDial
56
+ wandb_entity: null
57
+ wandb_name: null
58
+ wandb_model_log_interval: -1
59
+ detect_anomaly: false
60
+ pretrain_path: null
61
+ init_param: []
62
+ ignore_init_mismatch: false
63
+ freeze_param: []
64
+ num_iters_per_epoch: 1000
65
+ batch_size: 20
66
+ valid_batch_size: null
67
+ batch_bins: 5000000
68
+ valid_batch_bins: null
69
+ train_shape_file:
70
+ - exp/22k/tts_stats_raw_linear_spectrogram_char/train/text_shape.char
71
+ - exp/22k/tts_stats_raw_linear_spectrogram_char/train/speech_shape
72
+ valid_shape_file:
73
+ - exp/22k/tts_stats_raw_linear_spectrogram_char/valid/text_shape.char
74
+ - exp/22k/tts_stats_raw_linear_spectrogram_char/valid/speech_shape
75
+ batch_type: numel
76
+ valid_batch_type: null
77
+ fold_length:
78
+ - 150
79
+ - 204800
80
+ sort_in_batch: descending
81
+ sort_batch: descending
82
+ multiple_iterator: false
83
+ chunk_length: 500
84
+ chunk_shift_ratio: 0.5
85
+ num_cache_chunks: 1024
86
+ train_data_path_and_name_and_type:
87
+ - - dump/22k/raw/train/text
88
+ - text
89
+ - text
90
+ - - dump/22k/raw/train/wav.scp
91
+ - speech
92
+ - sound
93
+ - - dump/22k/xvector/train/xvector.scp
94
+ - spembs
95
+ - kaldi_ark
96
+ valid_data_path_and_name_and_type:
97
+ - - dump/22k/raw/dev/text
98
+ - text
99
+ - text
100
+ - - dump/22k/raw/dev/wav.scp
101
+ - speech
102
+ - sound
103
+ - - dump/22k/xvector/dev/xvector.scp
104
+ - spembs
105
+ - kaldi_ark
106
+ allow_variable_data_keys: false
107
+ max_cache_size: 0.0
108
+ max_cache_fd: 32
109
+ valid_max_cache_size: null
110
+ optim: adamw
111
+ optim_conf:
112
+ lr: 0.0002
113
+ betas:
114
+ - 0.8
115
+ - 0.99
116
+ eps: 1.0e-09
117
+ weight_decay: 0.0
118
+ scheduler: exponentiallr
119
+ scheduler_conf:
120
+ gamma: 0.999875
121
+ optim2: adamw
122
+ optim2_conf:
123
+ lr: 0.0002
124
+ betas:
125
+ - 0.8
126
+ - 0.99
127
+ eps: 1.0e-09
128
+ weight_decay: 0.0
129
+ scheduler2: exponentiallr
130
+ scheduler2_conf:
131
+ gamma: 0.999875
132
+ generator_first: false
133
+ token_list:
134
+ - <blank>
135
+ - <unk>
136
+ - <space>
137
+ - e
138
+ - i
139
+ - r
140
+ - s
141
+ - t
142
+ - a
143
+ - n
144
+ - h
145
+ - d
146
+ - l
147
+ - o
148
+ - u
149
+ - c
150
+ - g
151
+ - m
152
+ - .
153
+ - b
154
+ - f
155
+ - ä
156
+ - w
157
+ - z
158
+ - k
159
+ - v
160
+ - ü
161
+ - S
162
+ - p
163
+ - ','
164
+ - D
165
+ - ö
166
+ - B
167
+ - A
168
+ - M
169
+ - E
170
+ - W
171
+ - G
172
+ - F
173
+ - P
174
+ - I
175
+ - K
176
+ - T
177
+ - R
178
+ - H
179
+ - L
180
+ - V
181
+ - N
182
+ - U
183
+ - C
184
+ - Z
185
+ - '0'
186
+ - '-'
187
+ - J
188
+ - ''''
189
+ - '"'
190
+ - j
191
+ - O
192
+ - y
193
+ - '1'
194
+ - '2'
195
+ - x
196
+ - Ä
197
+ - '9'
198
+ - '?'
199
+ - '5'
200
+ - ':'
201
+ - '3'
202
+ - '6'
203
+ - '8'
204
+ - '7'
205
+ - '4'
206
+ - Ü
207
+ - q
208
+ - Ö
209
+ - Q
210
+ - '!'
211
+ - Y
212
+ - X
213
+ - /
214
+ - ;
215
+ - é
216
+ - ’
217
+ - –
218
+ - è
219
+ - ê
220
+ - ç
221
+ - )
222
+ - à
223
+ - (
224
+ - '&'
225
+ - â
226
+ - '%'
227
+ - «
228
+ - »
229
+ - _
230
+ - ß
231
+ - ô
232
+ - ñ
233
+ - ë
234
+ - ò
235
+ - ã
236
+ - ï
237
+ - ‘
238
+ - <sos/eos>
239
+ odim: null
240
+ model_conf: {}
241
+ use_preprocessor: true
242
+ token_type: char
243
+ bpemodel: null
244
+ non_linguistic_symbols: null
245
+ cleaner: null
246
+ g2p: null
247
+ feats_extract: linear_spectrogram
248
+ feats_extract_conf:
249
+ n_fft: 1024
250
+ hop_length: 256
251
+ win_length: null
252
+ normalize: null
253
+ normalize_conf: {}
254
+ tts: vits
255
+ tts_conf:
256
+ generator_type: vits_generator
257
+ generator_params:
258
+ hidden_channels: 192
259
+ spks: -1
260
+ spk_embed_dim: 512
261
+ global_channels: 256
262
+ segment_size: 32
263
+ text_encoder_attention_heads: 2
264
+ text_encoder_ffn_expand: 4
265
+ text_encoder_blocks: 6
266
+ text_encoder_positionwise_layer_type: conv1d
267
+ text_encoder_positionwise_conv_kernel_size: 3
268
+ text_encoder_positional_encoding_layer_type: rel_pos
269
+ text_encoder_self_attention_layer_type: rel_selfattn
270
+ text_encoder_activation_type: swish
271
+ text_encoder_normalize_before: true
272
+ text_encoder_dropout_rate: 0.1
273
+ text_encoder_positional_dropout_rate: 0.0
274
+ text_encoder_attention_dropout_rate: 0.1
275
+ use_macaron_style_in_text_encoder: true
276
+ use_conformer_conv_in_text_encoder: false
277
+ text_encoder_conformer_kernel_size: -1
278
+ decoder_kernel_size: 7
279
+ decoder_channels: 512
280
+ decoder_upsample_scales:
281
+ - 8
282
+ - 8
283
+ - 2
284
+ - 2
285
+ decoder_upsample_kernel_sizes:
286
+ - 16
287
+ - 16
288
+ - 4
289
+ - 4
290
+ decoder_resblock_kernel_sizes:
291
+ - 3
292
+ - 7
293
+ - 11
294
+ decoder_resblock_dilations:
295
+ - - 1
296
+ - 3
297
+ - 5
298
+ - - 1
299
+ - 3
300
+ - 5
301
+ - - 1
302
+ - 3
303
+ - 5
304
+ use_weight_norm_in_decoder: true
305
+ posterior_encoder_kernel_size: 5
306
+ posterior_encoder_layers: 16
307
+ posterior_encoder_stacks: 1
308
+ posterior_encoder_base_dilation: 1
309
+ posterior_encoder_dropout_rate: 0.0
310
+ use_weight_norm_in_posterior_encoder: true
311
+ flow_flows: 4
312
+ flow_kernel_size: 5
313
+ flow_base_dilation: 1
314
+ flow_layers: 4
315
+ flow_dropout_rate: 0.0
316
+ use_weight_norm_in_flow: true
317
+ use_only_mean_in_flow: true
318
+ stochastic_duration_predictor_kernel_size: 3
319
+ stochastic_duration_predictor_dropout_rate: 0.5
320
+ stochastic_duration_predictor_flows: 4
321
+ stochastic_duration_predictor_dds_conv_layers: 3
322
+ vocabs: 105
323
+ aux_channels: 513
324
+ discriminator_type: hifigan_multi_scale_multi_period_discriminator
325
+ discriminator_params:
326
+ scales: 1
327
+ scale_downsample_pooling: AvgPool1d
328
+ scale_downsample_pooling_params:
329
+ kernel_size: 4
330
+ stride: 2
331
+ padding: 2
332
+ scale_discriminator_params:
333
+ in_channels: 1
334
+ out_channels: 1
335
+ kernel_sizes:
336
+ - 15
337
+ - 41
338
+ - 5
339
+ - 3
340
+ channels: 128
341
+ max_downsample_channels: 1024
342
+ max_groups: 16
343
+ bias: true
344
+ downsample_scales:
345
+ - 2
346
+ - 2
347
+ - 4
348
+ - 4
349
+ - 1
350
+ nonlinear_activation: LeakyReLU
351
+ nonlinear_activation_params:
352
+ negative_slope: 0.1
353
+ use_weight_norm: true
354
+ use_spectral_norm: false
355
+ follow_official_norm: false
356
+ periods:
357
+ - 2
358
+ - 3
359
+ - 5
360
+ - 7
361
+ - 11
362
+ period_discriminator_params:
363
+ in_channels: 1
364
+ out_channels: 1
365
+ kernel_sizes:
366
+ - 5
367
+ - 3
368
+ channels: 32
369
+ downsample_scales:
370
+ - 3
371
+ - 3
372
+ - 3
373
+ - 3
374
+ - 1
375
+ max_downsample_channels: 1024
376
+ bias: true
377
+ nonlinear_activation: LeakyReLU
378
+ nonlinear_activation_params:
379
+ negative_slope: 0.1
380
+ use_weight_norm: true
381
+ use_spectral_norm: false
382
+ generator_adv_loss_params:
383
+ average_by_discriminators: false
384
+ loss_type: mse
385
+ discriminator_adv_loss_params:
386
+ average_by_discriminators: false
387
+ loss_type: mse
388
+ feat_match_loss_params:
389
+ average_by_discriminators: false
390
+ average_by_layers: false
391
+ include_final_outputs: true
392
+ mel_loss_params:
393
+ fs: 22050
394
+ n_fft: 1024
395
+ hop_length: 256
396
+ win_length: null
397
+ window: hann
398
+ n_mels: 80
399
+ fmin: 0
400
+ fmax: null
401
+ log_base: null
402
+ lambda_adv: 1.0
403
+ lambda_mel: 45.0
404
+ lambda_feat_match: 2.0
405
+ lambda_dur: 1.0
406
+ lambda_kl: 1.0
407
+ sampling_rate: 22050
408
+ cache_generator_outputs: true
409
+ pitch_extract: null
410
+ pitch_extract_conf: {}
411
+ pitch_normalize: null
412
+ pitch_normalize_conf: {}
413
+ energy_extract: null
414
+ energy_extract_conf: {}
415
+ energy_normalize: null
416
+ energy_normalize_conf: {}
417
+ required:
418
+ - output_dir
419
+ - token_list
420
+ version: 0.10.7a1
421
+ distributed: true
exp/22k/tts_train+xvector_vits_raw_char_use_wandbtrue_resumetrue_wandb_idvits-ch-ch-char-swissDial/images/discriminator_backward_time.png ADDED
exp/22k/tts_train+xvector_vits_raw_char_use_wandbtrue_resumetrue_wandb_idvits-ch-ch-char-swissDial/images/discriminator_fake_loss.png ADDED
exp/22k/tts_train+xvector_vits_raw_char_use_wandbtrue_resumetrue_wandb_idvits-ch-ch-char-swissDial/images/discriminator_forward_time.png ADDED
exp/22k/tts_train+xvector_vits_raw_char_use_wandbtrue_resumetrue_wandb_idvits-ch-ch-char-swissDial/images/discriminator_loss.png ADDED
exp/22k/tts_train+xvector_vits_raw_char_use_wandbtrue_resumetrue_wandb_idvits-ch-ch-char-swissDial/images/discriminator_optim_step_time.png ADDED
exp/22k/tts_train+xvector_vits_raw_char_use_wandbtrue_resumetrue_wandb_idvits-ch-ch-char-swissDial/images/discriminator_real_loss.png ADDED
exp/22k/tts_train+xvector_vits_raw_char_use_wandbtrue_resumetrue_wandb_idvits-ch-ch-char-swissDial/images/discriminator_train_time.png ADDED
exp/22k/tts_train+xvector_vits_raw_char_use_wandbtrue_resumetrue_wandb_idvits-ch-ch-char-swissDial/images/generator_adv_loss.png ADDED
exp/22k/tts_train+xvector_vits_raw_char_use_wandbtrue_resumetrue_wandb_idvits-ch-ch-char-swissDial/images/generator_backward_time.png ADDED
exp/22k/tts_train+xvector_vits_raw_char_use_wandbtrue_resumetrue_wandb_idvits-ch-ch-char-swissDial/images/generator_dur_loss.png ADDED
exp/22k/tts_train+xvector_vits_raw_char_use_wandbtrue_resumetrue_wandb_idvits-ch-ch-char-swissDial/images/generator_feat_match_loss.png ADDED
exp/22k/tts_train+xvector_vits_raw_char_use_wandbtrue_resumetrue_wandb_idvits-ch-ch-char-swissDial/images/generator_forward_time.png ADDED
exp/22k/tts_train+xvector_vits_raw_char_use_wandbtrue_resumetrue_wandb_idvits-ch-ch-char-swissDial/images/generator_kl_loss.png ADDED
exp/22k/tts_train+xvector_vits_raw_char_use_wandbtrue_resumetrue_wandb_idvits-ch-ch-char-swissDial/images/generator_loss.png ADDED
exp/22k/tts_train+xvector_vits_raw_char_use_wandbtrue_resumetrue_wandb_idvits-ch-ch-char-swissDial/images/generator_mel_loss.png ADDED
exp/22k/tts_train+xvector_vits_raw_char_use_wandbtrue_resumetrue_wandb_idvits-ch-ch-char-swissDial/images/generator_optim_step_time.png ADDED
exp/22k/tts_train+xvector_vits_raw_char_use_wandbtrue_resumetrue_wandb_idvits-ch-ch-char-swissDial/images/generator_train_time.png ADDED
exp/22k/tts_train+xvector_vits_raw_char_use_wandbtrue_resumetrue_wandb_idvits-ch-ch-char-swissDial/images/gpu_max_cached_mem_GB.png ADDED
exp/22k/tts_train+xvector_vits_raw_char_use_wandbtrue_resumetrue_wandb_idvits-ch-ch-char-swissDial/images/iter_time.png ADDED
exp/22k/tts_train+xvector_vits_raw_char_use_wandbtrue_resumetrue_wandb_idvits-ch-ch-char-swissDial/images/optim0_lr0.png ADDED
exp/22k/tts_train+xvector_vits_raw_char_use_wandbtrue_resumetrue_wandb_idvits-ch-ch-char-swissDial/images/optim1_lr0.png ADDED
exp/22k/tts_train+xvector_vits_raw_char_use_wandbtrue_resumetrue_wandb_idvits-ch-ch-char-swissDial/images/train_time.png ADDED
meta.yaml ADDED
@@ -0,0 +1,8 @@
 
 
 
 
 
 
 
 
 
1
+ espnet: 0.10.7a1
2
+ files:
3
+ model_file: exp/22k/tts_train+xvector_vits_raw_char_use_wandbtrue_resumetrue_wandb_idvits-ch-ch-char-swissDial/531epoch.pth
4
+ python: "3.8.13 (default, Mar 28 2022, 11:38:47) \n[GCC 7.5.0]"
5
+ timestamp: 1669995093.126856
6
+ torch: 1.10.1+cu113
7
+ yaml_files:
8
+ train_config: exp/22k/tts_train+xvector_vits_raw_char_use_wandbtrue_resumetrue_wandb_idvits-ch-ch-char-swissDial/config.yaml