Rongjiehuang committed on
Commit
8cbdd7d
1 Parent(s): 4b82ff1
egs/egs_bases/tts/vocoder/hifigan.yaml ADDED
@@ -0,0 +1,38 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ base_config: ./base.yaml
2
+ task_cls: tasks.vocoder.hifigan.HifiGanTask
3
+ resblock: "1"
4
+ adam_b1: 0.8
5
+ adam_b2: 0.99
6
+ upsample_rates: [ 8,8,2,2 ]
7
+ upsample_kernel_sizes: [ 16,16,4,4 ]
8
+ upsample_initial_channel: 512
9
+ resblock_kernel_sizes: [ 3,7,11 ]
10
+ resblock_dilation_sizes: [ [ 1,3,5 ], [ 1,3,5 ], [ 1,3,5 ] ]
11
+
12
+ use_pitch_embed: false
13
+ use_fm_loss: false
14
+ use_spec_disc: false
15
+ use_cdisc: false
16
+ use_ms_stft: false
17
+ use_cond_disc: false
18
+
19
+ lambda_mel: 5.0
20
+ lambda_mel_adv: 1.0
21
+ lambda_cdisc: 4.0
22
+ lambda_adv: 1.0
23
+
24
+ max_samples: 8192
25
+ max_sentences: 24
26
+
27
+ aux_context_window: 0 # Context window size for auxiliary feature.
28
+ generator_optimizer_params:
29
+   lr: 0.0002 # Generator's learning rate.
30
+ generator_scheduler_params:
31
+   step_size: 600
32
+   gamma: 0.999
33
+ discriminator_optimizer_params:
34
+   lr: 0.0002 # Discriminator's learning rate.
35
+ discriminator_scheduler_params:
36
+   step_size: 600
37
+   gamma: 0.999
38
+ max_updates: 3000000