File size: 1,147 Bytes
4451360
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44

# Path of the model weights (.pth) to restore.
# Exactly one `restore_model` entry may be active; the alternatives are:
#   restore_model: ''   # empty string (presumably "restore nothing" - confirm in the training script)
#   restore_model: ./checkpoints/exp_fp_adv/states.pth
restore_model: './pretrained/fastpitch_ar_adv.pth'

# Output directories for this experiment (both relative paths, same
# `exp_fp_adv` experiment name).
log_dir: 'logs/exp_fp_adv'
checkpoint_dir: 'checkpoints/exp_fp_adv'

# ---- dataset ----
# NOTE: the wav directories are absolute paths on drive G: and are therefore
# specific to one machine; the label files are relative paths.

# training split
train_wavs_path: 'G:/data/arabic-speech-corpus/wav_new'
train_labels: './data/train_phon.txt'

# test split (the directory name "test set" contains a space)
test_wavs_path: 'G:/data/arabic-speech-corpus/test set/wav_new'
test_labels: './data/test_phon.txt'

# Regular expression with the named groups `filename` and `phonemes`, each
# wrapped in double quotes (presumably matched against every line of the
# label files - confirm against the dataset loader).
# Alternative pattern with groups `arabic` and `filestem` separated by "|":
#   label_pattern: (?P<arabic>.*)\|(?P<filestem>.*)
label_pattern: '"(?P<filename>.*)" "(?P<phonemes>.*)"'

# ---- FastPitch pitch (f0) settings ----
# File holding the pitch dictionary.
f0_dict_path: './data/pitch_dict.pt'

# Mean and standard deviation of f0 (presumably in Hz and used to normalise
# pitch values - confirm against the code that reads them).
f0_mean: 130.05478
f0_std: 22.86267

# ---- loss weights ----
# Scalar weights for the GAN loss term and the feature loss term
# (floats, written with an explicit fractional digit).
gan_loss_weight: 3.0
feat_loss_weight: 1.0

# ---- batch sizes ----
# Lengths are measured in frames; 1 frame ≈ 11.6ms.
# The two lists have the same number of entries; presumably batch_sizes[i]
# is used for items no longer than max_lengths[i] - confirm against the
# batch sampler.
max_lengths: [1000, 1300, 1850, 30000]
batch_sizes: [10, 8, 6, 4]

# ---- optimizers ----
# Generator: AdamW learning rate, beta1 and beta2.
g_lr: 1.0e-4
g_beta1: 0.0
g_beta2: 0.99

# Discriminator: AdamW learning rate, beta1 and beta2.
d_lr: 1.0e-4
d_beta1: 0.0
d_beta2: 0.99

# ---- checkpoint cadence ----
# Iteration counts (presumably: write the states file every
# `n_save_states_iter` iterations and a backup copy every
# `n_save_backup_iter` iterations - confirm in the training loop).
n_save_states_iter: 100
n_save_backup_iter: 1000