File size: 5,521 Bytes
885eaab |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118 119 120 121 122 123 124 125 126 127 128 129 130 131 132 133 134 135 136 137 138 139 140 141 142 143 144 145 146 147 148 149 150 151 152 153 154 155 156 157 158 159 160 161 162 163 164 165 166 167 168 169 170 171 172 173 |
additional_config: conf/vtn.tts_pt.v1.ppg_sxliu.yaml
allow_cache: true
batch_size: 16
cleaner: tacotron
collater_type: ARVCCollater
config: exp/TXHC_bdl_1032_debug/original_config.yml
# Loss configuration: a single entry, Seq2SeqLoss, with its parameter mapping.
# NOTE(review): seq2seq_loss_params.bce_pos_weight carries the same value
# (10.0); presumably the two must stay in sync -- confirm which one is read.
criterions:
  Seq2SeqLoss:
    bce_pos_weight: 10.0
dev_dp_input_dir: null
dev_dumpdir: dump/dev/ppg_sxliu_norm
dev_duration_dir: null
dev_text: data/dev/text
distributed: false
eval_interval_steps: 500
feat_type: ppg_sxliu
fft_size: 1024
fmax: 7600
fmin: 80
format: hdf5
freeze-mods: null
g2p: g2p_en
global_gain_scale: 1.0
grad_norm: 1.0
hop_size: 256
# Decoding-time settings: output length ratio bounds and a threshold.
# NOTE(review): threshold is presumably the stop-probability cutoff -- confirm.
inference:
  maxlenratio: 6.0
  minlenratio: 0.0
  threshold: 0.5
# Flush (non-indented) block sequence: the five items below are the value of
# init-mods. NOTE(review): presumably the modules loaded from init_checkpoint
# -- confirm against the trainer.
init-mods:
- encoder
- decoder
- feat_out
- prob_out
- postnet
init_checkpoint: exp/TXHC_bdl_1032_debug/original_checkpoint-50000steps.pkl
log_interval_steps: 10
# Hyperparameters of the model selected by model_type.
# idim and odim are both 144, the same length recorded for the stats arrays.
model_params:
  adim: 384
  aheads: 4
  decoder_concat_after: false
  decoder_normalize_before: false
  decoder_reduction_factor: 2
  dlayers: 6
  dprenet_layers: 2
  dprenet_units: 256
  dunits: 1536
  elayers: 6
  encoder_concat_after: false
  encoder_normalize_before: true
  eunits: 1536
  idim: 144
  odim: 144
  postnet_chans: 256
  postnet_filts: 5
  postnet_layers: 5
  use_batch_norm: true
model_type: VTN
non_linguistic_symbols: none
num_mels: 80
num_save_intermediate_results: 4
num_workers: 2
# Arguments for the optimizer named by optimizer_type.
optimizer_params:
  lr: 8.0e-05
optimizer_type: Adam
outdir: exp/TXHC_bdl_1032_debug
pin_memory: true
pretrain: ''
rank: 0
resume: ''
sampling_rate: 16000
save_interval_steps: 1000
scheduler: warmuplr
# Arguments for the learning-rate scheduler named by scheduler.
scheduler_params:
  warmup_steps: 4000
# Loss parameters. NOTE(review): criterions.Seq2SeqLoss.bce_pos_weight holds
# the same value (10.0); confirm which of the two the trainer actually reads.
seq2seq_loss_params:
  bce_pos_weight: 10.0
src_dev_dumpdir: dump/TXHC_dev/ppg_sxliu/norm_ljspeech
src_feat_type: ppg_sxliu
src_train_dumpdir: dump/TXHC_train_1032/ppg_sxliu/norm_ljspeech
# Two serialized NumPy arrays, mean and scale.
# SECURITY NOTE(review): the !!python/object/apply, !!python/name and
# !!python/tuple tags are Python-specific; a safe loader (yaml.safe_load)
# rejects them, and an unsafe loader executes the referenced callables.
# Only load this file from a trusted source.
# NOTE(review): going by NumPy's pickle state layout (version, shape, dtype,
# Fortran-order flag, raw bytes), each array is presumably a 144-element
# little-endian float32 vector -- confirm before relying on it.
stats:
  mean: !!python/object/apply:numpy.core.multiarray._reconstruct
    args:
    - &id001 !!python/name:numpy.ndarray ''
    - !!python/tuple
      - 0
    - !!binary |
      Yg==
    state: !!python/tuple
    - 1
    - !!python/tuple
      - 144
    - &id002 !!python/object/apply:numpy.dtype
      args:
      - f4
      - false
      - true
      state: !!python/tuple
      - 3
      - <
      - null
      - null
      - null
      - -1
      - -1
      - 0
    - false
    - !!binary |
      6RzTPXVNQb7seW+/uWClPQCf5DwPGXQ9G1WePo3UFz6KNp4+FW29PKUMYb5cODu+UbHTPWSOQL53
      uc48guEYPn4qgT6KxCO/ER4aPgElyT4BsV6+jpz4valJYj54Z4q+di9MvkSt3z2KlVi/lI+kPVRf
      DD+rzu8+CC1svkHG2ruaX9I9tog+vniP5j2YLva8L589vhSeSL/l4PE9s+6VPJZ2szsyuQi+1Opi
      PU7OzbxdUNc/RtTqPfLVnL5ASu0+fp6mPuvjLryKgqU9p4hVu2In9T2D1ri+vAz5PHVzzz3ac+G9
      Ecu9PZx+Hj6Mrx49kWyAPfqRNj6s4WW+BjmJPlp7+L0eN1g+UzhKPMuUkr7yhl29DwY8viWowbyS
      iUe9igiJPX+YgT5CNy++JExQvirydT1kAdA9V3TjvcHclz2aklg+QtSYPahhl75+c9U9yzjjvHAm
      973nkJm9KkJEPvg9dL2KZYE+GmnxvGzyk75R9c8+KuMGvqXd6r3sxZg9Nv0jPmTSS76EHfe90mGq
      Pd2alb0BxbW+HNUcPxoIwD16mQ++PkZCvhh8jT5I6Kg/HT1pPUMkWj4dO4I9dePAu3qRqb1s/Zo+
      G+Mrvf4WIz+DW7o+yHIePsTqRry9aGk+HVjvPRnqc7xE9S495SlKvOMueD9qdKG+kabJvaV17z3B
      Q5g8VVjYuvwZbz22gwi+B98XPSBKIz8+dVc+Gq+FPcAYlr301Vw9L0y2vQj5pL36o9Q+sgqHPs++
      3z1xMCQ/
  # scale reuses the ndarray class (*id001) and dtype (*id002) anchored in mean.
  scale: !!python/object/apply:numpy.core.multiarray._reconstruct
    args:
    - *id001
    - !!python/tuple
      - 0
    - !!binary |
      Yg==
    state: !!python/tuple
    - 1
    - !!python/tuple
      - 144
    - *id002
    - false
    - !!binary |
      OanzPqWL3T4RC9M+kg0VP0g2ED8rY/E+UDTvPrfl2T7xOOA+C97MPp688D4/LvE+r3rbPgGi5z47
      MNI+VOHEPgbm2D5gJs0+higRP8sS5z7TvQY/y8rXPnlO1j42lvg++sr0PocB5D5JMtU+2mj0PkBu
      HD8joiU/1ibePq5jyD4ReO4+CE7YPgbv6j79B7s+euHxPobUxz7c8vc+DhicP9qf6z4SVQA/UpHx
      Pu6tzD7MChM/1wj3Po76xz4WyEY/wtvdPkRM6T7xdfg+YGXfPnrHAj984tQ+EFTqPqSQCz+O3RI/
      Osq/PsgW1j4aDts+Obr9Ppw45z7nNOU+J9DyPt4D+T468Ao/jzEaP9Fq5j7Gb+U+NALCPrPy3j7U
      BA8/Nl73PiCq0T5qr+Y+FaQVP8+d5j5Ave0+jx7oPlKI6j4q5+U+f//IPqW6DD+UWSE/3WPJPix+
      2D4+kgU/TnYWP7GX1z55iOo+qHP1PgIh3D6zgD4/MHEJP7zp1z5Aqtw+k1X2Pvynyj5PJ88+lhjX
      PrSi2j5F9fk+du3ZPggsyD6yNNE+lmrDPujPNz8Kscc+mx/0Ppaw/T5UoOk+pjHpPgpgxz5flAI/
      MnjSPo190j7X2t8+gmvpPlgnFD9q0CY/u8oQP4ER+D536dc+9LfJPnkQAD/rKMI+i4YIP7xyBz+B
      nf0+VcTKPqbVAT/ck+I+9uTePhdvAz/UGuo+ahfTPt0/9D7shcQ++VnSPphNzz4Ewvk+DlAoP+91
      9j4qV/4+
token_list: exp/phn_tacotron_transformer_tts.v1.ppg_sxliu/tokens.txt
token_type: phn
train_dp_input_dir: null
train_dumpdir: dump/train_no_dev/ppg_sxliu_norm
train_duration_dir: null
train_max_steps: 50000
train_text: data/train_no_dev/text
trainer_type: ARVCTrainer
trg_dev_dumpdir: dump/bdl_dev/ppg_sxliu/norm_ljspeech
trg_feat_type: ppg_sxliu
trg_stats: exp/TXHC_bdl_1032_debug/stats.h5
trg_train_dumpdir: dump/bdl_train_1032/ppg_sxliu/norm_ljspeech
trim_frame_size: 2048
trim_hop_size: 512
trim_silence: false
trim_threshold_in_db: 60
verbose: 1
version: 0.1.0
# Vocoder assets: checkpoint, its config, and its stats file.
# These keys are nested under vocoder and are distinct from the top-level
# config and stats keys of this file.
vocoder:
  # Alternative set of paths (s3prl-vc experiment directory), commented out:
  # checkpoint: /data/group1/z44476r/Experiments/s3prl-vc/egs/l2-arctic/a2o_vc/exp/TXHC_ppg_sxliu_taco2_ar/checkpoint-10000steps.pkl
  # config: /data/group1/z44476r/Experiments/s3prl-vc/egs/l2-arctic/a2o_vc/exp/TXHC_ppg_sxliu_taco2_ar/config.yml
  # stats: /data/group1/z44476r/Experiments/s3prl-vc/egs/l2-arctic/a2o_vc/exp/TXHC_ppg_sxliu_taco2_ar/stats.h5
  checkpoint: /data/group1/z44476r/Experiments/seq2seq-vc/egs/l2-arctic/lsc/downloads/ppg_sxliu_decoder_plus_pwg_THXC/checkpoint-10000steps.pkl
  config: /data/group1/z44476r/Experiments/seq2seq-vc/egs/l2-arctic/lsc/downloads/ppg_sxliu_decoder_plus_pwg_THXC/config.yml
  stats: /data/group1/z44476r/Experiments/seq2seq-vc/egs/l2-arctic/lsc/downloads/ppg_sxliu_decoder_plus_pwg_THXC/stats.h5
vocoder_type: s3prl_vc
win_length: null
window: hann
|