audio_root: N/A | |
standardize_audio: true | |
use_audio_input: true | |
vocab_filename: dict.txt | |
tgt_lang: <lang:en> | |
eos_token: <lang:en> | |
hub: | |
input_type: standardized_waveform | |
#tts_model_id: facebookresearch/fairseq:ust:unit_hifigan_mhubert_vp_en_es_fr_it3_400k_layer11_km1000_lj_dur | |
#unit_vocoder: true | |
#generation_args: | |
# beam: 10 | |
# max_len_a: 0.003125 |