---
# Audio/data configuration with a `hub` section describing the input type.
# NOTE(review): the tts_model_id below references facebookresearch/fairseq, so
# this is presumably a fairseq speech config -- confirm against the consumer.

# Literal string "N/A" (not a null); no audio root directory is given here.
audio_root: N/A
standardize_audio: true
use_audio_input: true
vocab_filename: dict.txt

# Both values were left empty in the original, which YAML reads as null.
# Written explicitly so the intent is unambiguous.
tgt_lang: null
eos_token: null

hub:
  input_type: standardized_waveform
  # Disabled options, kept for reference.
  # NOTE(review): the original nesting was lost when the file was collapsed
  # onto one line; these are assumed to belong under `hub`, with `beam` and
  # `max_len_a` as children of `generation_args` -- confirm before enabling.
  # tts_model_id: facebookresearch/fairseq:ust:unit_hifigan_mhubert_vp_en_es_fr_it3_400k_layer11_km1000_lj_dur
  # unit_vocoder: true
  # generation_args:
  #   beam: 10
  #   max_len_a: 0.003125