inference:
  file_path: "output.wav"
  speaker_wav: "content/speaker.wav"
  language: "en"
  model: "tts_models/multilingual/multi-dataset/xtts_v2"

recording:
  recorded_wav: "content/recorded/recorded.wav"