import torch

from InferenceInterfaces.UtteranceCloner import UtteranceCloner

if __name__ == '__main__':
    uc = UtteranceCloner(model_id="Nancy", device="cuda" if torch.cuda.is_available() else "cpu")

    # What is said in path_to_reference_audio_for_intonation has to match the text in the reference_transcription exactly!
    uc.clone_utterance(path_to_reference_audio_for_intonation="audios/speaker_references_for_testing/sad.wav",
                       path_to_reference_audio_for_voice="audios/speaker_references_for_testing/female_mid_voice.wav",  # the two reference audios can be the same, but don't have to be
                       transcription_of_intonation_reference="This report is due tomorrow.",
                       filename_of_result="audios/test_cloned.wav",
                       lang="eng")