Spaces:
Sleeping
Sleeping
File size: 2,122 Bytes
0d80816 ea32d9a 0d80816 ea32d9a b37a421 ea32d9a 0d80816 ea32d9a 0d80816 c455203 0d80816 ea32d9a 0d80816 9da2dd2 0d80816 2afaead 0d80816 23f695d 0d80816 |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 |
# Copyright (c) 2023 Amphion.
#
# This source code is licensed under the MIT license found in the
# LICENSE file in the root directory of this source tree
import os
import subprocess
import sys


def build_monotonic_align(build_dir="./modules/monotonic_align"):
    """Build the monotonic_align extension in place (best effort).

    Runs ``setup.py build_ext --inplace`` inside ``build_dir`` after making
    sure the ``monotonic_align`` sub-directory exists there.

    The previous implementation chained shell commands with ``;`` and ended
    with ``cd /home/user/app``. The shell's exit status was therefore that of
    the final ``cd``, so a failed build was never reported, and the ``cd``
    itself had no effect on this process. Here the build command is run
    directly, so its own return code is what gets checked.

    Args:
        build_dir: Directory that contains the extension's ``setup.py``.

    Returns:
        True when the build command exited with status 0, False otherwise.
        Failures are printed rather than raised so that start-up continues.
    """
    if not os.path.isdir(build_dir):
        print(f"Command failed: build directory not found: {build_dir}")
        return False

    try:
        # Equivalent of the original `mkdir -p monotonic_align`.
        os.makedirs(os.path.join(build_dir, "monotonic_align"), exist_ok=True)
        # sys.executable builds the extension for the interpreter that will
        # import it, instead of whichever `python` is first on PATH.
        result = subprocess.check_output(
            [sys.executable, "setup.py", "build_ext", "--inplace"],
            cwd=build_dir,
            text=True,
        )
    except subprocess.CalledProcessError as e:
        print(f"Command failed with return code {e.returncode}")
        if e.output:
            print(e.output)
        return False
    except OSError as e:
        print(f"Command could not be run: {e}")
        return False

    print("Command output:")
    print(result)
    return True


build_monotonic_align()
import gradio as gr
import os
import inference
# Speaker display name (shown in the UI) -> speaker id passed to the
# inference entry point via --speaker_name.
SUPPORTED_SPEAKERS = {
    "Cori Samuel": "hifitts_92",
    "Phil Benson": "hifitts_6097",
    "Mike Pelton": "hifitts_6670",
    "Tony Oliva": "hifitts_6671",
    "Maria Kasper": "hifitts_8051",
    "John Van Stan": "hifitts_9017",
    "Helen Taylor": "hifitts_9136",
    "Sylviamb": "hifitts_11614",
    "Celine Major": "hifitts_11697",
    "LikeManyWaters": "hifitts_12787",
}
def tts_inference(input_text, target_speaker):
    """Run single-utterance TTS inference and return the output wav path.

    Args:
        input_text: Text forwarded to the inference entry point as ``--text``.
        target_speaker: Speaker display name; must be a key of
            ``SUPPORTED_SPEAKERS``.

    Returns:
        The relative path ``"result/single/test_pred.wav"``. The path is
        returned unconditionally; this function does not check that the
        file exists (presumably ``inference.main`` writes it there when run
        with ``--mode single --output_dir result`` -- confirm against the
        inference module).

    Raises:
        KeyError: If ``target_speaker`` is not in ``SUPPORTED_SPEAKERS``.
    """
    # Translate the display name into the id used on the command line.
    speaker_id = SUPPORTED_SPEAKERS[target_speaker]

    cli_args = [
        "--config", "./egs/tts/vits_hifitts/exp_config.json",
        "--checkpoint_path", "./latest-checkpoint",
        "--speaker_name", speaker_id,
        "--text", input_text,
        "--mode", "single",
        "--output_dir", "result",
        "--log_level", "debug",
    ]

    # WORK_DIR is set before every call to the inference entry point.
    os.environ["WORK_DIR"] = "./"
    inference.main(cli_args)

    return "result/single/test_pred.wav"
# Input widgets, listed in the positional order of tts_inference's parameters
# (input_text, target_speaker).
_text_input = gr.Textbox(
    label="Input text",
    type="text",
    placeholder="Type something here..",
)
_speaker_input = gr.Radio(
    choices=list(SUPPORTED_SPEAKERS),
    label="Target Speaker",
    value="Cori Samuel",
)
demo_inputs = [_text_input, _speaker_input]

# Audio widget that receives the file path returned by tts_inference.
demo_output = gr.Audio(label="")

# Wire inputs, callback and output into a single Interface.
demo = gr.Interface(
    fn=tts_inference,
    inputs=demo_inputs,
    outputs=demo_output,
    title="Amphion Text-to-Speech",
)
# Start the web UI only when this file is executed as a script.
if __name__ == "__main__":
    # share=True asks Gradio to also create a public share link.
    demo.launch(share=True)