Spaces:

Ionut-Bostan
/

Emotion_Aware_TTS

Sleeping

update app

by Ionut-Bostan - opened May 8

←

Files changed (1) hide show

app.py CHANGED Viewed

@@ -10,7 +10,6 @@ predefined_texts = [
 emotion_mapping = {"amused": 0, "anger": 1,
                    "disgust": 2, "neutral": 3, "sleepiness": 4}
 def synthesize_speech(input_type, text, own_text, speaker_id, embed_type, emotion_id):
     if input_type == "Choose from examples":
         selected_text = text
@@ -26,20 +25,21 @@ def synthesize_speech(input_type, text, own_text, speaker_id, embed_type, emotio
     audio_file = f'output/result/EmoV_DB/{selected_text}.wav'
     return audio_file
 iface = gr.Interface(
     fn=synthesize_speech,
-    inputs=[
-        gr.inputs.Radio(
-            ["Choose from examples", "Enter your own text"], label="Input Type"),
-        gr.inputs.Dropdown(choices=predefined_texts, label="Select a text"),
-        gr.inputs.Textbox(lines=2, label="Enter your own text"),
-        gr.inputs.Slider(minimum=0, maximum=3, step=1,
-                         default=0, label="Speaker ID"),
-        gr.inputs.Radio(["bert_embed", "emotion_id"], label="Embedding Type"),
-        gr.inputs.Dropdown(choices=emotion_mapping, label="Select Emotion"),
-    ],
-    outputs=gr.outputs.Audio(type="filepath"),
     title="Text-to-Speech Demo",
 )
 iface.launch()

 emotion_mapping = {"amused": 0, "anger": 1,
                    "disgust": 2, "neutral": 3, "sleepiness": 4}
 def synthesize_speech(input_type, text, own_text, speaker_id, embed_type, emotion_id):
     if input_type == "Choose from examples":
         selected_text = text
     audio_file = f'output/result/EmoV_DB/{selected_text}.wav'
     return audio_file
+# Input components, declared in the same order as synthesize_speech's parameters.
+input_type = gr.Radio(
+    choices=["Choose from examples", "Enter your own text"], label="Input Type")
+text = gr.Dropdown(choices=predefined_texts, label="Select a text")
+own_text = gr.Textbox(lines=2, label="Enter your own text")
+# gr.Slider takes its initial value as `value`; `default` belonged to the
+# legacy gr.inputs.Slider API that this change migrates away from.
+speaker_id = gr.Slider(minimum=0, maximum=3, step=1, value=0, label="Speaker ID")
+embed_type = gr.Radio(choices=["bert_embed", "emotion_id"], label="Embedding Type")
+# Offer the emotion names (the keys of emotion_mapping) as the choices.
+emotion_id = gr.Dropdown(choices=list(emotion_mapping.keys()), label="Select Emotion")
+# Single-function UI: the six input components are passed positionally to
+# synthesize_speech, whose returned .wav path is handed to an audio output
+# configured for file paths.
 iface = gr.Interface(
     fn=synthesize_speech,
+    inputs=[input_type, text, own_text, speaker_id, embed_type, emotion_id],
+    outputs=gr.Audio(type="filepath"),
     title="Text-to-Speech Demo",
+    description="Select or enter text and configure options to synthesize speech."
 )
 iface.launch()