Spaces:

theodotus
/

ukrainian-voices

Running

theodotus committed on Sep 11, 2022

Commit

fe5a4b7

•

1 Parent(s): a147249

Added accentification

Files changed (2) hide show

accentor.py ADDED Viewed

+from ukrainian_word_stress import Stressifier, StressSymbol
+from ukrainian_accentor_transformer import Accentor
# Accentor modes understood by accentification(); app.py offers this list as
# the "Accentor" radio choices and uses its first entry as the default.
accentors = ["model", "vocab", "none"]


def stress_replace_and_shift(stressed: str):
    """Rewrite trailing stress marks as a "+" placed before the stressed character.

    Every ``StressSymbol.CombiningAcuteAccent`` in *stressed* is first replaced
    with "+". Each "+" is then moved one position to the left, so that it
    precedes the character it used to follow, e.g. "при+віт" -> "пр+ивіт".

    A "+" that has no character to jump over -- one at the very start of the
    text, or one that directly follows another "+" -- is left where it is.

    Args:
        stressed: Text whose stress is marked by a combining acute accent
            and/or a "+" written after the stressed character.

    Returns:
        The text with each stress mark written as a "+" before the character
        it originally followed.
    """
    plussed = stressed.replace(StressSymbol.CombiningAcuteAccent, "+")

    pieces = []
    for index, char in enumerate(plussed):
        # The index > 0 guard matters: for a leading "+", index - 1 would be
        # -1, which Python resolves to the LAST character of the string.
        if char == "+" and index > 0 and plussed[index - 1] != "+":
            # pieces[-1] is the character just before this "+"; slide the
            # marker in front of it.
            pieces.insert(len(pieces) - 1, "+")
        else:
            pieces.append(char)
    return "".join(pieces)
# Module-level accentor instances: created once when this module is imported
# and reused by every accentification() call.
stressify = Stressifier(stress_symbol=StressSymbol.CombiningAcuteAccent)
accentor_transformer = Accentor()


def accentification(sentence: str, mode: str):
    """Strip existing stress marks from *sentence* and re-accent it per *mode*.

    All "+" characters and all ``StressSymbol.CombiningAcuteAccent`` characters
    are removed before the selected accentor runs, so stress marks already
    present in the input do not survive.

    Args:
        sentence: Input text, possibly already carrying stress marks.
        mode: "vocab" passes the cleaned text to ``stressify``; "model" passes
            it to ``accentor_transformer``; any other value (e.g. "none")
            applies no accentor.

    Returns:
        The selected accentor's result for the cleaned text, or the cleaned
        text itself when no accentor is selected.
    """
    cleaned = sentence.replace("+", "").replace(
        StressSymbol.CombiningAcuteAccent, ""
    )

    if mode == "vocab":
        return stressify(cleaned)
    if mode == "model":
        return accentor_transformer(cleaned)
    # Unrecognised modes fall through to "no accentuation".
    return cleaned

app.py CHANGED Viewed

@@ -6,6 +6,7 @@ from torch import no_grad, package
 import ctypes
 import gc
 config = {
@@ -38,14 +39,18 @@ def init_models():
     return models
-def tts(text: str, voice: str):
     synt = models[voice]
     with tempfile.NamedTemporaryFile(suffix=".wav", delete=False) as fp:
         with no_grad():
-            wav_data = synt.tts(text, **tts_kwargs)
             synt.save_wav(wav_data, fp)
             trim_memory()
-        return fp.name
@@ -58,15 +63,23 @@ iface = gr.Interface(
     inputs=[
         gr.Textbox(
             label="Input",
-            value="К+ам'ян+ець-Под+ільський - м+істо в Хмельн+ицькій +області Укра+їни, ц+ентр Кам'ян+ець-Под+ільської міськ+ої об'+єднаної територі+альної гром+ади +і Кам'ян+ець-Под+ільського рай+ону.",
         ),
         gr.Radio(
             label="Voice",
             choices=voices,
             value=voices[0],
         ),
     ],
-    outputs=gr.Audio(label="Output"),
     title="🇺🇦 - Ukrainian Voices",
 )

 import ctypes
 import gc
+from accentor import accentification, stress_replace_and_shift, accentors
 config = {
     return models
def tts(text: str, voice: str, mode: str):
    """Accent *text*, synthesize it with the chosen voice, and save it as a WAV file.

    Args:
        text: Input text to speak.
        voice: Key into the module-level ``models`` mapping.
        mode: Accentor mode, forwarded unchanged to ``accentification``.

    Returns:
        A ``(wav_path, accented_text)`` tuple: the name of the temporary
        ".wav" file that was written, and the text as returned by
        ``accentification`` (before the "+" shift).
    """
    # Stress marking: the accented form goes back to the caller, while the
    # "+"-shifted form is what the synthesizer receives.
    accented_text = accentification(text, mode)
    synthesizer_input = stress_replace_and_shift(accented_text)

    # Synthesis.
    voice_model = models[voice]
    # delete=False leaves the file on disk once the handle is closed, so the
    # returned path is still usable by the caller.
    with tempfile.NamedTemporaryFile(suffix=".wav", delete=False) as wav_file:
        with no_grad():
            audio = voice_model.tts(synthesizer_input, **tts_kwargs)
            voice_model.save_wav(audio, wav_file)
            trim_memory()
        return wav_file.name, accented_text
     inputs=[
         gr.Textbox(
             label="Input",
+            value="Кам'янець-Подільський - місто в Хмельницькій області України, центр Кам'янець-Подільської міської об'єднаної територіальної громади і Кам'янець-Подільського району.",
         ),
         gr.Radio(
             label="Voice",
             choices=voices,
             value=voices[0],
         ),
+        gr.Radio(
+            label="Accentor",
+            choices=accentors,
+            value=accentors[0],
+        ),
+    ],
+    outputs=[
+        gr.Audio(label="Output"),
+        gr.Textbox(label="Stressed")
     ],
     title="🇺🇦 - Ukrainian Voices",
 )