|
import gradio as gr |
|
import os |
|
from AinaTheme import theme |
|
import phonemizer |
|
from dotenv import load_dotenv |
|
import logging |
|
|
|
load_dotenv() |
|
|
|
MAX_INPUT_TEXT_LEN = int(os.environ.get("MAX_INPUT_TEXT_LEN", default=325)) |
|
|
|
critical_logger = logging.getLogger("phonemizer") |
|
critical_logger.setLevel(logging.CRITICAL) |
|
|
|
|
|
global_phonemizer_central = phonemizer.backend.EspeakBackend( |
|
language="ca", |
|
preserve_punctuation=True, |
|
with_stress=True, |
|
language_switch="remove-flags", |
|
logger=critical_logger, |
|
) |
|
|
|
global_phonemizer_valencia = phonemizer.backend.EspeakBackend( |
|
language="ca-va", |
|
preserve_punctuation=True, |
|
with_stress=True, |
|
language_switch="remove-flags", |
|
logger=critical_logger, |
|
) |
|
|
|
global_phonemizer_occidental = phonemizer.backend.EspeakBackend( |
|
language="ca-nw", |
|
preserve_punctuation=True, |
|
with_stress=True, |
|
language_switch="remove-flags", |
|
logger=critical_logger, |
|
) |
|
|
|
global_phonemizer_balear = phonemizer.backend.EspeakBackend( |
|
language="ca-ba", |
|
preserve_punctuation=True, |
|
with_stress=True, |
|
language_switch="remove-flags", |
|
logger=critical_logger, |
|
) |
|
|
|
global_phonemizer_algueres = phonemizer.backend.EspeakBackend( |
|
language="ca-al", |
|
preserve_punctuation=True, |
|
with_stress=True, |
|
language_switch="remove-flags", |
|
logger=critical_logger, |
|
) |
|
|
|
global_phonemizer_rossellones = phonemizer.backend.EspeakBackend( |
|
language="ca-ro", |
|
preserve_punctuation=True, |
|
with_stress=True, |
|
language_switch="remove-flags", |
|
logger=critical_logger, |
|
) |
|
|
|
def phonemiser(text, dialect): |
|
phonemizers = {"Central": global_phonemizer_central, |
|
"Valencian": global_phonemizer_valencia, |
|
"North-West": global_phonemizer_occidental, |
|
"Balear": global_phonemizer_balear, |
|
"Alguerés": global_phonemizer_algueres, |
|
"Rosellonés": global_phonemizer_rossellones} |
|
|
|
fonemitzador = phonemizers[dialect] |
|
|
|
fonemes = fonemitzador.phonemize([text], strip=True, njobs=1)[0] |
|
return fonemes |
|
|
|
|
|
title = "Transcripció fonètica multidialectal en català️" |
|
description=""" |
|
Transcripció fonètica per a diferents dialectes del català mitjançant eSpeak. |
|
Phonetic transcription for different dialects of Catalan |
|
using eSpeak. |
|
repo: https://github.com/projecte-aina/espeak-ng/tree/dev-ca |
|
""" |
|
|
|
def submit_input(input_, dialect): |
|
output = None |
|
if input_ is not None and len(input_) < MAX_INPUT_TEXT_LEN: |
|
output = phonemiser(input_, dialect) |
|
else: |
|
gr.Warning(f"Your text exceeds the {MAX_INPUT_TEXT_LEN}-character limit.") |
|
return output |
|
|
|
def change_interactive(text): |
|
input_state = text |
|
if input_state.strip() != "": |
|
return gr.update(interactive = True) |
|
else: |
|
return gr.update(interactive = False) |
|
def clean(): |
|
return ( |
|
None, |
|
None, |
|
) |
|
|
|
|
|
|
|
with gr.Blocks(theme=theme) as app: |
|
|
|
gr.Markdown(f"<h1 style='text-align: center; margin-bottom: 1rem'>{title}</h1>") |
|
|
|
gr.Markdown(description) |
|
|
|
with gr.Row(equal_height=False, variant="panel"): |
|
|
|
with gr.Column(variant='panel'): |
|
input_ = gr.Textbox( |
|
label="Text", |
|
value="Les coses importants són les que no ho semblen.", |
|
lines=4 |
|
) |
|
|
|
dialect = gr.Dropdown(label="Dialect", choices=["Central", "Valencian", "North-West", "Balear", "Alguerés", "Rosellonés"], value="Central") |
|
with gr.Row(variant="panel"): |
|
clear_btn = gr.Button( |
|
"Clean", |
|
) |
|
submit_btn = gr.Button( |
|
"Submit", |
|
variant="primary", |
|
) |
|
with gr.Column(variant='panel'): |
|
output = gr.Textbox( |
|
label="Output", |
|
interactive=False, |
|
show_copy_button=True |
|
) |
|
gr.Examples( |
|
label="Examples", |
|
examples=[ |
|
["Les coses importants són les que no ho semblen.", "Central"], |
|
["Les coses importants són les que no ho semblen.", "Valencian",], |
|
["Les coses importants són les que no ho semblen.", "North-West",], |
|
["Les coses importants són les que no ho semblen.","Balear"], |
|
], |
|
inputs=[input_, dialect], |
|
outputs=output, |
|
fn=submit_input) |
|
|
|
for button in [submit_btn, clear_btn]: |
|
input_.change(fn=change_interactive, inputs=[input_], outputs=button, api_name=False) |
|
|
|
clear_btn.click(fn=clean, inputs=[], outputs=[input_, output] , queue=False, api_name=False) |
|
submit_btn.click(fn=submit_input, inputs=[input_, dialect], outputs=output, api_name="get-results", concurrency_limit=2) |
|
|
|
app.launch(show_api=True, server_name="0.0.0.0", server_port=7860) |
|
|