"""Gradio demo: live microphone transcription of Wolof speech."""

import time

import gradio as gr
from transformers import pipeline

# Seconds to pause before each transcription.
# NOTE(review): presumably throttles live updates -- confirm the intent.
TRANSCRIBE_DELAY_SECONDS = 3

# Speech-recognition pipeline, loaded once at import time and reused for
# every request.
p = pipeline(
    "automatic-speech-recognition",
    model="abdouaziiz/wav2vec2-xls-r-300m-wolof-lm",
)


def transcribe(audio, state=""):
    """Transcribe a Wolof audio clip and append it to the running transcript.

    Args:
        audio: Path to the recorded audio file (the Audio input is configured
            with ``type="filepath"``), or ``None`` when no recording is
            available.
        state: Transcript accumulated by previous calls.

    Returns:
        A ``(text, state)`` pair holding the same updated transcript twice:
        once for the textbox output and once for the session state.
    """
    if state is None:
        # Defensive: treat a missing state as an empty transcript so the
        # concatenation below cannot fail.
        state = ""
    if audio is None:
        # Nothing was recorded (or the recording was cleared); the pipeline
        # cannot process None, so leave the transcript untouched.
        return state, state

    time.sleep(TRANSCRIBE_DELAY_SECONDS)
    text = p(audio)["text"]
    state += text + " "
    return state, state


iface = gr.Interface(
    fn=transcribe,
    inputs=[
        gr.inputs.Audio(source="microphone", type="filepath"),
        "state",
    ],
    outputs=[
        "textbox",
        "state",
    ],
    live=True,
)

iface.launch(inline=False)