import gradio as gr
from transformers import pipeline


# Build the speech-recognition pipeline once at import time so that every
# prediction request reuses the same loaded model. The checkpoint is pinned
# explicitly instead of relying on the library's per-task default.
model = pipeline(
    task="automatic-speech-recognition",
    model="facebook/s2t-medium-librispeech-asr",
)

def predict_speech_to_text(audio):
    """Transcribe a recorded audio clip to text.

    Args:
        audio: The audio input handed over by the UI (the interface in this
            file is configured with ``type="filepath"``), or ``None`` when
            the user submitted without recording anything.

    Returns:
        The transcription found under the ``'text'`` key of the pipeline
        result, or an empty string when no audio was provided.
    """
    # Nothing was recorded: return an empty transcript instead of forwarding
    # None to the pipeline, which would raise.
    if audio is None:
        return ""

    prediction = model(audio)
    return prediction['text']

# Build the demo UI: microphone audio in, transcribed text out.
# NOTE(review): the bare ``gr.Interface.load(...)`` call that used to precede
# this was removed -- its return value was discarded, so it only added a
# network round-trip at startup without affecting the served interface.
demo = gr.Interface(
    fn=predict_speech_to_text,
    title="🧑🏽‍🎤 PROLOVE 🥰😘 ",
    inputs=gr.inputs.Audio(
        source="microphone", type="filepath", label="Input"),
    outputs=gr.outputs.Textbox(label="Output"),
    description="This application was created to help correct pronouncation",
    examples=['Good night_alvi.wav'],
    allow_flagging='never',
)

# Start the web server for the interface.
demo.launch()