import gradio as gr
from transformers import pipeline

# Build the speech-recognition pipeline once at import time so every request
# handled by audio2text reuses the same loaded model.
trans = pipeline(
    task="automatic-speech-recognition",
    model="openai/whisper-small",
)


def audio2text(audio):
    """Transcribe an audio clip to text with the module-level pipeline.

    Args:
        audio: The audio input forwarded unchanged to ``trans``, or ``None``
            when no clip was provided.

    Returns:
        The ``"text"`` entry of the pipeline result, or an empty string when
        ``audio`` is ``None``.
    """
    # No clip supplied (e.g. the form was submitted without a recording):
    # return an empty transcript instead of handing None to the model.
    if audio is None:
        return ""
    return trans(audio)["text"]

# Web UI: one audio input delivered to audio2text as a file path, and a single
# textbox showing the returned transcript.
# NOTE(review): `source=` looks like the Gradio 3.x keyword; newer releases
# appear to use `sources=[...]` instead -- confirm against the pinned version.
mic_input = gr.Audio(source="microphone", type="filepath")
demo = gr.Interface(fn=audio2text, inputs=[mic_input], outputs=["textbox"])
demo.launch()