from typing import Optional

import gradio as gr
from transformers import pipeline
# Identifier of the model handed to the pipeline factory; change to
# "your-username/the-name-you-picked" to serve a different checkpoint.
MODEL_ID = "Phong1807/whisper-datn11"

# Built once at module load so every transcription call reuses the same object.
pipe = pipeline(model=MODEL_ID)
def transcribe(audio: Optional[str]) -> str:
    """Transcribe an audio clip to text with the module-level pipeline.

    Args:
        audio: Path to the audio file supplied by the audio input component
            (it is configured with ``type="filepath"``), or ``None`` / an
            empty string when no clip was provided.

    Returns:
        The ``"text"`` entry of the pipeline result, or an empty string when
        there is no audio to transcribe.
    """
    # Guard the "nothing recorded or uploaded" case: handing a missing path
    # to the pipeline would fail instead of producing an empty transcript.
    if not audio:
        return ""
    return pipe(audio)["text"]
# Audio input that passes the callback a file path (type="filepath").
# The component is deliberately created without a `source` argument.
audio_input = gr.Audio(type="filepath")

# Single-function UI: one audio input, one text output.
iface = gr.Interface(
    fn=transcribe,
    inputs=audio_input,
    outputs="text",
    title="Whisper Small Vietnamese",
    description="Realtime demo for Vietnamese speech recognition using a fine-tuned Whisper small model.",
)

# Start serving the demo; inline display is explicitly turned off.
iface.launch(inline=False)