File size: 617 Bytes
230fca6
8c24f20
230fca6
22ee534
230fca6
 
 
ca46f4b
 
d7a46b2
 
 
 
230fca6
 
22ee534
4234f9a
230fca6
 
 
 
 
22ee534
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
from transformers import pipeline
from moviepy.editor import *
import gradio as gr
import requests

# Hub id of the fine-tuned Whisper checkpoint served by this demo; change it
# to "your-username/the-name-you-picked" to serve your own model.
MODEL_ID = "kk90ujhun/whisper-small-hi"

# Built once at import time and shared as the module-level `pipe`.
pipe = pipeline(model=MODEL_ID)

def transcribe(my_video):
    """Transcribe the speech in an uploaded video.

    The video's audio track is written to a temporary WAV file and that
    file is handed to the module-level ``pipe`` pipeline.

    Args:
        my_video: Value delivered by the ``gr.Video`` input. Assumed to be
            the path of the uploaded file on disk, or ``None`` when nothing
            was uploaded -- TODO confirm against the installed Gradio
            version.

    Returns:
        The ``"text"`` entry of the pipeline result, or an empty string
        when no video was supplied or the video has no audio track.
    """
    # Submitting the form without a video must not crash the demo.
    if not my_video:
        return ""

    # Function-scope imports keep this block self-contained.
    import os
    import tempfile

    clip = VideoFileClip(my_video)
    try:
        audio = clip.audio
        # A video without an audio track has nothing to transcribe.
        if audio is None:
            return ""
        with tempfile.TemporaryDirectory() as tmp_dir:
            # The pipeline is given a file path, so the audio track is
            # exported to disk first; the directory is removed afterwards.
            audio_path = os.path.join(tmp_dir, "audio.wav")
            audio.write_audiofile(audio_path)
            return pipe(audio_path)["text"]
    finally:
        # Release the reader resources held by the clip even when
        # extraction or transcription fails.
        clip.close()

# Options for the web UI: a single video upload as input, and the value
# returned by `transcribe` rendered as text.
interface_options = dict(
    fn=transcribe,
    inputs=gr.Video(),
    outputs="text",
    title="Whisper Small Hindi",
    description="Realtime demo for Hindi speech recognition using a fine-tuned Whisper small model.",
)
iface = gr.Interface(**interface_options)

# Launch the app as soon as the module is executed.
iface.launch()