File size: 1,083 Bytes
21ad639
 
 
 
 
 
 
 
 
077c8f8
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
21ad639
 
 
 
077c8f8
21ad639
 
077c8f8
6902e90
077c8f8
 
 
6902e90
077c8f8
 
 
 
ac5a7ce
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
from transformers import pipeline
import gradio as gr

# Model identifier handed to `pipeline`; swap in another checkpoint name here.
MODEL_ID = "Yuyang2022/yue"

# Built once at import time; the request handlers below call it per input.
pipe = pipeline(model=MODEL_ID)

def transcribe(audio):
    """Transcribe an audio clip with the module-level ``pipe``.

    Args:
        audio: Path of the audio file to transcribe. May be ``None`` or
            empty when the form is submitted without a recording.

    Returns:
        The ``"text"`` entry of the pipeline result, or an empty string when
        no audio was supplied.
    """
    # Guard first: handing None to the pipeline raises instead of producing
    # a transcription, which surfaces as an opaque error in the UI.
    if not audio:
        return ""
    return pipe(audio)["text"]

def transcribe_video(link):
    """Download the audio track of a YouTube video and transcribe it.

    Args:
        link: URL of the YouTube video.

    Returns:
        The ``"text"`` entry of the pipeline result, or an empty string when
        ``link`` is empty or blank.

    Raises:
        ValueError: If no audio-only stream is available for the video.
    """
    if not link or not link.strip():
        return ""

    # Imported locally because the module's top-level imports do not bring
    # these names into scope.
    import tempfile

    import pytube

    stream = pytube.YouTube(link.strip()).streams.get_audio_only()
    if stream is None:
        raise ValueError(f"No audio-only stream available for {link!r}")

    # Use the path returned by download() rather than scanning the working
    # directory for "*.mp4": the scan could pick up a stale file from an
    # earlier request. The scratch directory also removes the download once
    # the transcription is done.
    with tempfile.TemporaryDirectory() as workdir:
        audio_path = stream.download(output_path=workdir)
        return pipe(audio_path)["text"]

# Microphone demo: the recording is passed to `transcribe` as a file path
# and the returned text is shown as the output.
microphone_input = gr.Audio(type="filepath", source="microphone")
iface1 = gr.Interface(
    title="Whisper Base",
    description="Realtime demo for  speech recognition using a fine-tuned Whisper-base model.",
    fn=transcribe,
    inputs=microphone_input,
    outputs="text",
)

# YouTube demo: the text box value is passed to `transcribe_video` and the
# returned text is shown as the output.
youtube_link_input = gr.Textbox(placeholder="Youtube Link", label="Youtube Link")
iface2 = gr.Interface(
    title="Whisper Base",
    description="Asynchronous demo for youtube speech recognition using a fine-tuned Whisper-base model.",
    fn=transcribe_video,
    inputs=youtube_link_input,
    outputs=["text"],
)



# Serve both interfaces from one app. Launching only `iface1` left the
# YouTube interface (`iface2`) defined but unreachable.
demo = gr.TabbedInterface(
    [iface1, iface2],
    ["Transcribe Microphone", "Transcribe YouTube"],
)
demo.launch()