Spaces:

CsanadT
/

Swedish_ASmR

Build error

adjoint-bass committed on Dec 9, 2022

Commit

e559252

1 Parent(s): 556e022

update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -1,38 +1,48 @@
 from transformers import pipeline
 import gradio as gr
 from pytube import YouTube
-pipe = pipeline(model = 'CsanadT/whisper-small-se')
-def live_performance(audio):
-    text = pipe(audio)['text']
     return text
-def url_performance(link):
-    yt = YouTube(str(link))
-    audio= yt.streams.filter(only_audio=True).first()
-    text = pipe(audio)['text']
     return text
-with gr.Blocks() as demo:
-    with gr.Tab('Live audio'):
-        iface = gr.Interface(
-            fn=live_performance,
-            inputs=gr.Audio(source="microphone", type="filepath"),
-            outputs="text",
-            title="Whisper Small Swedish",
-            description="Real-time demo for swedish speech recognition using a fine-tuned Whisper small model."
-        )
-    with gr.Tab('Transcription from URL'):
-        iface = gr.Interface(
-            fn=url_performance,
-            inputs=gr.Textbox(label='Paste the UL here'),
-            outputs="text",
-            title="Whisper Small Swedish",
-            description="Real-time demo for swedish speech recognition using a fine-tuned Whisper small model."
-        )
 demo.launch()

 from transformers import pipeline
 import gradio as gr
 from pytube import YouTube
+import os
+# Build the pipeline once at import time from the model id alone (no task is
+# passed); the transcribe_* handlers below all reuse this single instance.
+pipe = pipeline(model="CsanadT/whisper_small_sv")
+def transcribe_live(audio):
+    """Transcribe a recording and return the recognised text.
+
+    Args:
+        audio: Value forwarded unchanged to ``pipe``. ``voice_demo`` wires
+            this handler to a microphone input declared with
+            ``type="filepath"``.
+
+    Returns:
+        The ``"text"`` entry of the pipeline result.
+    """
+    return pipe(audio)["text"]
+def transcribe_url(url):
+    """Download the audio track of a YouTube video and transcribe it.
+
+    Args:
+        url: Address of the video; coerced to ``str`` before use.
+
+    Returns:
+        The ``"text"`` entry of the pipeline result for the downloaded file.
+
+    Raises:
+        ValueError: If the video exposes no audio-only stream.
+    """
+    youtube = YouTube(str(url))
+    stream = youtube.streams.filter(only_audio=True).first()
+    # ``first()`` yields None when the filter matches nothing; fail with a
+    # readable message instead of an AttributeError on ``.download``.
+    if stream is None:
+        raise ValueError("No audio-only stream is available for this video")
+    # ``download`` returns the path of the file written under ``yt_video``.
+    audio = stream.download('yt_video')
+    try:
+        text = pipe(audio)["text"]
+    finally:
+        # Delete the download so repeated requests do not fill the disk.
+        os.remove(audio)
     return text
+def transcribe_file(audio):
+    """Transcribe an uploaded clip delivered as a ``(rate, samples)`` pair.
+
+    Args:
+        audio: Tuple of sample rate and sample array, or ``None`` when the
+            form is submitted without a file.
+
+    Returns:
+        The ``"text"`` entry of the pipeline result, or an empty string when
+        no audio was supplied.
+    """
+    if audio is None:
+        return ""
+    rate, y = audio
+    # The pipeline expects single-channel input, so average the channels.
+    # Assumes a (samples, channels) layout for multi-channel clips -- TODO confirm.
+    if y.ndim > 1:
+        y = y.mean(axis=1)
+    # Convert to float and scale into [-1, 1]; the raw array may be integer PCM.
+    y = y.astype("float32")
+    peak = abs(y).max() if y.size else 0.0
+    if peak > 0:
+        y = y / peak
+    # Pass the sample rate along so the pipeline knows the source rate
+    # instead of assuming the samples already match the model's rate.
+    text = pipe({"sampling_rate": rate, "raw": y})["text"]
+    return text
+# Tab that takes a video URL as plain text and shows the transcript.
+url_demo = gr.Interface(
+    fn=transcribe_url,
+    inputs="text",
+    outputs="text",
+    title="Swedish Whisper",
+    description="Fine-tuned Whisper model for swedish audio transcription",
+)
+# Tab that records from the microphone; ``type="filepath"`` means the handler
+# receives a path to the recording rather than raw samples.
+voice_demo = gr.Interface(
+    title="Whisper Swedish",
+    description="Fine-tuned Whisper model for swedish audio transcription",
+    fn=transcribe_live,
+    inputs=gr.Audio(source="microphone", type="filepath"),
+    outputs="text",
+)
+# Tab for uploaded audio files. ``file_count`` is a ``gr.File`` option, not a
+# ``gr.Audio`` parameter, so the input is declared explicitly instead:
+# ``type="numpy"`` delivers the ``(rate, samples)`` pair that
+# ``transcribe_file`` unpacks.
+file_demo = gr.Interface(
+    fn=transcribe_file,
+    inputs=gr.Audio(source="upload", type="numpy"),
+    outputs="text",
+    title="Swedish Whisper",
+    description="Fine-tuned Whisper model for swedish audio transcription",
+)
+# One tab label per interface, in the same order as the interface list; the
+# previous two-label list left ``file_demo`` without a tab name.
+demo = gr.TabbedInterface(
+    [url_demo, voice_demo, file_demo],
+    ["YouTube Video to Text", "Audio to Text", "Audio File to Text"],
+)
 demo.launch()