Spaces:

esnagy
/

hungarian_speech_transcriber

Runtime error

Edward Nagy committed on Dec 2, 2023

Commit

623ac6b

•

1 Parent(s): dd3ed35

Update video transcription functionality

Files changed (1) hide show

app.py CHANGED Viewed

@@ -1,24 +1,38 @@
 from transformers import pipeline
 import gradio as gr
-import moviepy.editor as mp
 import os
 # pipe = pipeline(model="esnagy/whisper-small-hu")
 def transcribe(video_url):
-    video = mp.VideoFileClip(video_url)
     audio = video.audio
     audio_file = "temp_audio.wav"
     audio.write_audiofile(audio_file, codec='pcm_s16le')
     text = "Test text"
     # text = pipe(audio_file)["text"]
-    # Remove temporary audio file after transcription
     os.remove(audio_file)
     return text
 iface = gr.Interface(
-    fn=transcribe,
-    inputs=gr.Textbox(label="Enter video URL"),
     outputs="text",
     title="Whisper Small Hungarian",
     description="Realtime demo for Hungarian speech recognition using a fine-tuned Whisper small model. Enter a video URL to transcribe its audio.",

 from transformers import pipeline
 import gradio as gr
+import requests
+from moviepy.editor import *
 import os
 # pipe = pipeline(model="esnagy/whisper-small-hu")
 def transcribe(video_url):
     """Download the video at *video_url*, extract its audio and transcribe it.

     The video and the extracted WAV file live in a private temporary
     directory that is removed when the function exits, whether it
     returns normally or raises. This also keeps concurrent requests from
     overwriting each other's files.

     Args:
         video_url: HTTP(S) URL of the video file to download.

     Returns:
         The transcription text. The model call is currently disabled, so
         this is the placeholder string "Test text".

     Raises:
         requests.RequestException: if the download fails, times out, or
             the server answers with an error status.
         ValueError: if the downloaded video has no audio track.
     """
     import tempfile

     with tempfile.TemporaryDirectory() as workdir:
         video_filename = os.path.join(workdir, "temp_video.mp4")
         audio_file = os.path.join(workdir, "temp_audio.wav")

         # Stream the download to disk so a large video is never held fully
         # in memory, and fail early on HTTP errors instead of handing an
         # error page to the video decoder.
         with requests.get(video_url, stream=True, timeout=30) as response:
             response.raise_for_status()
             with open(video_filename, 'wb') as f:
                 for chunk in response.iter_content(chunk_size=1 << 20):
                     f.write(chunk)

         # Load the video using moviepy
         video = VideoFileClip(video_filename)
         try:
             audio = video.audio
             if audio is None:
                 raise ValueError("The video has no audio track to transcribe.")
             audio.write_audiofile(audio_file, codec='pcm_s16le')

             # Transcribe the audio
             text = "Test text"
             # text = pipe(audio_file)["text"]
         finally:
             # Release the clip's reader before the temporary directory is
             # deleted; an open handle can block the cleanup on some platforms.
             video.close()

     return text
 iface = gr.Interface(
+    fn=transcribe,
+    inputs=gr.Textbox(label="Enter video URL"),
     outputs="text",
     title="Whisper Small Hungarian",
     description="Realtime demo for Hungarian speech recognition using a fine-tuned Whisper small model. Enter a video URL to transcribe its audio.",