Spaces:

aseifert
/

ffpub-transcription

Runtime error

App Files Community

Alexander Seifert committed on Jan 19, 2023

Commit

6e406cd

•

1 Parent(s): 721a7b8

add url option

Browse files

Files changed (1) hide show

app.py +14 -19

app.py CHANGED Viewed

@@ -84,38 +84,32 @@ def transcribe(audio=None, url=None):
     return response["modelOutputs"][0]
-def run_demo(password, microphone, file_upload):
     if password not in [os.environ["PASSWORD"], os.environ["ROOT_PASSWORD"]]:
         raise gr.Error("Der Zugriffscode ist falsch.")
-    if (microphone is not None) and (file_upload is not None):
         logger.warning(
-            "Achtung: Sie haben sowohl eine Datei hochgeladen als auch über das Mikrofon aufgenommen."
             " Wir verwenden nur die Datei, die Sie hochgeladen haben."
         )
-    elif (microphone is None) and (file_upload is None):
         raise gr.Error(
-            "Sie müssen entweder eine Datei hochladen oder über das Mikrofon aufnehmen."
         )
-    file = microphone if microphone is not None else file_upload
     start = time.time()
-    cutoff = None if password == os.environ["ROOT_PASSWORD"] else 60_000
-    transcription = transcribe(AudioSegment.from_file(file)[:cutoff])
-    segments = []
-    for seg in transcription["segments"]:
-        text = seg["text"].strip()
-        if not segments or segments[-1].text[-1] in ".:?!":
-            segments.append(Segment(text, seg["start"], seg["end"]))
-        else:
-            segments[-1].text += " " + text
     logger.info(f"transcription took {time.time()-start:.3f}s")
-    return "\n\n".join(str(s) for s in segments)
 demo = gr.Interface(
@@ -123,7 +117,8 @@ demo = gr.Interface(
     inputs=[
         # gr.Textbox(label="Email", type="email"),
         gr.Textbox(label="Zugriffscode (siehe oben)"),
-        gr.Audio(source="microphone", type="filepath", label="Aufnehmen"),
         gr.Audio(source="upload", type="filepath", label="Datei hochladen"),
     ],
     outputs=gr.Textbox(label="Automatisches Transkript"),

     return response["modelOutputs"][0]
+def run_demo(password, url, file_upload):
     if password not in [os.environ["PASSWORD"], os.environ["ROOT_PASSWORD"]]:
         raise gr.Error("Der Zugriffscode ist falsch.")
+    if (url is not None) and (file_upload is not None):
         logger.warning(
+            "Achtung: Sie haben sowohl eine URL angegeben als auch eine Datei hochgeladen."
             " Wir verwenden nur die Datei, die Sie hochgeladen haben."
         )
+    elif (url is None) and (file_upload is None):
         raise gr.Error(
+            "Sie müssen entweder eine URL angeben oder eine Datei hochladen."
         )
     start = time.time()
+    if file_upload is not None:
+        cutoff = None if password == os.environ["ROOT_PASSWORD"] else 60_000
+        audio = AudioSegment.from_file(file_upload, format="mp3")[:cutoff]
+        transcription = transcribe(audio=audio, url=None)
+    else:
+        transcription = transcribe(audio=None, url=url)
     logger.info(f"transcription took {time.time()-start:.3f}s")
+    return transcription["text"]
 demo = gr.Interface(
     inputs=[
         # gr.Textbox(label="Email", type="email"),
         gr.Textbox(label="Zugriffscode (siehe oben)"),
+        # gr.Audio(source="microphone", type="filepath", label="Aufnehmen"),
+        gr.Textbox(label="URL (z.B. YouTube-Video, Dropbox-Datei, etc.)"),
         gr.Audio(source="upload", type="filepath", label="Datei hochladen"),
     ],
     outputs=gr.Textbox(label="Automatisches Transkript"),