Spaces:

aseifert
/

ffpub-transcription

Runtime error

File size: 2,965 Bytes

8fc7f5c
e414a67
b602cc6
8fc7f5c
a9bf4b2
 
8fc7f5c
56cc953
8fc7f5c
a9bf4b2
 
 
 
 
e414a67
8930d8d
 
a9bf4b2
 
e414a67
 
 
 
 
 
 
 
a9bf4b2
e414a67
 
 
 
 
 
a9bf4b2
e414a67
 
 
 
 
 
 
 
 
 
 
 
 
d8a8864
 
e414a67
 
 
a9bf4b2
 
8930d8d
e414a67
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
8930d8d
e414a67
a9bf4b2
 
e414a67
 
 
 
 
 
 
a9bf4b2
 
5d9101b

import base64
import json
import os

import modal
import streamlit as st
from loguru import logger
from pydub import AudioSegment

run_transcription = modal.lookup("ffpub-transcription", "run_transcription")

st.set_page_config(page_title="Speech to Text Transcription App")


@st.cache(show_spinner=False)
def transcribe(url, audio_b64, cutoff):
    return run_transcription.call(url=url, audio_b64=audio_b64, cutoff=None)


def password_is_correct(password):
    return password in [os.environ["PASSWORD"], os.environ["ROOT_PASSWORD"]]


def input_is_ready(password, audio_file, url):
    return password_is_correct(password) and (audio_file or url)


def run():
    submit_button = False
    if "is_expanded" not in st.session_state:
        st.session_state["is_expanded"] = True

    # expander = st.expander("Einstellungen", expanded=st.session_state["is_expanded"])
    # with expander:
    password = st.text_input("Zugriffscode (siehe oben)")
    url = audio_file = None

    col1, col2 = st.columns([1, 3])
    type = col1.radio("", ["URL", "Datei-Upload"])
    if type == "URL":
        url = col2.text_input(
            "URL (e.g. YouTube video, Dropbox file, etc.)",
            value="",
        )
    else:
        audio_file = col2.file_uploader(
            "Datei auswählen", type=[".wav", ".mp3", ".flac", ".m4a", ".ogg"]
        )

    submit_button = col2.button(
        label="⚡ Transkribieren"
        + (" (Zugriffscode inkorrekt)" if not password_is_correct(password) else ""),
        disabled=(not password_is_correct(password) or (not audio_file and not url)),
    )

    cutoff = audio_b64 = None
    if audio_file or url:
        with st.expander("Medien-Preview"):
            if audio_file:
                st.audio(audio_file)
                cutoff = None if password == os.environ["ROOT_PASSWORD"] else 60_000
                audio_file = AudioSegment.from_file(audio_file)[:cutoff]
                audio_b64 = base64.b64encode(audio_file.export().read()).decode("ascii")
            if url:
                st.video(url)

    if input_is_ready(password, audio_file, url) and submit_button:
        # my_bar = st.progress(0)
        # for percent_complete in range(100):
        #     time.sleep(1)
        #     my_bar.progress(percent_complete + 1)

        with st.spinner("Transkription läuft..."):
            transcription = transcribe(url, audio_b64, cutoff)

        for seg in transcription["text"].split("\n\n"):
            st.write(seg)

        st.download_button(
            label="OTR-Datei herunterladen",
            data=json.dumps(transcription["otr"], indent=2, ensure_ascii=False),
            file_name="transkript.otr",
            mime="application/json",
        )


try:
    run()
except Exception as e:
    logger.error(e)
    st.error(
        "Leider ist ein unerwarter Fehler aufgetreten. Ich könnte mir das Problem sofort ansehen, Sie erreichen mich unter alexander.seifert@gmail.com"
    )