Whisper-Auto-Subtitled-Video-Generator

Paused

App Files Community

BatuhanYilmaz committed on Nov 6, 2022

Commit

9aaeafd

•

1 Parent(s): f33d1e7

.

Browse files

Files changed (3) hide show

pages/02_📼_Upload_Video_File.py +5 -14
pages/03_📝_Upload_Video_File_and_Transcript.py +0 -137
pages/{04_🔊_Upload_Audio_File.py → 03_🔊_Upload_Audio_File.py} +4 -13

pages/02_📼_Upload_Video_File.py CHANGED Viewed

@@ -9,8 +9,6 @@ from io import StringIO
 import numpy as np
 import pathlib
 import os
-import components.authenticate as authenticate
-import torch
 st.set_page_config(page_title="Auto Subtitled Video Generator", page_icon=":movie_camera:", layout="wide")
@@ -51,10 +49,8 @@ with col2:
 @st.cache(allow_output_mutation=True)
 def change_model(current_size, size):
-    torch.cuda.is_available()
-    DEVICE = "cuda" if torch.cuda.is_available() else "cpu"
     if current_size != size:
-        loaded_model = whisper.load_model(size, device=DEVICE)
         return loaded_model
     else:
         raise Exception("Model size is the same as the current size.")
@@ -102,7 +98,7 @@ def getSubs(segments: Iterator[dict], format: str, maxLineWidth: int) -> str:
 def generate_subtitled_video(video, audio, transcript):
     video_file = ffmpeg.input(video)
     audio_file = ffmpeg.input(audio)
-    ffmpeg.concat(video_file.filter("subtitles", transcript), audio_file, v=1, a=1).output("final.mp4").global_args('-report').run(quiet=True, overwrite_output=True)
     video_with_subs = open("final.mp4", "rb")
     return video_with_subs
@@ -112,7 +108,7 @@ def main():
     loaded_model = change_model(current_size, size)
     st.write(f"Model is {'multilingual' if loaded_model.is_multilingual else 'English-only'} "
         f"and has {sum(np.prod(p.shape) for p in loaded_model.parameters()):,} parameters.")
-    input_file = st.file_uploader("Upload Video File", type=["mp4", "avi", "mov", "mkv"])
     # get the name of the input_file
     if input_file is not None:
         filename = input_file.name[:-4]
@@ -230,10 +226,5 @@ def main():
 if __name__ == "__main__":
-    authenticate.set_st_state_vars()
-    if st.session_state["authenticated"]:
-        main()
-        authenticate.button_logout()
-    else:
-        st.info("Please log in or sign up to use the app.")
-        authenticate.button_login()

 import numpy as np
 import pathlib
 import os
 st.set_page_config(page_title="Auto Subtitled Video Generator", page_icon=":movie_camera:", layout="wide")
 @st.cache(allow_output_mutation=True)
 def change_model(current_size, size):
     if current_size != size:
+        loaded_model = whisper.load_model(size)
         return loaded_model
     else:
         raise Exception("Model size is the same as the current size.")
 def generate_subtitled_video(video, audio, transcript):
     video_file = ffmpeg.input(video)
     audio_file = ffmpeg.input(audio)
+    ffmpeg.concat(video_file.filter("subtitles", transcript), audio_file, v=1, a=1).output("final.mp4").run(quiet=True, overwrite_output=True)
     video_with_subs = open("final.mp4", "rb")
     return video_with_subs
     loaded_model = change_model(current_size, size)
     st.write(f"Model is {'multilingual' if loaded_model.is_multilingual else 'English-only'} "
         f"and has {sum(np.prod(p.shape) for p in loaded_model.parameters()):,} parameters.")
+    input_file = st.file_uploader("File", type=["mp4", "avi", "mov", "mkv"])
     # get the name of the input_file
     if input_file is not None:
         filename = input_file.name[:-4]
 if __name__ == "__main__":
+    main()
+    st.markdown("###### Made with :heart: by [@BatuhanYılmaz](https://twitter.com/batuhan3326) [![this is an image link](https://i.imgur.com/thJhzOO.png)](https://www.buymeacoffee.com/batuhanylmz)")

pages/03_📝_Upload_Video_File_and_Transcript.py DELETED Viewed

@@ -1,137 +0,0 @@
-import streamlit as st
-from streamlit_lottie import st_lottie
-from utils import write_vtt, write_srt
-import ffmpeg
-import requests
-from typing import Iterator
-from io import StringIO
-import numpy as np
-import pathlib
-import os
-import components.authenticate as authenticate
-st.set_page_config(page_title="Auto Subtitled Video Generator", page_icon=":movie_camera:", layout="wide")
-# Define a function that we can use to load lottie files from a link.
-@st.cache(allow_output_mutation=True)
-def load_lottieurl(url: str):
-    r = requests.get(url)
-    if r.status_code != 200:
-        return None
-    return r.json()
-APP_DIR = pathlib.Path(__file__).parent.absolute()
-LOCAL_DIR = APP_DIR / "local_transcript"
-LOCAL_DIR.mkdir(exist_ok=True)
-save_dir = LOCAL_DIR / "output"
-save_dir.mkdir(exist_ok=True)
-col1, col2 = st.columns([1, 3])
-with col1:
-    lottie = load_lottieurl("https://assets6.lottiefiles.com/packages/lf20_cjnxwrkt.json")
-    st_lottie(lottie)
-with col2:
-    st.write("""
-    ## Auto Subtitled Video Generator
-    ##### ➠ Upload a video file and a transcript as .srt or .vtt file and get a video with subtitles.
-    ##### ➠ Processing time will increase as the video length increases. """)
-def getSubs(segments: Iterator[dict], format: str, maxLineWidth: int) -> str:
-    segmentStream = StringIO()
-    if format == 'vtt':
-        write_vtt(segments, file=segmentStream, maxLineWidth=maxLineWidth)
-    elif format == 'srt':
-        write_srt(segments, file=segmentStream, maxLineWidth=maxLineWidth)
-    else:
-        raise Exception("Unknown format " + format)
-    segmentStream.seek(0)
-    return segmentStream.read()
-def split_video_audio(uploaded_file):
-    with open(f"{save_dir}/input.mp4", "wb") as f:
-            f.write(uploaded_file.read())
-    audio = ffmpeg.input(f"{save_dir}/input.mp4")
-    audio = ffmpeg.output(audio, f"{save_dir}/output.wav", acodec="pcm_s16le", ac=1, ar="16k")
-    ffmpeg.run(audio, overwrite_output=True)
-def main():
-    uploaded_video = st.file_uploader("Upload Video File", type=["mp4", "avi", "mov", "mkv"])
-    # get the name of the input_file
-    if uploaded_video is not None:
-        filename = uploaded_video.name[:-4]
-    else:
-        filename = None
-    transcript_file = st.file_uploader("Upload Transcript File", type=["srt", "vtt"])
-    if transcript_file is not None:
-        transcript_name = transcript_file.name
-    else:
-        transcript_name = None
-    if uploaded_video is not None and transcript_file is not None:
-        if transcript_name[-3:] == "vtt":
-            with open("uploaded_transcript.vtt", "wb") as f:
-                f.writelines(transcript_file)
-                f.close()
-            with open(os.path.join(os.getcwd(), "uploaded_transcript.vtt"), "rb") as f:
-                vtt_file = f.read()
-            if st.button("Generate Video with Subtitles"):
-                with st.spinner("Generating Subtitled Video"):
-                    split_video_audio(uploaded_video)
-                    video_file = ffmpeg.input(f"{save_dir}/input.mp4")
-                    audio_file = ffmpeg.input(f"{save_dir}/output.wav")
-                    ffmpeg.concat(video_file.filter("subtitles", "uploaded_transcript.vtt"), audio_file, v=1, a=1).output("final.mp4").global_args('-report').run(quiet=True, overwrite_output=True)
-                    video_with_subs = open("final.mp4", "rb")
-                col3, col4 = st.columns(2)
-                with col3:
-                    st.video(uploaded_video)
-                with col4:
-                    st.video(video_with_subs)
-                st.download_button(label="Download Video with Subtitles",
-                                    data=video_with_subs,
-                                    file_name=f"{filename}_with_subs.mp4")
-        elif transcript_name[-3:] == "srt":
-            with open("uploaded_transcript.srt", "wb") as f:
-                f.writelines(transcript_file)
-                f.close()
-            with open(os.path.join(os.getcwd(), "uploaded_transcript.srt"), "rb") as f:
-                srt_file = f.read()
-            if st.button("Generate Video with Subtitles"):
-                with st.spinner("Generating Subtitled Video"):
-                    split_video_audio(uploaded_video)
-                    video_file = ffmpeg.input(f"{save_dir}/input.mp4")
-                    audio_file = ffmpeg.input(f"{save_dir}/output.wav")
-                    ffmpeg.concat(video_file.filter("subtitles",  "uploaded_transcript.srt"), audio_file, v=1, a=1).output("final.mp4").run(quiet=True, overwrite_output=True)
-                    video_with_subs = open("final.mp4", "rb")
-                col3, col4 = st.columns(2)
-                with col3:
-                    st.video(uploaded_video)
-                with col4:
-                    st.video(video_with_subs)
-                st.download_button(label="Download Video with Subtitles",
-                                    data=video_with_subs,
-                                    file_name=f"{filename}_with_subs.mp4")
-        else:
-            st.error("Please upload a .srt or .vtt file")
-    else:
-        st.info("Please upload a video file and a transcript file")
-if __name__ == "__main__":
-    authenticate.set_st_state_vars()
-    if st.session_state["authenticated"]:
-        main()
-        authenticate.button_logout()
-    else:
-        st.info("Please log in or sign up to use the app.")
-        authenticate.button_login()

pages/{04_🔊_Upload_Audio_File.py → 03_🔊_Upload_Audio_File.py} RENAMED Viewed

@@ -9,8 +9,6 @@ from io import StringIO
 import numpy as np
 import pathlib
 import os
-import components.authenticate as authenticate
-import torch
 st.set_page_config(page_title="Auto Transcriber", page_icon="🔊", layout="wide")
@@ -50,10 +48,8 @@ current_size = "None"
 @st.cache(allow_output_mutation=True)
 def change_model(current_size, size):
-    torch.cuda.is_available()
-    DEVICE = "cuda" if torch.cuda.is_available() else "cpu"
     if current_size != size:
-        loaded_model = whisper.load_model(size, device=DEVICE)
         return loaded_model
     else:
         raise Exception("Model size is the same as the current size.")
@@ -102,7 +98,7 @@ def main():
     loaded_model = change_model(current_size, size)
     st.write(f"Model is {'multilingual' if loaded_model.is_multilingual else 'English-only'} "
         f"and has {sum(np.prod(p.shape) for p in loaded_model.parameters()):,} parameters.")
-    input_file = st.file_uploader("Upload Audio File", type=["mp3", "wav", "m4a"])
     if input_file is not None:
         filename = input_file.name[:-4]
     else:
@@ -205,10 +201,5 @@ def main():
 if __name__ == "__main__":
-    authenticate.set_st_state_vars()
-    if st.session_state["authenticated"]:
-        main()
-        authenticate.button_logout()
-    else:
-        st.info("Please log in or sign up to use the app.")
-        authenticate.button_login()

 import numpy as np
 import pathlib
 import os
 st.set_page_config(page_title="Auto Transcriber", page_icon="🔊", layout="wide")
 @st.cache(allow_output_mutation=True)
 def change_model(current_size, size):
     if current_size != size:
+        loaded_model = whisper.load_model(size)
         return loaded_model
     else:
         raise Exception("Model size is the same as the current size.")
     loaded_model = change_model(current_size, size)
     st.write(f"Model is {'multilingual' if loaded_model.is_multilingual else 'English-only'} "
         f"and has {sum(np.prod(p.shape) for p in loaded_model.parameters()):,} parameters.")
+    input_file = st.file_uploader("Upload an audio file", type=["mp3", "wav", "m4a"])
     if input_file is not None:
         filename = input_file.name[:-4]
     else:
 if __name__ == "__main__":
+    main()
+    st.markdown("###### Made with :heart: by [@BatuhanYılmaz](https://twitter.com/batuhan3326) [![this is an image link](https://i.imgur.com/thJhzOO.png)](https://www.buymeacoffee.com/batuhanylmz)")