whisper-webui-translate

Running

avans06 committed on Dec 17, 2023

Commit

2def7a1

1 Parent(s): ec7cc5c

Fixed the Whisper unexpected-keyword-argument error and the original.srt format:

1. Fixed the error "WhisperModel.transcribe() got an unexpected keyword argument 'whisperSegmentsFilter'".

2. Fixed the incorrect format of the generated original-language subtitle file (original.srt) when the translation model is enabled.

Files changed (2) hide show

app.py +8 -6
src/utils.py +5 -6

app.py CHANGED Viewed

@@ -255,7 +255,7 @@ class WhisperTranscriber:
             self.whisperSegmentsFilters: List[List] = []
             inputFilter: bool = decodeOptions.pop("whisperSegmentsFilter", None)
             inputFilters = []
-            for idx in range(0,len(self.app_config.whisper_segments_filters),1):
                 inputFilters.append(decodeOptions.pop(f"whisperSegmentsFilter{idx}", None))
             inputFilters = filter(None, inputFilters)
             if inputFilter:
@@ -1064,12 +1064,12 @@ def create_ui(app_config: ApplicationConfig):
             with gr.Column():
                 simpleOutput = common_output()
         gr.Markdown(uiArticle)
-        if translateModelMd is not None:
-            with gr.Accordion("docs/translateModel.md", open=False):
-                gr.Markdown(translateModelMd)
         if optionsMd is not None:
             with gr.Accordion("docs/options.md", open=False):
                 gr.Markdown(optionsMd)
         if readmeMd is not None:
             with gr.Accordion("README.md", open=False):
                 gr.Markdown(readmeMd)
@@ -1158,11 +1158,13 @@ def create_ui(app_config: ApplicationConfig):
                         fullInputDict.update(common_translation_inputs())
             with gr.Column():
                 fullOutput = common_output()
-        with gr.Accordion("Article"):
-            gr.Markdown(uiArticle)
         if optionsMd is not None:
             with gr.Accordion("docs/options.md", open=False):
                 gr.Markdown(optionsMd)
         if readmeMd is not None:
             with gr.Accordion("README.md", open=False):
                 gr.Markdown(readmeMd)

             self.whisperSegmentsFilters: List[List] = []
             inputFilter: bool = decodeOptions.pop("whisperSegmentsFilter", None)
             inputFilters = []
+            for idx in range(1,len(self.app_config.whisper_segments_filters) + 1,1):
                 inputFilters.append(decodeOptions.pop(f"whisperSegmentsFilter{idx}", None))
             inputFilters = filter(None, inputFilters)
             if inputFilter:
             with gr.Column():
                 simpleOutput = common_output()
         gr.Markdown(uiArticle)
         if optionsMd is not None:
             with gr.Accordion("docs/options.md", open=False):
                 gr.Markdown(optionsMd)
+        if translateModelMd is not None:
+            with gr.Accordion("docs/translateModel.md", open=False):
+                gr.Markdown(translateModelMd)
         if readmeMd is not None:
             with gr.Accordion("README.md", open=False):
                 gr.Markdown(readmeMd)
                         fullInputDict.update(common_translation_inputs())
             with gr.Column():
                 fullOutput = common_output()
+        gr.Markdown(uiArticle)
         if optionsMd is not None:
             with gr.Accordion("docs/options.md", open=False):
                 gr.Markdown(optionsMd)
+        if translateModelMd is not None:
+            with gr.Accordion("docs/translateModel.md", open=False):
+                gr.Markdown(translateModelMd)
         if readmeMd is not None:
             with gr.Accordion("README.md", open=False):
                 gr.Markdown(readmeMd)

src/utils.py CHANGED Viewed

@@ -133,12 +133,11 @@ def write_srt_original(transcript: Iterator[dict], file: TextIO,
         if original is not None: print(f"{original}",
             file=file,
             flush=True)
-        if bilingual:
-            text = segment['text'].replace('-->', '->')
-            print(f"{text}\n",
-            file=file,
-            flush=True)
 def __subtitle_preprocessor_iterator(transcript: Iterator[dict], maxLineWidth: int = None, highlight_words: bool = False):
     for segment in transcript:

         if original is not None: print(f"{original}",
             file=file,
             flush=True)
+        text = segment['text'].replace('-->', '->')
+        print(f"{text}\n" if bilingual else "",
+        file=file,
+        flush=True)
 def __subtitle_preprocessor_iterator(transcript: Iterator[dict], maxLineWidth: int = None, highlight_words: bool = False):
     for segment in transcript: