Spaces:

aadnk
/

whisper-webui

Running

App Files Community

aadnk committed on Sep 26, 2022

Commit

533d92e

•

1 Parent(s): 4514e2e

Also delete uploaded files to save space

Browse files

Files changed (1) hide show

app.py +38 -27

app.py CHANGED Viewed

@@ -21,6 +21,9 @@ from utils import slugify, write_srt, write_vtt
 # Limitations (set to -1 to disable)
 DEFAULT_INPUT_AUDIO_MAX_DURATION = 600 # seconds
 LANGUAGES = [
  "English", "Chinese", "German", "Spanish", "Russian", "Korean",
  "French", "Japanese", "Portuguese", "Turkish", "Polish", "Catalan",
@@ -49,40 +52,48 @@ class UI:
     def transcribeFile(self, modelName, languageName, urlData, uploadFile, microphoneData, task):
         source, sourceName = getSource(urlData, uploadFile, microphoneData)
-        selectedLanguage = languageName.lower() if len(languageName) > 0 else None
-        selectedModel = modelName if modelName is not None else "base"
-        if self.inputAudioMaxDuration > 0:
-            # Calculate audio length
-            audioDuration = ffmpeg.probe(source)["format"]["duration"]
-            if float(audioDuration) > self.inputAudioMaxDuration:
-                return ("[ERROR]: Maximum audio file length is " + str(self.inputAudioMaxDuration) + "s, file was " + str(audioDuration) + "s"), "[ERROR]"
-        model = model_cache.get(selectedModel, None)
-        if not model:
-            model = whisper.load_model(selectedModel)
-            model_cache[selectedModel] = model
-        # The results
-        result = model.transcribe(source, language=selectedLanguage, task=task)
-        text = result["text"]
-        vtt = getSubs(result["segments"], "vtt")
-        srt = getSubs(result["segments"], "srt")
-        # Files that can be downloaded
-        downloadDirectory = tempfile.mkdtemp()
-        filePrefix = slugify(sourceName, allow_unicode=True)
-        download = []
-        download.append(createFile(srt, downloadDirectory, filePrefix + "-subs.srt"));
-        download.append(createFile(vtt, downloadDirectory, filePrefix + "-subs.vtt"));
-        download.append(createFile(text, downloadDirectory, filePrefix + "-transcript.txt"));
-        return download, text, vtt
 def getSource(urlData, uploadFile, microphoneData):
     if urlData:

 # Limitations (set to -1 to disable)
 DEFAULT_INPUT_AUDIO_MAX_DURATION = 600 # seconds
+# Whether or not to automatically delete all uploaded files, to save disk space
+DELETE_UPLOADED_FILES = True
 LANGUAGES = [
  "English", "Chinese", "German", "Spanish", "Russian", "Korean",
  "French", "Japanese", "Portuguese", "Turkish", "Polish", "Catalan",
     def transcribeFile(self, modelName, languageName, urlData, uploadFile, microphoneData, task):
         source, sourceName = getSource(urlData, uploadFile, microphoneData)
+        try:
+            selectedLanguage = languageName.lower() if len(languageName) > 0 else None
+            selectedModel = modelName if modelName is not None else "base"
+            if self.inputAudioMaxDuration > 0:
+                # Calculate audio length
+                audioDuration = ffmpeg.probe(source)["format"]["duration"]
+                if float(audioDuration) > self.inputAudioMaxDuration:
+                    return ("[ERROR]: Maximum audio file length is " + str(self.inputAudioMaxDuration) + "s, file was " + str(audioDuration) + "s"), "[ERROR]"
+            model = model_cache.get(selectedModel, None)
+            if not model:
+                model = whisper.load_model(selectedModel)
+                model_cache[selectedModel] = model
+            # The results
+            result = model.transcribe(source, language=selectedLanguage, task=task)
+            text = result["text"]
+            vtt = getSubs(result["segments"], "vtt")
+            srt = getSubs(result["segments"], "srt")
+            # Files that can be downloaded
+            downloadDirectory = tempfile.mkdtemp()
+            filePrefix = slugify(sourceName, allow_unicode=True)
+            download = []
+            download.append(createFile(srt, downloadDirectory, filePrefix + "-subs.srt"));
+            download.append(createFile(vtt, downloadDirectory, filePrefix + "-subs.vtt"));
+            download.append(createFile(text, downloadDirectory, filePrefix + "-transcript.txt"));
+            return download, text, vtt
+        finally:
+            # Cleanup source
+            if DELETE_UPLOADED_FILES:
+                print("Deleting source file " + source)
+                os.remove(source)
 def getSource(urlData, uploadFile, microphoneData):
     if urlData: