salmanmapkar committed
Commit 65e44dc
1 Parent(s): eb1e73b

Update app.py

Files changed (1):
  app.py +2 -3
app.py CHANGED
@@ -25,7 +25,6 @@ import contextlib
 from sklearn.cluster import AgglomerativeClustering
 import numpy as np
 
-
 __FILES = set()
 
 
@@ -104,7 +103,7 @@ def Transcribe_V1(NumberOfSpeakers, SpeakerNames="", audio="temp_audio.wav"):
     return f"dz_{audio}.wav", dzList, segments
 
 def transcribe(dz_audio):
-    model = whisper.load_model("medium")
+    model = whisper.load_model("large_v2")
     result = model.transcribe(dz_audio)
     # for _ in result['segments']:
     #     print(_['start'], _['end'], _['text'])
@@ -139,7 +138,7 @@ def Transcribe_V1(NumberOfSpeakers, SpeakerNames="", audio="temp_audio.wav"):
 
 
 def Transcribe_V2(num_speakers, speaker_names, audio="temp_audio.wav"):
-    model = whisper.load_model("large")
+    model = whisper.load_model("large_v2")
     embedding_model = PretrainedSpeakerEmbedding(
         "speechbrain/spkrec-ecapa-voxceleb",
         device = torch.device('cuda' if torch.cuda.is_available() else 'cpu')
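
A note on the new checkpoint name: in the stock openai-whisper package, the large-v2 weights are registered as "large-v2" (hyphenated), so `whisper.load_model("large_v2")` raises a RuntimeError unless the Space pins a fork that accepts the underscore alias. A minimal defensive-loading sketch, assuming stock openai-whisper; the `load_whisper` helper is hypothetical and not part of this commit:

```python
# Hedged sketch, not from this commit: stock openai-whisper registers the
# checkpoint as "large-v2" (hyphen), so the committed "large_v2" string
# would raise a RuntimeError at load time.
import whisper

def load_whisper(name: str):
    """Hypothetical helper: load a checkpoint, normalizing underscores."""
    try:
        return whisper.load_model(name)
    except RuntimeError:
        # e.g. "large_v2" -> "large-v2"
        return whisper.load_model(name.replace("_", "-"))

model = load_whisper("large_v2")
result = model.transcribe("temp_audio.wav")
print(result["text"])
```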
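For context on the unchanged lines in the last hunk: the imports visible in this diff (AgglomerativeClustering, numpy, PretrainedSpeakerEmbedding) follow the common Whisper-plus-pyannote diarization pattern. A sketch of how they typically fit together, assuming pyannote.audio's PretrainedSpeakerEmbedding; `cluster_speakers` is a hypothetical helper, not code from this file:

```python
import numpy as np
import torch
from pyannote.audio.pipelines.speaker_verification import PretrainedSpeakerEmbedding
from sklearn.cluster import AgglomerativeClustering

# Embedding model as constructed in Transcribe_V2 (per the diff context).
embedding_model = PretrainedSpeakerEmbedding(
    "speechbrain/spkrec-ecapa-voxceleb",
    device=torch.device("cuda" if torch.cuda.is_available() else "cpu"),
)

def cluster_speakers(embeddings: np.ndarray, num_speakers: int) -> np.ndarray:
    """Hypothetical helper: map per-segment embeddings to speaker labels."""
    return AgglomerativeClustering(n_clusters=num_speakers).fit_predict(
        np.nan_to_num(embeddings)
    )
```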