Spaces:

salmanmapkar
/

audio-video-transcriber

Runtime error

salmanmapkar committed on Dec 25, 2022

Commit

83cf0f6

•

1 Parent(s): c757073

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -17,7 +17,7 @@ import moviepy.editor as mp
 import datetime
 import torch
 import pyannote.audio
-from pyannote.audio.pipelines.speaker_verification import PyannoteAudioPretrainedSpeakerEmbedding
 from pyannote.audio import Audio
 from pyannote.core import Segment
 import wave
@@ -141,11 +141,11 @@ def Transcribe_V1(NumberOfSpeakers, SpeakerNames="", audio="temp_audio.wav"):
 def Transcribe_V2(num_speakers, speaker_names, audio="temp_audio.wav"):
     model = whisper.load_model("medium")
-    embedding_model = PyannoteAudioPretrainedSpeakerEmbedding("pyannote/embedding",use_auth_token="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")
-    # embedding_model = PretrainedSpeakerEmbedding(
-    #     "speechbrain/spkrec-ecapa-voxceleb",
-    #     device = torch.device('cuda' if torch.cuda.is_available() else 'cpu')
-    # )
     SPEAKER_DICT = {}
     SPEAKERS = [speaker.strip() for speaker in speaker_names.split(',') if len(speaker)]
     def GetSpeaker(sp):

 import datetime
 import torch
 import pyannote.audio
+from pyannote.audio.pipelines.speaker_verification import SpeechBrainPretrainedSpeakerEmbedding #PyannoteAudioPretrainedSpeakerEmbedding
 from pyannote.audio import Audio
 from pyannote.core import Segment
 import wave
 def Transcribe_V2(num_speakers, speaker_names, audio="temp_audio.wav"):
     model = whisper.load_model("medium")
+    # embedding_model = SpeechBrainPretrainedSpeakerEmbedding("speechbrain/spkrec-ecapa-voxceleb")
+    embedding_model = SpeechBrainPretrainedSpeakerEmbedding(
+        "speechbrain/spkrec-ecapa-voxceleb",
+        device = torch.device('cuda' if torch.cuda.is_available() else 'cpu')
+    )
     SPEAKER_DICT = {}
     SPEAKERS = [speaker.strip() for speaker in speaker_names.split(',') if len(speaker)]
     def GetSpeaker(sp):