on1onmangoes committed on
Commit
8e06021
1 Parent(s): 2e4be4a

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +11 -3
app.py CHANGED
@@ -10,11 +10,15 @@ from pyannote.audio import Audio
10
  from pyannote.core import Segment
11
  import gradio as gr
12
 
 
13
  import yt_dlp as youtube_dl
14
  from gradio_client import Client
15
- from pyannote.audio import Pipeline
16
  from transformers.pipelines.audio_utils import ffmpeg_read
17
 
 
 
 
 
18
  HF_TOKEN = "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"
19
  # set up the diarization pipeline
20
  diarization_pipeline = Pipeline.from_pretrained("pyannote/speaker-diarization-3.0", use_auth_token=HF_TOKEN)
@@ -30,8 +34,12 @@ def transcribe(audio_path, task="transcribe", group_by_speaker=True, progress=gr
30
 
31
  # run diarization while we wait for Whisper JAX
32
  progress(0, desc="Diarizing...")
33
- diarization = diarization_pipeline(audio_path)
34
- segments = diarization.for_json()["content"]
 
 
 
 
35
 
36
  transcription = segments
37
 
 
10
  from pyannote.core import Segment
11
  import gradio as gr
12
 
13
+
14
  import yt_dlp as youtube_dl
15
  from gradio_client import Client
 
16
  from transformers.pipelines.audio_utils import ffmpeg_read
17
 
18
+ import pyannote.core.json
19
+
20
+
21
+
22
  HF_TOKEN = "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"
23
  # set up the diarization pipeline
24
  diarization_pipeline = Pipeline.from_pretrained("pyannote/speaker-diarization-3.0", use_auth_token=HF_TOKEN)
 
34
 
35
  # run diarization while we wait for Whisper JAX
36
  progress(0, desc="Diarizing...")
37
+ # diarization = diarization_pipeline(audio_path)
38
+ # segments = diarization.for_json()["content"]
39
+
40
+ # convert diarization to JSON
41
+ diarization_json = pyannote.core.json.for_json(diarization)
42
+ segments = diarization_json["content"]
43
 
44
  transcription = segments
45