Spaces:

Madhuslista
/

whisper_wrapper

Sleeping

Madhuslista committed on Nov 25, 2023

Commit

8ee91c9

1 Parent(s): 138226e

Feature: Add time measurements

Files changed (1) hide show

lib/model.py CHANGED Viewed

@@ -2,6 +2,7 @@
 # -*- coding: utf-8 -*-
 import gc
 import torch
 import whisperx as wx
@@ -27,13 +28,25 @@ def transcribe_audio(audio_file, audio_path, transcript_folder_path):
     # Transcribe the audio
     print("Starting transcription...")
     print("Loading model...")
     model = wx.load_model("large-v2", device=DEVICE, compute_type=COMPUTE_TYPE, language="en")
     print("Loading audio...")
     audio = wx.load_audio(audio_path)
     print("Transcribing...")
     result = model.transcribe(audio, batch_size=BATCH_SIZE)
     print("Transcription complete!")
     # Save the transcript to a file
     text = "\n ".join([i["text"] for i in result["segments"]])

 # -*- coding: utf-8 -*-
 import gc
+from time import time
 import torch
 import whisperx as wx
     # Transcribe the audio
     print("Starting transcription...")
     print("Loading model...")
+    time_1 = time()
     model = wx.load_model("large-v2", device=DEVICE, compute_type=COMPUTE_TYPE, language="en")
+    time_2 = time()
     print("Loading audio...")
+    time_3 = time()
     audio = wx.load_audio(audio_path)
+    time_4 = time()
     print("Transcribing...")
+    time_5 = time()
     result = model.transcribe(audio, batch_size=BATCH_SIZE)
+    time_6 = time()
     print("Transcription complete!")
+    print("\nTime Report:   ")
+    print("Loading model:   ", round(time_2 - time_1,2), " [s]")
+    print("Loading audio:   ", round(time_4 - time_3,2), " [s]")
+    print("Transcribing:    ", round(time_6 - time_5,2), " [s]")
+    print("Total:           ", round(time_6 - time_1,2), " [s]")
     # Save the transcript to a file
     text = "\n ".join([i["text"] for i in result["segments"]])