Spaces:

Madhuslista
/

whisper_wrapper

Sleeping

Madhuslista committed on Nov 25, 2023

Commit

df236d9

•

1 Parent(s): e43ce77

Refactor: Modify PIPE parameters

Files changed (1) hide show

lib/pipe.py CHANGED Viewed

@@ -5,6 +5,12 @@ from time import time
 from transformers import pipeline
 # -->> Tunables <<---------------------
 print("Loading model...")
@@ -13,6 +19,7 @@ PIPE = pipeline(
     task="automatic-speech-recognition",
     model="openai/whisper-large-v3",
     device_map="auto",
 )
 time_2 = time()
 print("Model loaded!")
@@ -26,7 +33,12 @@ def connect_to_pipe(audio_file, audio_path, transcript_folder_path):
     print("Transcribing...")
     time_3 = time()
-    result = PIPE(audio_path)
     time_4 = time()
     print("Transcription complete!")
@@ -36,8 +48,8 @@ def connect_to_pipe(audio_file, audio_path, transcript_folder_path):
     print("Total:           ", round(time_2 - time_1 + time_4 - time_3, 2), " [s]")
     # Save the transcript to a file
-    print(result)
     # text = "\n ".join([i["text"] for i in result["chunks"]])
     return result

 from transformers import pipeline
+from .config import (
+    DEVICE,
+    COMPUTE_TYPE,
+    BATCH_SIZE,
+)
 # -->> Tunables <<---------------------
 print("Loading model...")
     task="automatic-speech-recognition",
     model="openai/whisper-large-v3",
     device_map="auto",
+    chunk_length_s=30,
 )
 time_2 = time()
 print("Model loaded!")
     print("Transcribing...")
     time_3 = time()
+    result = PIPE(
+        audio_path,
+        batch_size=BATCH_SIZE,
+        generate_kwargs={"task": "transcribe"},
+        return_timestamps=True,
+    )
     time_4 = time()
     print("Transcription complete!")
     print("Total:           ", round(time_2 - time_1 + time_4 - time_3, 2), " [s]")
     # Save the transcript to a file
     # text = "\n ".join([i["text"] for i in result["chunks"]])
+    text = result['text']
     return result