Update audio2text/a2t.py
audio2text/a2t.py  +4 -4
@@ -10,18 +10,18 @@ class A2T:
     def __init__(self, mic):
         self.mic = mic
 
-    def __transcribe(self, inputs, task: str = None):
+    def __transcribe(self, inputs, task: str = None, lang: str = "english"):
         if inputs is None:
             print("Inputs None")
 
-        transcribed_text = pipe(inputs, batch_size=BATCH_SIZE,)["text"]
+        transcribed_text = pipe(inputs, batch_size=BATCH_SIZE, generate_kwargs={"task": task, "language": lang}, return_timestamps=True)["text"]
         return transcribed_text
 
     def __preprocces(self, raw: np.ndarray, sampling_rate: int):
         chunk = raw.astype(np.float32) / 32678.0
 
-        if sampling_rate != 16000:
-            chunk = librosa.resample(chunk, orig_sr=sampling_rate, target_sr=16000)
+        # if sampling_rate != 16000:
+        #     chunk = librosa.resample(chunk, orig_sr=sampling_rate, target_sr=16000)
 
         # chunk = chunk[:16000*LIMIT]
 
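For context, a minimal sketch of how the updated __transcribe call might run end to end. `pipe` and `BATCH_SIZE` are defined elsewhere in a2t.py and are not shown in this hunk; the sketch assumes `pipe` is a Hugging Face transformers automatic-speech-recognition pipeline built on a Whisper checkpoint, since generate_kwargs={"task": ..., "language": ...} and return_timestamps=True match that API. The model name, batch size, and the standalone transcribe() wrapper below are illustrative placeholders, not the repository's actual values.

# Sketch only: assumes `pipe` is a transformers ASR pipeline (Whisper) and
# BATCH_SIZE is a module-level constant, as suggested by the diff above.
import numpy as np
from transformers import pipeline

BATCH_SIZE = 8  # assumed value for illustration
pipe = pipeline("automatic-speech-recognition", model="openai/whisper-small")  # assumed checkpoint

def transcribe(inputs, task: str = "transcribe", lang: str = "english"):
    if inputs is None:
        print("Inputs None")
        return ""
    # `inputs` may be a dict of {"raw": float32 array, "sampling_rate": int},
    # mirroring what __preprocces produces from raw microphone samples.
    return pipe(
        inputs,
        batch_size=BATCH_SIZE,
        generate_kwargs={"task": task, "language": lang},
        return_timestamps=True,
    )["text"]

# Example: one second of silence at 16 kHz, normalized the way __preprocces does.
# (Full-scale int16 normalization is usually / 32768.0; the diff uses 32678.0.)
raw = np.zeros(16000, dtype=np.int16)
chunk = raw.astype(np.float32) / 32768.0
print(transcribe({"raw": chunk, "sampling_rate": 16000}))

Because the resampling branch is now commented out, this sketch feeds the pipeline 16 kHz audio directly; if the microphone captures at another rate, the librosa.resample line from the diff would need to be restored.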