Update audio2text/a2t.py
Browse files
- audio2text/a2t.py +3 -2
audio2text/a2t.py
CHANGED
@@ -3,6 +3,7 @@ import numpy as np
|
|
3 |
from .init import pipe
|
4 |
|
5 |
TASK = "transcribe"
|
|
|
6 |
|
7 |
class A2T:
|
8 |
def __init__(self, mic):
|
@@ -12,7 +13,7 @@ class A2T:
|
|
12 |
if inputs is None:
|
13 |
print("Inputs None")
|
14 |
|
15 |
-
transcribed_text = pipe(inputs, generate_kwargs={"task": task}, return_timestamps=True)["text"]
|
16 |
print("transcribed_text : ", transcribed_text)
|
17 |
return transcribed_text
|
18 |
|
@@ -20,7 +21,7 @@ class A2T:
|
|
20 |
try:
|
21 |
if self.mic is not None:
|
22 |
chunk = self.mic
|
23 |
-
audio = np.
|
24 |
print("audio : ", audio)
|
25 |
else:
|
26 |
return "please provide audio"
|
|
|
3 |
from .init import pipe
|
4 |
|
5 |
TASK = "transcribe"
|
6 |
+
BATCH_SIZE = 16
|
7 |
|
8 |
class A2T:
|
9 |
def __init__(self, mic):
|
|
|
13 |
if inputs is None:
|
14 |
print("Inputs None")
|
15 |
|
16 |
+
transcribed_text = pipe(inputs, batch_size=BATCH_SIZE, generate_kwargs={"task": task}, return_timestamps=True)["text"]
|
17 |
print("transcribed_text : ", transcribed_text)
|
18 |
return transcribed_text
|
19 |
|
|
|
21 |
try:
|
22 |
if self.mic is not None:
|
23 |
chunk = self.mic
|
24 |
+
audio = np.frombuffer(chunk, dtype=np.uint8)
|
25 |
print("audio : ", audio)
|
26 |
else:
|
27 |
return "please provide audio"
|