Spaces:

asif00
/

whisper-bangla

Running

asif00 committed on Jun 3, 2024

Commit

17c1345

verified ·

1 Parent(s): 5f3b06a

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -1,16 +1,36 @@
 from transformers import pipeline
 import gradio as gr
-pipe = pipeline(model="asif00/whisper-bangla")
 def transcribe(audio):
-    text = pipe(audio)["text"]
     return text
 iface = gr.Interface(
-    fn=transcribe,
     inputs=gr.Audio(sources="microphone", type="filepath"),
     outputs="text",
     title="Whisper Bangla",

+import spaces
 from transformers import pipeline
 import gradio as gr
+import torch
# Use the GPU when torch can see one, otherwise fall back to the CPU.
device = torch.device("cuda" if torch.cuda.is_available() else "cpu")

# transformers Pipeline objects have no `.to()` method; device placement is
# requested through the `device` argument of the `pipeline()` factory.
# `asr` is called on recorded audio and its "text" field is read.
asr = pipeline(model="asif00/whisper-bangla", device=device)

# `ser` post-processes the transcript with a text2text-generation model.
ser = pipeline(
    "text2text-generation",
    model="asif00/mbart_bn_error_correction",
    device=device,
)
@spaces.GPU
def transcribe(audio):
    """Transcribe a recorded audio clip with the `asr` pipeline.

    Args:
        audio: Path to the audio file (the Gradio input is declared with
            type="filepath"), or None when nothing was recorded.

    Returns:
        The "text" field of the pipeline result, or an empty string when
        no audio was supplied.
    """
    # Submitting the form without a recording yields None; the pipeline
    # cannot process that, so return an empty transcript instead of raising.
    if audio is None:
        return ""
    return asr(audio)["text"]
@spaces.GPU
def correction(text):
    """Run the `ser` text2text pipeline on a transcript and return its output.

    Args:
        text: Transcript to correct.

    Returns:
        The generated text as a plain string. Empty or whitespace-only
        input is returned unchanged without invoking the model.
    """
    # Nothing to correct; avoid generating text from an empty prompt.
    if not text or not text.strip():
        return text
    # A text2text-generation pipeline returns a list with one dict per input,
    # each carrying the output under "generated_text". Returning that list
    # directly would show its Python repr in the "text" output component.
    results = ser(text)
    corrected_text = results[0]["generated_text"]
    print(corrected_text)
    return corrected_text
def transcribe_and_correct(audio):
    """Transcribe `audio`, then pass the transcript through `correction`.

    Args:
        audio: Value forwarded unchanged to `transcribe`.

    Returns:
        Whatever `correction` returns for the transcript.
    """
    return correction(transcribe(audio))
 iface = gr.Interface(
+    fn=transcribe_and_correct,
     inputs=gr.Audio(sources="microphone", type="filepath"),
     outputs="text",
     title="Whisper Bangla",