LLM-Hindi-Large / main.py
mananvh's picture
Upload 13 files
11a232c verified
import gradio as gr
from transformers import pipeline
import torch
def init_transcription_pipeline():
device = "cuda:0" if torch.cuda.is_available() else "cpu"
model_path = "c:/Users/vhits/Documents/Speect2Text/model/whisper-hindi-large-v2"
transcribe_pipeline = pipeline(
task = "automatic-speech-recognition",
model = model_path,
chunk_length_s = 30,
device = device
)
transcribe_pipeline.model.config.forced_decoder_ids = transcribe_pipeline.tokenizer.get_decoder_prompt_ids(language="gu", task="transcribe")
return transcribe_pipeline
transcribe_pipeline = init_transcription_pipeline()
def transcribe_audio(audio_file_path):
transcription_result = transcribe_pipeline(audio_file_path)["text"]
return transcription_result
iface = gr.Interface(
fn = transcribe_audio,
inputs = gr.Audio(label="Upload your audio file", type="filepath"),
outputs=gr.Textbox(label="Transcription"),
title = "Gujarati Audio VH Test"
).launch()