import gradio as gr from faster_whisper import WhisperModel device = "cpu" model_size = "base" compute_type = "int8" model = WhisperModel(model_size, device=device, compute_type=compute_type) def transcribe(audio): segments, _ = model.transcribe(audio, beam_size=5) return "".join([segment.text for segment in segments]) gr.Interface( title = 'Fast Whisper for Speech Recognition', description = 'This is a base version running on CPU with int8 compute type due to limited resources. These choices can slightly reduce accuracy.', fn=transcribe, inputs=[ gr.inputs.Audio(source="microphone", type="filepath") ], outputs=[ "textbox" ] ).launch()