"""Gradio app that converts YouTube videos to text using openai/whisper."""

import os

# Whisper is installed from source at start-up, so this has to run before
# the `import whisper` below.
os.system("pip install git+https://github.com/openai/whisper.git")

import gradio as gr
import whisper

from convert import main

# Model used by `inference`; `inference2` hands the model name to
# `convert.main` instead.
model = whisper.load_model("small")


def inference(audio):
    """Transcribe an audio file with the module-level Whisper model.

    Args:
        audio: Path of the audio file, as accepted by ``whisper.load_audio``.

    Returns:
        The decoded text.
    """
    waveform = whisper.load_audio(audio)
    # Whisper decodes a fixed-length window; pad or cut the waveform to fit.
    waveform = whisper.pad_or_trim(waveform)
    mel = whisper.log_mel_spectrogram(waveform).to(model.device)

    # No explicit `detect_language` call is needed: its result was never
    # used, and `decode` detects the language itself when none is given.
    options = whisper.DecodingOptions(fp16=False)
    result = whisper.decode(model, mel, options)
    print(result.text)
    return result.text


def inference2(url, mymodel):
    """Transcribe the video at ``url`` by delegating to ``convert.main``.

    Args:
        url: Text entered in the URL textbox.
        mymodel: Model name selected in the dropdown.

    Returns:
        Whatever ``convert.main`` returns; it is shown in the output textbox.
    """
    return main(url, mymodel)


title = "YouWhisper"
description = "YouWhisper converts Youtube videos to text using openai/whisper.."

# Custom styling for the Blocks UI. The `--tw-ring-shadow` value needs the
# `+` inside `calc(...)`; without an operator the declaration is invalid CSS.
css = """
.gradio-container {
    font-family: 'IBM Plex Sans', sans-serif;
}
.gr-button {
    color: white;
    border-color: black;
    background: black;
}
input[type='range'] {
    accent-color: black;
}
.dark input[type='range'] {
    accent-color: #dfdfdf;
}
.container {
    max-width: 730px;
    margin: auto;
    padding-top: 1.5rem;
}
.details:hover {
    text-decoration: underline;
}
.gr-button {
    white-space: nowrap;
}
.gr-button:focus {
    border-color: rgb(147 197 253 / var(--tw-border-opacity));
    outline: none;
    box-shadow: var(--tw-ring-offset-shadow), var(--tw-ring-shadow), var(--tw-shadow, 0 0 #0000);
    --tw-border-opacity: 1;
    --tw-ring-offset-shadow: var(--tw-ring-inset) 0 0 0 var(--tw-ring-offset-width) var(--tw-ring-offset-color);
    --tw-ring-shadow: var(--tw-ring-inset) 0 0 0 calc(3px + var(--tw-ring-offset-width)) var(--tw-ring-color);
    --tw-ring-color: rgb(191 219 254 / var(--tw-ring-opacity));
    --tw-ring-opacity: .5;
}
.footer {
    margin-bottom: 45px;
    margin-top: 35px;
    text-align: center;
    border-bottom: 1px solid #e5e5e5;
}
.footer>p {
    font-size: .8rem;
    display: inline-block;
    padding: 0 10px;
    transform: translateY(10px);
    background: white;
}
.dark .footer {
    border-color: #303030;
}
.dark .footer>p {
    background: #0b0f19;
}
.prompt h4{
    margin: 1.25em 0 .25em 0;
    font-weight: bold;
    font-size: 115%;
}
.gr-dropdown {
    background-color: #fff;
    border: 1px solid #e5e5e5;
    border-radius: 4px;
    color: #000;
    cursor: pointer;
    display: inline-block;
    font-size: 1rem;
    font-weight: 400;
    line-height: 1.5;
    margin-bottom: 0;
    padding: .375rem .75rem;
    transition: border-color .15s ease-in-out,box-shadow .15s ease-in-out;
    vertical-align: middle;
    white-space: nowrap;
    width: 100%;
}
"""

block = gr.Blocks(css=css)

with block:
    gr.HTML(
        """
YouWhisper converts Youtube videos to text using openai/whisper..
Enter a Youtube url to convert to text
"""
    )
    # Textbox for the video URL entered by the user.
    url = gr.Textbox(label="URL", show_label=False, placeholder="Enter Youtube URL")
    # Dropdown to select the model. It starts on "small" (the same model
    # preloaded above) so the click handler never receives None when the
    # user has not picked anything.
    mymodel = gr.Dropdown(["tiny", "base", "small", "medium"], value="small")
    btn2 = gr.Button("Transcribe")
    text2 = gr.Textbox(show_label=False, placeholder="Transcription will appear here")
    btn2.click(inference2, inputs=[url, mymodel], outputs=[text2])

block.launch()