whisper-large-v3

Running

App Files Community

DeepLearning101 committed on Jun 16

Commit

2fbf87f

•

1 Parent(s): c6912e7

Update app.py

Browse files

Files changed (1) hide show

app.py +21 -13

app.py CHANGED Viewed

@@ -77,6 +77,15 @@ def yt_transcribe(yt_url, task, max_filesize=75.0):
     return html_embed_str, text
 file_transcribe = gr.Interface(
     fn=transcribe,
     inputs=[
@@ -85,15 +94,19 @@ file_transcribe = gr.Interface(
     ],
     outputs="text",
     title="Whisper Large V3: Transcribe Audio",
-    description="""Transcribe long-form microphone or audio inputs with the click of a button! Demo uses the checkpoint openai/whisper-large-v3 and Transformers to transcribe audio files of arbitrary length.<br>
-        <a href='https://www.twman.org' target='_blank'>TonTon Huang Ph.D. </a><br>
-        <a href='https://blog.twman.org/2021/04/ASR.html' target='_blank'>那些語音處理 (Speech Processing) 踩的坑</a> | <a href='https://blog.twman.org/2021/04/NLP.html' target='_blank'>那些自然語言處理 (Natural Language Processing, NLP) 踩的坑</a><br>
-        <a href='https://blog.twman.org/2024/02/asr-tts.html' target='_blank'>那些ASR和TTS可能會踩的坑</a> | <a href='https://blog.twman.org/2024/02/LLM.html' target='_blank'>那些大模型開發會踩的坑</a><br>
-        <a href='https://blog.twman.org/2023/04/GPT.html' target='_blank'>什麼是大語言模型，它是什麼？想要嗎？</a><br>
-        <a href='https://blog.twman.org/2023/07/wsl.html' target='_blank'>用PaddleOCR的PPOCRLabel來微調醫療診斷書和收據</a> | <a href='https://blog.twman.org/2023/07/HugIE.html' target='_blank'>基於機器閱讀理解和指令微調的統一信息抽取框架之診斷書醫囑資訊擷取分析</a><br>
     allow_flagging="never",
 )
 yt_transcribe = gr.Interface(
     fn=yt_transcribe,
     inputs=[
@@ -102,16 +115,11 @@ yt_transcribe = gr.Interface(
     ],
     outputs=["html", "text"],
     title="Whisper Large V3: Transcribe YouTube",
-    description="""Transcribe long-form YouTube videos with the click of a button! Demo uses the checkpoint openai/whisper-large-v3 and Transformers to transcribe audio files of arbitrary length.<br>
-        <a href='https://www.twman.org' target='_blank'>TonTon Huang Ph.D. </a><br>
-        <a href='https://blog.twman.org/2021/04/ASR.html' target='_blank'>那些語音處理 (Speech Processing) 踩的坑</a> | <a href='https://blog.twman.org/2021/04/NLP.html' target='_blank'>那些自然語言處理 (Natural Language Processing, NLP) 踩的坑</a><br>
-        <a href='https://blog.twman.org/2024/02/asr-tts.html' target='_blank'>那些ASR和TTS可能會踩的坑</a> | <a href='https://blog.twman.org/2024/02/LLM.html' target='_blank'>那些大模型開發會踩的坑</a><br>
-        <a href='https://blog.twman.org/2023/04/GPT.html' target='_blank'>什麼是大語言模型，它是什麼？想要嗎？</a><br>
-        <a href='https://blog.twman.org/2023/07/wsl.html' target='_blank'>用PaddleOCR的PPOCRLabel來微調醫療診斷書和收據</a> | <a href='https://blog.twman.org/2023/07/HugIE.html' target='_blank'>基於機器閱讀理解和指令微調的統一信息抽取框架之診斷書醫囑資訊擷取分析</a><br>
     allow_flagging="never",
 )
 with gr.Blocks() as demo:
     gr.TabbedInterface([file_transcribe, yt_transcribe], ["Audio file", "YouTube"])
-demo.launch(debug=True)

     return html_embed_str, text
+description = """
+Transcribe long-form microphone or audio inputs with the click of a button! Demo uses the checkpoint openai/whisper-large-v3 and Transformers to transcribe audio files of arbitrary length.<br>
+<a href='https://www.twman.org' target='_blank'>TonTon Huang Ph.D. </a><br>
+<a href='https://blog.twman.org/2021/04/ASR.html' target='_blank'>那些語音處理 (Speech Processing) 踩的坑</a> | <a href='https://blog.twman.org/2021/04/NLP.html' target='_blank'>那些自然語言處理 (Natural Language Processing, NLP) 踩的坑</a><br>
+<a href='https://blog.twman.org/2024/02/asr-tts.html' target='_blank'>那些ASR和TTS可能會踩的坑</a> | <a href='https://blog.twman.org/2024/02/LLM.html' target='_blank'>那些大模型開發會踩的坑</a><br>
+<a href='https://blog.twman.org/2023/04/GPT.html' target='_blank'>什麼是大語言模型，它是什麼？想要嗎？</a><br>
+<a href='https://blog.twman.org/2023/07/wsl.html' target='_blank'>用PaddleOCR的PPOCRLabel來微調醫療診斷書和收據</a> | <a href='https://blog.twman.org/2023/07/HugIE.html' target='_blank'>基於機器閱讀理解和指令微調的統一信息抽取框架之診斷書醫囑資訊擷取分析</a><br>
+"""
 file_transcribe = gr.Interface(
     fn=transcribe,
     inputs=[
     ],
     outputs="text",
     title="Whisper Large V3: Transcribe Audio",
+    description=description,
     allow_flagging="never",
 )
+yt_description = """
+Transcribe long-form YouTube videos with the click of a button! Demo uses the checkpoint openai/whisper-large-v3 and Transformers to transcribe audio files of arbitrary length.<br>
+<a href='https://www.twman.org' target='_blank'>TonTon Huang Ph.D. </a><br>
+<a href='https://blog.twman.org/2021/04/ASR.html' target='_blank'>那些語音處理 (Speech Processing) 踩的坑</a> | <a href='https://blog.twman.org/2021/04/NLP.html' target='_blank'>那些自然語言處理 (Natural Language Processing, NLP) 踩的坑</a><br>
+<a href='https://blog.twman.org/2024/02/asr-tts.html' target='_blank'>那些ASR和TTS可能會踩的坑</a> | <a href='https://blog.twman.org/2024/02/LLM.html' target='_blank'>那些大模型開發會踩的坑</a><br>
+<a href='https://blog.twman.org/2023/04/GPT.html' target='_blank'>什麼是大語言模型，它是什麼？想要嗎？</a><br>
+<a href='https://blog.twman.org/2023/07/wsl.html' target='_blank'>用PaddleOCR的PPOCRLabel來微調醫療診斷書和收據</a> | <a href='https://blog.twman.org/2023/07/HugIE.html' target='_blank'>基於機器閱讀理解和指令微調的統一信息抽取框架之診斷書醫囑資訊擷取分析</a><br>
+"""
 yt_transcribe = gr.Interface(
     fn=yt_transcribe,
     inputs=[
     ],
     outputs=["html", "text"],
     title="Whisper Large V3: Transcribe YouTube",
+    description=yt_description,
     allow_flagging="never",
 )
 with gr.Blocks() as demo:
     gr.TabbedInterface([file_transcribe, yt_transcribe], ["Audio file", "YouTube"])
+demo.launch(debug=True)