check_pronounciation

Sleeping

App Files Community

Mrlongpro committed on Sep 18, 2024

Commit

e6d5013

verified ·

1 Parent(s): f42a490

Update app.py

Browse files

Files changed (1) hide show

app.py +16 -11

app.py CHANGED Viewed

@@ -2,14 +2,15 @@ import gradio as gr
 import speech_recognition as sr
 import difflib
-# Hàm chuyển giọng nói thành văn bản
-def transcribe_speech():
     recognizer = sr.Recognizer()
-    with sr.Microphone() as source:
         # Điều chỉnh tiếng ồn nền và ghi âm
         recognizer.adjust_for_ambient_noise(source, duration=1)
-        audio = recognizer.listen(source)
         try:
             # Chuyển giọng nói thành văn bản
@@ -37,8 +38,8 @@ def compare_transcription(transcribed_text, reference_text):
     return accuracy, incorrect_words
 # Hàm tích hợp để dùng trên Gradio
-def process_speech(reference_text):
-    transcribed_text = transcribe_speech()
     if "Lỗi" in transcribed_text or "Không thể nhận diện" in transcribed_text:
         return transcribed_text, None, None
@@ -52,17 +53,21 @@ def build_interface():
     with gr.Blocks() as demo:
         # Input cho văn bản mẫu
         reference_text = gr.Textbox(label="Văn bản mẫu", value="Xin chào, tôi là ChatGPT", lines=2)
-        inputs=gr.Audio(type="filepath"),  # Input as audio, no need for 'source' argument
-        # Button để ghi âm
-        record_button = gr.Button("Ghi âm và kiểm tra")
         # Output hiển thị kết quả
         transcribed_text = gr.Textbox(label="Văn bản bạn nói")
         accuracy = gr.Textbox(label="Độ chính xác (%)")
         incorrect_words = gr.Textbox(label="Những từ nói sai")
         # Nút ghi âm được kết nối với chức năng xử lý
-        record_button.click(fn=process_speech, inputs=[reference_text], outputs=[transcribed_text, accuracy, incorrect_words])
     return demo

 import speech_recognition as sr
 import difflib
+# Hàm chuyển giọng nói thành văn bản từ file
+def transcribe_speech(audio_file):
     recognizer = sr.Recognizer()
+    # Load audio file
+    with sr.AudioFile(audio_file) as source:
         # Điều chỉnh tiếng ồn nền và ghi âm
         recognizer.adjust_for_ambient_noise(source, duration=1)
+        audio = recognizer.record(source)
         try:
             # Chuyển giọng nói thành văn bản
     return accuracy, incorrect_words
 # Hàm tích hợp để dùng trên Gradio
+def process_speech(reference_text, audio_file):
+    transcribed_text = transcribe_speech(audio_file)
     if "Lỗi" in transcribed_text or "Không thể nhận diện" in transcribed_text:
         return transcribed_text, None, None
     with gr.Blocks() as demo:
         # Input cho văn bản mẫu
         reference_text = gr.Textbox(label="Văn bản mẫu", value="Xin chào, tôi là ChatGPT", lines=2)
+        # Input cho file âm thanh
+        audio_input = gr.Audio(type="filepath", label="Tải lên file âm thanh")
         # Output hiển thị kết quả
         transcribed_text = gr.Textbox(label="Văn bản bạn nói")
         accuracy = gr.Textbox(label="Độ chính xác (%)")
         incorrect_words = gr.Textbox(label="Những từ nói sai")
         # Nút ghi âm được kết nối với chức năng xử lý
+        gr.Button("Ghi âm và kiểm tra").click(
+            fn=process_speech,
+            inputs=[reference_text, audio_input],
+            outputs=[transcribed_text, accuracy, incorrect_words]
+        )
     return demo