Spaces:

k2-fsa
/

automatic-speech-recognition

Running

App Files Files Community

csukuangfj committed on Jul 18, 2022

Commit

81687e9

•

1 Parent(s): f5b2e32

Minor fixes

Browse files

Files changed (1) hide show

app.py +32 -11

app.py CHANGED Viewed

@@ -49,6 +49,9 @@ def process(
     print("in_filename", in_filename)
     print("language", language)
     print("repo_id", repo_id)
     filename = convert_to_wav(in_filename)
     now = datetime.now()
@@ -89,7 +92,16 @@ def process(
     print("hyp")
     print(hyp)
-    return hyp
 title = "# Automatic Speech Recognition with Next-gen Kaldi"
@@ -113,7 +125,16 @@ def update_model_dropdown(language: str):
     raise ValueError(f"Unsupported language: {language}")
-demo = gr.Blocks()
 with demo:
     gr.Markdown(title)
@@ -124,7 +145,11 @@ with demo:
         choices=language_choices,
         value=language_choices[0],
     )
-    model_dropdown = gr.Dropdown(choices=[], label="Select a model")
     language_radio.change(
         update_model_dropdown,
         inputs=language_radio,
@@ -146,29 +171,25 @@ with demo:
     with gr.Tabs():
         with gr.TabItem("Upload from disk"):
-            uploaded_file = gr.inputs.Audio(
                 source="upload",  # Choose between "microphone", "upload"
                 type="filepath",
                 optional=False,
                 label="Upload from disk",
             )
             upload_button = gr.Button("Submit for recognition")
-            uploaded_output = gr.outputs.Textbox(
-                label="Recognized speech from uploaded file"
-            )
         with gr.TabItem("Record from microphone"):
-            microphone = gr.inputs.Audio(
                 source="microphone",  # Choose between "microphone", "upload"
                 type="filepath",
                 optional=False,
                 label="Record from microphone",
             )
-            recorded_output = gr.outputs.Textbox(
-                label="Recognized speech from recordings"
-            )
             record_button = gr.Button("Submit for recognition")
         upload_button.click(
             process,

     print("in_filename", in_filename)
     print("language", language)
     print("repo_id", repo_id)
+    print("decoding_method", decoding_method)
+    print("num_active_paths", num_active_paths)
     filename = convert_to_wav(in_filename)
     now = datetime.now()
     print("hyp")
     print(hyp)
+    html_output = f"""
+    <div class='result'>
+      <div class='result_item result_item_success'>
+        {hyp}
+        <br/>
+      </div>
+    </div>
+    """
+    return html_output
 title = "# Automatic Speech Recognition with Next-gen Kaldi"
     raise ValueError(f"Unsupported language: {language}")
+# The css style is copied from
+# https://huggingface.co/spaces/alphacep/asr/blob/main/app.py#L112
+demo = gr.Blocks(
+    css="""
+    .result {display:flex;flex-direction:column}
+    .result_item {padding:15px;margin-bottom:8px;border-radius:15px;width:100%}
+    .result_item_success {background-color:mediumaquamarine;color:white;align-self:start}
+    .result_item_error {background-color:#ff7070;color:white;align-self:start}
+    """,
+)
 with demo:
     gr.Markdown(title)
         choices=language_choices,
         value=language_choices[0],
     )
+    model_dropdown = gr.Dropdown(
+        choices=language_to_models[language_choices[0]],
+        label="Select a model",
+    )
     language_radio.change(
         update_model_dropdown,
         inputs=language_radio,
     with gr.Tabs():
         with gr.TabItem("Upload from disk"):
+            uploaded_file = gr.Audio(
                 source="upload",  # Choose between "microphone", "upload"
                 type="filepath",
                 optional=False,
                 label="Upload from disk",
             )
+            uploaded_output = gr.HTML(label="Recognized speech from uploaded file")
             upload_button = gr.Button("Submit for recognition")
         with gr.TabItem("Record from microphone"):
+            microphone = gr.Audio(
                 source="microphone",  # Choose between "microphone", "upload"
                 type="filepath",
                 optional=False,
                 label="Record from microphone",
             )
             record_button = gr.Button("Submit for recognition")
+            recorded_output = gr.HTML(label="Recognized speech from recordings")
         upload_button.click(
             process,