SheldonYC committed on
Commit 5a17bb9
1 Parent(s): 02bfcfa

fix app.py

Files changed (2)
  1. app.py +40 -19
  2. requirements.txt +2 -1
app.py CHANGED
@@ -1,22 +1,43 @@
  from transformers import pipeline
+ import numpy as np
  import gradio as gr

- model = pipeline("automatic-speech-recognition")
-
- def transcribe_audio(mic=None, file=None):
-     if mic is not None:
-         audio = mic
-     elif file is not None:
-         audio = file
-     else:
-         return("You must either provide a mic recording or a file")
-     transcription = model(audio)["text"]
-     return transcription
-
- gr.Interface(
-     fn=transcribe_audio,
-     inputs=[gr.Audio(source="microphone", type="filepath", optional=True),
-             gr.Audio(source="upload", type="filepath", optional=True)],
-     outputs="text",
-     css=".footer{display:none !important}"
- ).launch()
+ def respond(message, chat_history):
+     bot_message = message
+     chat_history.append((message, bot_message))
+     return "", chat_history
+
+ def transcribe(audio):
+     sr, y = audio
+     y = y.astype(np.float32)
+     y /= np.max(np.abs(y))
+     result = asr_model({"sampling_rate": sr, "raw": y})["text"]
+     return result
+
+ asr_model_id = "openai/whisper-small.en"
+ asr_model = pipeline("automatic-speech-recognition", model=asr_model_id)
+
+ with gr.Blocks() as demo:
+     with gr.Column():
+         gr.Markdown(
+             """
+             # HKU Canteen VA
+             """)
+         va = gr.Chatbot(container=False)
+
+         with gr.Row():  # text input
+             text_input = gr.Textbox(placeholder="Ask me anything...", container=False, scale=1)
+             submit_btn = gr.Button("Submit", scale=0)
+
+         # with gr.Row():  # audio input
+         #     recording = gr.Microphone(show_download_button=False, container=False)
+
+         with gr.Row():  # button toolbar
+             clear = gr.ClearButton([text_input, va])
+
+     text_input.submit(respond, [text_input, va], [text_input, va], queue=False)
+     submit_btn.click(respond, [text_input, va], [text_input, va], queue=False)
+     # recording.stop_recording(transcribe, [recording], [text_input]).then(respond, [text_input, va], [text_input, va], queue=False)
+
+ if __name__ == "__main__":
+     demo.launch()
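For context on the new transcribe() helper: it expects Gradio's numpy audio format, where a microphone or upload component with type="numpy" yields a (sample_rate, samples) tuple, and it feeds that into the transformers ASR pipeline via the {"sampling_rate": ..., "raw": ...} dict input. The sketch below is illustrative only, not part of the commit; the helper name transcribe_safe and the silence/stereo guards are assumptions added here to show how the commented-out microphone path could call it safely once re-enabled.

    # Illustrative sketch, not from the commit: a guarded variant of transcribe().
    import numpy as np
    from transformers import pipeline

    asr = pipeline("automatic-speech-recognition", model="openai/whisper-small.en")

    def transcribe_safe(audio):
        sr, y = audio                # Gradio numpy audio: (sample_rate, int16 samples)
        y = y.astype(np.float32)
        if y.ndim > 1:               # assumption: collapse stereo to mono
            y = y.mean(axis=1)
        peak = np.max(np.abs(y))
        if peak > 0:                 # avoid division by zero on silent recordings
            y /= peak
        return asr({"sampling_rate": sr, "raw": y})["text"]

Wired the same way as the commented-out line in the diff, recording.stop_recording(...) would pass the tuple straight into this function and forward the text to text_input.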
requirements.txt CHANGED
@@ -1,2 +1,3 @@
  torch
- transformers
+ transformers
+ numpy
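To reproduce the Space locally after this change, a typical setup would be the following (assuming a Python environment with pip; these commands are not part of the commit):

    pip install -r requirements.txt
    python app.py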