Spaces:
Sleeping
Sleeping
heliosbrahma
committed on
Commit
·
c33ad65
1
Parent(s):
6a33919
first commit
Browse files- README.md +8 -2
- main.py +51 -0
- requirements.txt +6 -0
README.md
CHANGED
@@ -5,8 +5,14 @@ colorFrom: gray
|
|
5 |
colorTo: gray
|
6 |
sdk: gradio
|
7 |
sdk_version: 3.23.0
|
8 |
-
app_file:
|
9 |
pinned: false
|
10 |
---
|
|
|
|
|
11 |
|
12 |
-
|
|
|
|
|
|
|
|
|
|
5 |
colorTo: gray
|
6 |
sdk: gradio
|
7 |
sdk_version: 3.23.0
|
8 |
+
app_file: main.py
|
9 |
pinned: false
|
10 |
---
|
11 |
+
# Smart Voice Assistant
|
12 |
+
Use this gradio app interface to get answers for all your queries in both text and speech format. Just communicate your queries in speech format and this app will take care of the rest.
|
13 |
|
14 |
+
This app is built using the ChatGPT API and the Whisper API.
|
15 |
+
|
16 |
+
## To generate OpenAI API key:
|
17 |
+
* Log in to https://platform.openai.com/account/api-keys
|
18 |
+
* Click on "Create new secret key" button and copy the API key
|
main.py
ADDED
@@ -0,0 +1,51 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
# Third-party dependencies: speech-to-text (whisper), web UI (gradio),
# chat completion (openai), text-to-speech (Coqui TTS).
import whisper
import gradio as gr
import openai
from TTS.api import TTS
import subprocess

# NOTE(review): selecting model 9 from the published list is fragile -- the
# list order can change between TTS releases; pinning an explicit model name
# would be safer. TODO confirm which voice this index resolves to.
model_name = TTS.list_models()[9]
tts = TTS(model_name)
# Load the Whisper 'medium' speech-recognition checkpoint once at startup
# (downloaded on first run).
model = whisper.load_model('medium')
def run_ffmpeg_command(output_path='output.wav'):
    """Create a one-second silent placeholder audio file with ffmpeg.

    Generates 1 s of mono silence at 44.1 kHz and writes it to
    *output_path*, so the gradio Audio output has a valid file to serve
    before the first real reply is synthesized.

    Args:
        output_path: destination file; defaults to the shared
            'output.wav' placeholder used by the app.
    """
    # pcm_s16le emits a real WAV stream; the previous libmp3lame codec
    # wrote MP3 data into a .wav-named file, which some players reject.
    # '-y' overwrites an existing placeholder instead of hanging/failing,
    # since stdin is not interactive under capture_output.
    command = [
        'ffmpeg', '-y',
        '-f', 'lavfi', '-i', 'anullsrc=r=44100:cl=mono',
        '-t', '1',
        '-acodec', 'pcm_s16le',
        output_path,
    ]
    result = subprocess.run(command, capture_output=True, text=True)
    if result.returncode != 0:
        # Surface the failure instead of silently discarding stderr.
        print(result.stderr)
    else:
        print(result.stdout)
def voice_chat(api_key, user_voice, output_path="output.wav"):
    """Answer a spoken query with both text and synthesized speech.

    Pipeline: transcribe the recorded audio with the module-level Whisper
    model, send the text to the ChatGPT API, then synthesize the reply to
    a WAV file with the module-level TTS model.

    Args:
        api_key: OpenAI API key entered by the user (gradio Textbox input).
        user_voice: path of the recorded audio file (gradio microphone input).
        output_path: where the synthesized reply is written; defaults to the
            app's shared 'output.wav'. Defaulted so existing two-argument
            callers (the gradio Interface) keep working.

    Returns:
        Tuple of (reply_text, reply_audio_path) consumed by the gradio
        Textbox and Audio outputs.
    """
    # The Textbox already yields a str; no conversion needed.
    openai.api_key = api_key

    # Speech -> text.
    user_message = model.transcribe(user_voice)["text"]

    messages = [
        {"role": "system", "content": "You are a kind helpful assistant."},
        {"role": "user", "content": user_message},
    ]

    chat = openai.ChatCompletion.create(
        model="gpt-3.5-turbo", messages=messages
    )
    reply = chat.choices[0].message.content

    # Text -> speech; the file path is returned so gradio can play it.
    tts.tts_to_file(text=reply, file_path=output_path)
    return reply, output_path
# Optional warm-up: pre-create the placeholder audio file.
# run_ffmpeg_command()

# Output widgets: the assistant's text answer and its spoken rendition.
text_reply = gr.Textbox(label="Summarized Answer")
voice_reply = gr.Audio(type="filepath")

# Input widgets: the user's OpenAI key plus a microphone recording.
app_inputs = [
    gr.Textbox(label="OpenAI API Key"),
    gr.Audio(source="microphone", type="filepath"),
]

# Wire everything into a single gradio app and start serving it.
demo = gr.Interface(
    fn=voice_chat,
    title='Smart Voice Assistant',
    inputs=app_inputs,
    outputs=[text_reply, voice_reply],
)
demo.launch()
requirements.txt
ADDED
@@ -0,0 +1,6 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
numpy==1.21.6
|
2 |
+
numba==0.53
|
3 |
+
TTS
|
4 |
+
openai-whisper
|
5 |
+
openai
|
6 |
+
gradio
|