AhmadFareedKhan committed on
Commit
cac2464
•
1 Parent(s): b93a002

Rename assistant.py to app.py

Files changed (1)
  1. assistant.py → app.py +74 -70
assistant.py → app.py RENAMED
@@ -1,70 +1,74 @@
- import gradio as gr
- from openai import OpenAI
- import os
- from dotenv import load_dotenv
- import azure.cognitiveservices.speech as speechsdk
-
- # assistant single app
-
- # Load and set environment variables
- load_dotenv(".env")
- api_key = os.getenv("OPENAI_API_KEY")
- os.environ['SPEECH_KEY'] = '3ca965cb089e415d85a780e0ce40a3cf'
- os.environ['SPEECH_REGION'] = 'eastus'
- client = OpenAI(api_key=api_key)
-
- def recognize_from_microphone(file_info):
-     if not file_info:
-         return "", "No audio file received."
-     file_path = file_info
-     if not os.path.exists(file_path):
-         return "", f"File not found: {file_path}"
-     speech_config = speechsdk.SpeechConfig(subscription=os.environ['SPEECH_KEY'], region=os.environ['SPEECH_REGION'])
-     speech_config.speech_recognition_language = "en-US"
-     try:
-         audio_config = speechsdk.audio.AudioConfig(filename=file_path)
-         speech_recognizer = speechsdk.SpeechRecognizer(speech_config=speech_config, audio_config=audio_config)
-         result = speech_recognizer.recognize_once()
-         if result.reason == speechsdk.ResultReason.RecognizedSpeech:
-             return result.text, ""
-         elif result.reason == speechsdk.ResultReason.NoMatch:
-             return "", "No speech could be recognized."
-         elif result.reason == speechsdk.ResultReason.Canceled:
-             return "", f"Speech Recognition canceled: {result.cancellation_details.reason}."
-     except Exception as e:
-         return "", f"Error during speech recognition: {str(e)}"
-
-     return "", "Unexpected error during speech recognition."
-
-
- def chatbot_response(user_input="", audio_input=None):
-     transcription, error = recognize_from_microphone(audio_input) if audio_input else ("", "")
-     if transcription:
-         user_input = transcription
-     if not user_input.strip():
-         return error or "Please provide some input or speak into the microphone.", ""
-     try:
-         completion = client.chat.completions.create(
-             model="gpt-3.5-turbo",
-             messages=[
-                 {"role": "system", "content": "As an AI serving as an emergency nutrition advisor, your objective is to provide prompt and accurate nutritional guidance in urgent situations. When users present their concerns, you should deliver tailored advice that addresses the critical aspects of their nutritional needs quickly and effectively. Focus on offering clear, practical, and context-specific solutions to ensure their immediate dietary requirements are met."},
-                 {"role": "user", "content": user_input},
-             ]
-         )
-         response = completion.choices[0].message.content
-         return transcription, response
-     except Exception as e:
-         return transcription, f"An error occurred during response generation: {str(e)}"
-
-
- app = gr.Interface(
-     fn=chatbot_response,
-     inputs=[gr.Textbox(lines=5, placeholder="Enter your emergency nutrition query here...", label="Input Here"),
-             gr.Audio(type="filepath", label="Record your question")],
-     outputs=[gr.Text(label="Transcription"), gr.Text(label="Response")],
-     title="Emergency Assistance",
-     description="To better assist you, could you explain what led to this emergency?"
- )
-
- if __name__ == "__main__":
-     app.launch(share=False)
+ import gradio as gr
+ from openai import OpenAI
+ import os
+ from dotenv import load_dotenv
+ import azure.cognitiveservices.speech as speechsdk
+ import wave
+
+ # Load and set environment variables
+ load_dotenv(".env")
+ api_key = os.getenv("OPENAI_API_KEY")
+ speech_key = os.getenv("speech_key")
+ os.environ['SPEECH_REGION'] = 'eastus'
+ client = OpenAI(api_key=api_key)
+
+
+
+ def synthesize_speech(text, filename="output.wav"):
+     """Convert text to speech and save it to a WAV file."""
+     speech_config = speechsdk.SpeechConfig(subscription=speech_key, region=os.environ['SPEECH_REGION'])
+     speech_config.speech_synthesis_voice_name = "en-US-AvaMultilingualNeural"
+     audio_config = speechsdk.audio.AudioOutputConfig(filename=filename)  # write synthesized audio to a file
+
+     synthesizer = speechsdk.SpeechSynthesizer(speech_config=speech_config, audio_config=audio_config)
+     result = synthesizer.speak_text_async(text).get()
+
+     if result.reason == speechsdk.ResultReason.SynthesizingAudioCompleted:
+         print(f"Speech synthesized for text [{text}] and saved to {filename}")
+     else:
+         print(f"Failed to synthesize speech for text [{text}]")
+     return filename
+
+
+
+
+
+ def emergency_assistance(query):
+     if not query.strip():
+         return "Please provide a query for emergency assistance.", None
+     try:
+         completion = client.chat.completions.create(
+             model="gpt-3.5-turbo",
+             messages=[
+                 {"role": "system", "content": "As an AI serving as an emergency nutrition advisor, your objective is to provide prompt and accurate nutritional guidance in urgent situations. When users present their concerns, you should deliver tailored advice that addresses the critical aspects of their nutritional needs quickly and effectively. Focus on offering clear, practical, and context-specific solutions to ensure their immediate dietary requirements are met."},
+                 {"role": "user", "content": query},
+             ]
+         )
+         response = completion.choices[0].message.content
+     except Exception as e:
+         return f"An error occurred: {str(e)}", None
+     # After generating the response, synthesize it to audio for playback
+     audio_path = synthesize_speech(response) if response else None
+     # Return both the response text and the audio file path
+     return response, audio_path
+
+
+
+
+ interface2 = gr.Interface(
+     fn=emergency_assistance,
+     inputs=[gr.Textbox(lines=10, label="Query", placeholder="Enter your emergency nutrition query here...")],
+     outputs=[
+         gr.Text(lines=10, label="Response"),
+         gr.Audio(label="Listen to Response")  # Audio output for the synthesized speech
+     ],
+     title="Emergency Assistance",
+     description="To better assist you, could you explain what led to this emergency?"
+ )
+
+
+ # Tabbed interface wrapping the Emergency Assistance tab
+ app = gr.TabbedInterface([interface2], ["Emergency Assistance"], title="HealthyBytes: Your AI Nutrition Consultant")
+
+ if __name__ == "__main__":
+     app.launch(share=False)
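
A minimal smoke test for the renamed app, as a hedged sketch: it assumes a local .env providing OPENAI_API_KEY and speech_key (as app.py reads them) plus valid OpenAI and Azure Speech credentials. The script name and query text are hypothetical and not part of this commit.

# smoke_test.py - hypothetical helper script, not part of this commit.
# Assumes .env defines OPENAI_API_KEY and speech_key with working credentials.
from dotenv import load_dotenv

load_dotenv(".env")  # populate the environment before app.py builds its clients

from app import emergency_assistance  # import after env setup; does not launch the UI

response, audio_path = emergency_assistance(
    "Power outage, only canned beans and rice on hand - what should I eat first?"
)
print("Response:", response)
print("Synthesized audio saved to:", audio_path)

Calling emergency_assistance directly exercises both the chat completion and the Azure speech synthesis path without starting the Gradio server; the returned audio_path points at the output.wav written by synthesize_speech.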