shengxiong committed
Commit f5f1842
Parent: d415e7e

update the code to align with latest packages


On branch main
Your branch is up to date with 'origin/main'.

Changes to be committed:
modified: .gitignore
modified: app.py
modified: supplier.py

Files changed (3)
  1. .gitignore +1 -1
  2. app.py +6 -6
  3. supplier.py +29 -27
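
The substance of the change: the Amazon Polly text-to-speech path (the boto3 client, get_voices, and text_to_audio) is commented out, the OpenAI calls move from the pre-1.0 module API (openai.ChatCompletion.create, openai.Audio.translate) to the 1.x namespaced style (openai.chat.completions.create, openai.audio.translations.create) with the chat model bumped from gpt-3.5-turbo to gpt-4-turbo, and gr.Audio's source argument becomes sources per Gradio 4. Short sketches of the updated call patterns follow the app.py and supplier.py diffs below.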
.gitignore CHANGED
@@ -1,6 +1,6 @@
 # directories that are local to the server os
 .archive
-venv
+.venv
 __pycache__
 
 # files local to the server os
app.py CHANGED
@@ -25,10 +25,10 @@ with gr.Blocks() as settings:
     gr.Examples(background_examples,background_edit,label="Examples")
     clear.click(lambda:None,None,background_edit,queue=False)
     submit.click(update_sys,background_edit,background,queue=False)
-    with gr.Row():
-        voices_list = gr.Dropdown([v["Name"] for v in get_voices()],label="Voices")
+    # with gr.Row():
+    #     voices_list = gr.Dropdown([v["Name"] for v in get_voices()],label="Voices")
 
-    voices_list.change(lambda voice:App_state.update({"voice":voice}),voices_list,queue=False)
+    # voices_list.change(lambda voice:App_state.update({"voice":voice}),voices_list,queue=False)
 
 with gr.Blocks() as chat_window:
     with gr.Row():
@@ -37,15 +37,15 @@ with gr.Blocks() as chat_window:
         chatbot_speech = gr.Audio()
         with gr.Column():
             chat_clear = gr.Button("Clear")
-            play_speech = gr.Button("Play")
+            # play_speech = gr.Button("Play")
             chat_clear.click(lambda:None,None,chatbot,queue=False)
-            play_speech.click(text_to_audio,chatbot,chatbot_speech,queue=False)
+            # play_speech.click(text_to_audio,chatbot,chatbot_speech,queue=False)
 
     with gr.Column():
         msg = gr.Textbox()
         submit = gr.Button("Submit")
         gr.Examples(["Hello","How are you?"],msg,label="Examples")
-        audio = gr.Audio(source="microphone",type="filepath")
+        audio = gr.Audio(sources="microphone",type="filepath")
         # gr.Interface(translate,inputs=gr.Audio(source="microphone",type="filepath"),outputs = "text")
 
         audio.change(translate,audio,msg,queue=False)
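
For context on the source → sources change: Gradio 4 removed gr.Audio's source parameter in favor of sources, whose documented form is a list of allowed input methods. A minimal runnable sketch of the updated wiring, assuming Gradio 4.x; fake_translate is a hypothetical stand-in for the app's translate() helper:

import gradio as gr

def fake_translate(file_path):
    # Hypothetical stand-in: the real app forwards the recording to Whisper.
    return f"received recording at {file_path}" if file_path else ""

with gr.Blocks() as demo:
    msg = gr.Textbox()
    # Gradio 4 renamed `source` to `sources`, a list of allowed inputs.
    audio = gr.Audio(sources=["microphone"], type="filepath")
    audio.change(fake_translate, audio, msg, queue=False)

if __name__ == "__main__":
    demo.launch()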
supplier.py CHANGED
@@ -1,5 +1,5 @@
 import openai
-import boto3
+# import boto3
 import os
 
 import pydub
@@ -7,8 +7,8 @@ import numpy as np
 
 # setup the api keys
 openai.api_key = os.environ.get("OPENAI_API_KEY")
-aws_access_key_id = os.environ.get("AWS_ACCESS_KEY_ID")
-aws_secret_access_key = os.environ.get("AWS_SECRET_ACCESS_KEY")
+# aws_access_key_id = os.environ.get("AWS_ACCESS_KEY_ID")
+# aws_secret_access_key = os.environ.get("AWS_SECRET_ACCESS_KEY")
 
 sys_msg = [{
     "role": "system",
@@ -27,28 +27,28 @@ App_state = {
 }
 
 # setup the polly client
-polly_client = boto3.client(
-    "polly", # the service we want to use
-    aws_access_key_id=aws_access_key_id,
-    aws_secret_access_key=aws_secret_access_key,
-    region_name='us-east-1')
-
-def get_voices():
-    return polly_client.describe_voices()["Voices"]
-
-# return the audio based on the text
-def text_to_audio(messages,voice="Joanna",sample_rate = 22050):
-    text = messages[-1][1]
-    response = polly_client.synthesize_speech(VoiceId=voice,
-                    OutputFormat='mp3',
-                    SampleRate=str(sample_rate),
-                    Text = text)
+# polly_client = boto3.client(
+#     "polly", # the service we want to use
+#     aws_access_key_id=aws_access_key_id,
+#     aws_secret_access_key=aws_secret_access_key,
+#     region_name='us-east-1')
+
+# def get_voices():
+#     return polly_client.describe_voices()["Voices"]
+
+# # return the audio based on the text
+# def text_to_audio(messages,voice="Joanna",sample_rate = 22050):
+#     text = messages[-1][1]
+#     response = polly_client.synthesize_speech(VoiceId=voice,
+#                     OutputFormat='mp3',
+#                     SampleRate=str(sample_rate),
+#                     Text = text)
 
-    buffer = response["AudioStream"].read()
-    audio_stream = np.frombuffer(buffer,dtype=np.uint16)
+#     buffer = response["AudioStream"].read()
+#     audio_stream = np.frombuffer(buffer,dtype=np.uint16)
 
 
-    return sample_rate,audio_stream
+#     return sample_rate,audio_stream
 
 def send_chat(text,messages=[]):
     '''
@@ -81,12 +81,12 @@ def send_chat(text,messages=[]):
         }
     ])
 
-    res = openai.ChatCompletion.create(
-        model="gpt-3.5-turbo",
+    res = openai.chat.completions.create(
+        model="gpt-4-turbo",
         messages=openai_messages
     )
 
-    assistant_text = res.choices[0]["message"]["content"]
+    assistant_text = res.choices[0].message.content
 
     messages.append((text,assistant_text))
     App_state.update({"messages":messages})
@@ -96,7 +96,9 @@ def send_chat(text,messages=[]):
 def translate(file_path):
     if file_path:
         f = open(file_path,"rb")
-        res = openai.Audio.translate("whisper-1",f)
-        return res["text"]
+        res = openai.audio.translations.create(
+            file=f,
+            model="whisper-1")
+        return res.text
     else:
         return ""