magic-8-ball

Running on Zero

App Files Community

freddyaboulton HF staff committed on Aug 21

Commit

7bd176a

•

1 Parent(s): 4a0236d

Modify

Browse files

Files changed (1) hide show

app.py +5 -4

app.py CHANGED Viewed

@@ -65,6 +65,7 @@ frame_rate = model.audio_encoder.config.frame_rate
 def generate_response(audio):
     gr.Info("Transcribing Audio", duration=5)
     question = client.automatic_speech_recognition(audio).text
@@ -73,11 +74,11 @@ def generate_response(audio):
                                               "is to answer with a cryptic addage or proverb such as "
                                               "'curiosity killed the cat' or 'The early bird gets the worm'."
                                               "Keep your answers short.")},
-                {"role": "user", "content": f"Magic 8 ball, please tell me what to do about {question}"}]
     response = client.chat_completion(messages, max_tokens=64, seed=random.randint(1, 5000))
     response = response.choices[0].message.content
-    return response
 @spaces.GPU
 def generate_base(answer):
@@ -106,7 +107,7 @@ def generate_base(answer):
     for new_audio in streamer:
         print(f"Sample of length: {round(new_audio.shape[0] / sampling_rate, 2)} seconds")
-        yield gr.Textbox(value=answer, visible=True), numpy_to_mp3(new_audio, sampling_rate=sampling_rate)
 css=""".my-group {max-width: 600px !important; max-height: 600 !important;}
                       .my-column {display: flex !important; justify-content: center !important; align-items: center !important};"""
@@ -128,6 +129,6 @@ with gr.Blocks() as block:
         with gr.Row():
             audio_in = gr.Audio(label="Speak you question", sources="microphone", type="filepath")
-    audio_in.stop_recording(generate_response, audio_in, [state]).then(fn=generate_base, inputs=state, outputs=[answer, audio_out])
 block.launch()

 def generate_response(audio):
+    yield None, None
     gr.Info("Transcribing Audio", duration=5)
     question = client.automatic_speech_recognition(audio).text
                                               "is to answer with a cryptic addage or proverb such as "
                                               "'curiosity killed the cat' or 'The early bird gets the worm'."
                                               "Keep your answers short.")},
+                {"role": "user", "content": f"Please tell me what to do about {question}"}]
     response = client.chat_completion(messages, max_tokens=64, seed=random.randint(1, 5000))
     response = response.choices[0].message.content
+    yield response, None
 @spaces.GPU
 def generate_base(answer):
     for new_audio in streamer:
         print(f"Sample of length: {round(new_audio.shape[0] / sampling_rate, 2)} seconds")
+        yield answer, numpy_to_mp3(new_audio, sampling_rate=sampling_rate)
 css=""".my-group {max-width: 600px !important; max-height: 600 !important;}
                       .my-column {display: flex !important; justify-content: center !important; align-items: center !important};"""
         with gr.Row():
             audio_in = gr.Audio(label="Speak you question", sources="microphone", type="filepath")
+    audio_in.stop_recording(generate_response, audio_in, state).then(fn=generate_base, inputs=state, outputs=[answer, audio_out])
 block.launch()