IliaLarchenko commited on
Commit
82598a2
·
1 Parent(s): 78654a1

Removed intermediate message object

Browse files
Files changed (3) hide show
  1. api/audio.py +4 -5
  2. api/llm.py +6 -5
  3. app.py +4 -6
api/audio.py CHANGED
@@ -31,10 +31,8 @@ class STTManager:
31
  self.config = config
32
  self.streaming = os.getenv("STREAMING", False)
33
 
34
- def speech_to_text(self, audio, convert_to_bytes=True):
35
- if convert_to_bytes:
36
- audio = numpy_audio_to_bytes(audio[1])
37
-
38
  try:
39
  if self.config.stt.type == "OPENAI_API":
40
  data = ("temp.wav", audio, "audio/wav")
@@ -54,7 +52,8 @@ class STTManager:
54
  except Exception as e:
55
  raise APIError(f"STT Error: Unexpected error: {e}")
56
 
57
- return transcription
 
58
 
59
 
60
  class TTSManager:
 
31
  self.config = config
32
  self.streaming = os.getenv("STREAMING", False)
33
 
34
+ def speech_to_text(self, audio, chat_display):
35
+ audio = numpy_audio_to_bytes(audio[1])
 
 
36
  try:
37
  if self.config.stt.type == "OPENAI_API":
38
  data = ("temp.wav", audio, "audio/wav")
 
52
  except Exception as e:
53
  raise APIError(f"STT Error: Unexpected error: {e}")
54
 
55
+ chat_display.append([transcription, None])
56
+ return chat_display
57
 
58
 
59
  class TTSManager:
api/llm.py CHANGED
@@ -122,15 +122,16 @@ class LLMManager:
122
  messages = self.get_problem_prepare_messages(requirements, difficulty, topic)
123
  yield from self.get_text_stream(messages)
124
 
125
- def update_chat_history(self, code, previous_code, message, chat_history):
 
126
  if code != previous_code:
127
  chat_history.append({"role": "user", "content": f"My latest code:\n{code}"})
128
  chat_history.append({"role": "user", "content": message})
129
 
130
  return chat_history
131
 
132
- def send_request_full(self, code, previous_code, message, chat_history, chat_display):
133
- chat_history = self.update_chat_history(code, previous_code, message, chat_history)
134
 
135
  reply = self.get_text(chat_history)
136
  chat_display.append([None, reply])
@@ -138,8 +139,8 @@ class LLMManager:
138
 
139
  return chat_history, chat_display, code
140
 
141
- def send_request_stream(self, code, previous_code, message, chat_history, chat_display):
142
- chat_history = self.update_chat_history(code, previous_code, message, chat_history)
143
 
144
  chat_display.append([None, ""])
145
  chat_history.append({"role": "assistant", "content": ""})
 
122
  messages = self.get_problem_prepare_messages(requirements, difficulty, topic)
123
  yield from self.get_text_stream(messages)
124
 
125
+ def update_chat_history(self, code, previous_code, chat_history, chat_display):
126
+ message = chat_display[-1][0]
127
  if code != previous_code:
128
  chat_history.append({"role": "user", "content": f"My latest code:\n{code}"})
129
  chat_history.append({"role": "user", "content": message})
130
 
131
  return chat_history
132
 
133
+ def send_request_full(self, code, previous_code, chat_history, chat_display):
134
+ chat_history = self.update_chat_history(code, previous_code, chat_history, chat_display)
135
 
136
  reply = self.get_text(chat_history)
137
  chat_display.append([None, reply])
 
139
 
140
  return chat_history, chat_display, code
141
 
142
+ def send_request_stream(self, code, previous_code, chat_history, chat_display):
143
+ chat_history = self.update_chat_history(code, previous_code, chat_history, chat_display)
144
 
145
  chat_display.append([None, ""])
146
  chat_history.append({"role": "assistant", "content": ""})
app.py CHANGED
@@ -133,7 +133,7 @@ with gr.Blocks(title="AI Interviewer") as demo:
133
  end_btn = gr.Button("Finish the interview", interactive=False)
134
  chat = gr.Chatbot(label="Chat", show_label=False, show_share_button=False)
135
  audio_input = gr.Audio(interactive=False, **default_audio_params)
136
- message = gr.Textbox(label="Message", lines=3, visible=False)
137
 
138
  with gr.Accordion("Feedback", open=True) as feedback_acc:
139
  feedback = gr.Markdown()
@@ -166,16 +166,14 @@ with gr.Blocks(title="AI Interviewer") as demo:
166
  fn=llm.end_interview, inputs=[description, chat_history], outputs=[feedback]
167
  )
168
 
169
- audio_input.stop_recording(fn=stt.speech_to_text, inputs=[audio_input], outputs=[message]).then(
170
  fn=lambda: None, outputs=[audio_input]
171
- ).then(fn=add_candidate_message, inputs=[message, chat], outputs=[chat]).then(
172
  fn=llm.send_request,
173
- inputs=[code, previous_code, message, chat_history, chat],
174
  outputs=[chat_history, chat, previous_code],
175
  ).then(
176
  fn=tts.read_last_message, inputs=[chat], outputs=[audio_output]
177
- ).then(
178
- fn=lambda: "", outputs=[message]
179
  )
180
 
181
  demo.launch(show_api=False)
 
133
  end_btn = gr.Button("Finish the interview", interactive=False)
134
  chat = gr.Chatbot(label="Chat", show_label=False, show_share_button=False)
135
  audio_input = gr.Audio(interactive=False, **default_audio_params)
136
+ # message = gr.Textbox(label="Message", lines=3, visible=False)
137
 
138
  with gr.Accordion("Feedback", open=True) as feedback_acc:
139
  feedback = gr.Markdown()
 
166
  fn=llm.end_interview, inputs=[description, chat_history], outputs=[feedback]
167
  )
168
 
169
+ audio_input.stop_recording(fn=stt.speech_to_text, inputs=[audio_input, chat], outputs=[chat]).then(
170
  fn=lambda: None, outputs=[audio_input]
171
+ ).then(
172
  fn=llm.send_request,
173
+ inputs=[code, previous_code, chat_history, chat],
174
  outputs=[chat_history, chat, previous_code],
175
  ).then(
176
  fn=tts.read_last_message, inputs=[chat], outputs=[audio_output]
 
 
177
  )
178
 
179
  demo.launch(show_api=False)