interviewer / api /llm.py
IliaLarchenko's picture
Reduced tts delay
eee97a9
raw
history blame
No virus
6.63 kB
import os
from openai import OpenAI
from utils.errors import APIError
from typing import List, Dict, Generator, Optional, Tuple
class PromptManager:
def __init__(self, prompts: Dict[str, str]):
self.prompts = prompts
self.limit = os.getenv("DEMO_WORD_LIMIT")
def add_limit(self, prompt: str) -> str:
"""
Add word limit to the prompt if specified in the environment variables.
"""
if self.limit:
prompt += f" Keep your responses very short and simple, no more than {self.limit} words."
return prompt
def get_system_prompt(self, key: str) -> str:
"""
Retrieve and limit a system prompt by its key.
"""
prompt = self.prompts[key]
return self.add_limit(prompt)
def get_problem_requirements_prompt(
self, type: str, difficulty: Optional[str] = None, topic: Optional[str] = None, requirements: Optional[str] = None
) -> str:
"""
Create a problem requirements prompt with optional parameters.
"""
prompt = f"Create a {type} problem. Difficulty: {difficulty}. Topic: {topic}. Additional requirements: {requirements}."
return self.add_limit(prompt)
class LLMManager:
def __init__(self, config, prompts: Dict[str, str]):
self.config = config
self.client = OpenAI(base_url=config.llm.url, api_key=config.llm.key)
self.prompt_manager = PromptManager(prompts)
self.status = self.test_llm(stream=False)
self.streaming = self.test_llm(stream=True) if self.status else False
def get_text(self, messages: List[Dict[str, str]], stream: Optional[bool] = None) -> Generator[str, None, None]:
"""
Generate text from the LLM, optionally streaming the response.
"""
if stream is None:
stream = self.streaming
try:
if not stream:
response = self.client.chat.completions.create(
model=self.config.llm.name, messages=messages, temperature=1, max_tokens=2000
)
yield response.choices[0].message.content.strip()
else:
response = self.client.chat.completions.create(
model=self.config.llm.name, messages=messages, temperature=1, stream=True, max_tokens=2000
)
for chunk in response:
if chunk.choices[0].delta.content:
yield chunk.choices[0].delta.content
except Exception as e:
raise APIError(f"LLM Get Text Error: Unexpected error: {e}")
def test_llm(self, stream=False) -> bool:
"""
Test the LLM connection with or without streaming.
"""
try:
list(
self.get_text(
[
{"role": "system", "content": "You just help me test the connection."},
{"role": "user", "content": "Hi!"},
{"role": "user", "content": "Ping!"},
],
stream=stream,
)
)
return True
except:
return False
def init_bot(self, problem: str, interview_type: str = "coding") -> List[Dict[str, str]]:
"""
Initialize the bot with a system prompt and problem description.
"""
system_prompt = self.prompt_manager.get_system_prompt(f"{interview_type}_interviewer_prompt")
return [{"role": "system", "content": f"{system_prompt}\nThe candidate is solving the following problem:\n {problem}"}]
def get_problem_prepare_messages(self, requirements: str, difficulty: str, topic: str, interview_type: str) -> List[Dict[str, str]]:
"""
Prepare messages for generating a problem based on given requirements.
"""
system_prompt = self.prompt_manager.get_system_prompt(f"{interview_type}_problem_generation_prompt")
full_prompt = self.prompt_manager.get_problem_requirements_prompt(interview_type, difficulty, topic, requirements)
return [
{"role": "system", "content": system_prompt},
{"role": "user", "content": full_prompt},
]
def get_problem(self, requirements: str, difficulty: str, topic: str, interview_type: str) -> Generator[str, None, None]:
"""
Get a problem from the LLM based on the given requirements, difficulty, and topic.
"""
messages = self.get_problem_prepare_messages(requirements, difficulty, topic, interview_type)
problem = ""
for text in self.get_text(messages):
problem += text
yield problem
def update_chat_history(
self, code: str, previous_code: str, chat_history: List[Dict[str, str]], chat_display: List[List[Optional[str]]]
) -> List[Dict[str, str]]:
"""
Update chat history with the latest user message and code.
"""
message = chat_display[-1][0]
if code != previous_code:
message += "\nMY NOTES AND CODE:\n" + code
chat_history.append({"role": "user", "content": message})
return chat_history
def end_interview_prepare_messages(
self, problem_description: str, chat_history: List[Dict[str, str]], interview_type: str
) -> List[Dict[str, str]]:
"""
Prepare messages to end the interview and generate feedback.
"""
transcript = [f"{message['role'].capitalize()}: {message['content']}" for message in chat_history[1:]]
system_prompt = self.prompt_manager.get_system_prompt(f"{interview_type}_grading_feedback_prompt")
return [
{"role": "system", "content": system_prompt},
{"role": "user", "content": f"The original problem to solve: {problem_description}"},
{"role": "user", "content": "\n\n".join(transcript)},
{"role": "user", "content": "Grade the interview based on the transcript provided and give feedback."},
]
def end_interview(
self, problem_description: str, chat_history: List[Dict[str, str]], interview_type: str = "coding"
) -> Generator[str, None, None]:
"""
End the interview and get feedback from the LLM.
"""
if len(chat_history) <= 2:
yield "No interview history available"
return
messages = self.end_interview_prepare_messages(problem_description, chat_history, interview_type)
feedback = ""
for text in self.get_text(messages):
feedback += text
yield feedback