MitchelHsu commited on
Commit
6774ab2
1 parent: c8cd6ca

Upload folder using huggingface_hub

Browse files
Files changed (6) hide show
  1. .gitignore +4 -1
  2. Procfile +1 -0
  3. app/agent.py +60 -0
  4. app/app.py +107 -0
  5. app/config.py +47 -0
  6. app/ui.py +2 -2
.gitignore CHANGED
@@ -4,4 +4,7 @@ __pycache__/
4
  .idea/
5
 
6
  # test logs
7
- test_logs/
 
 
 
 
4
  .idea/
5
 
6
  # test logs
7
+ test_logs/
8
+
9
+ # Test file
10
+ main.py
Procfile ADDED
@@ -0,0 +1 @@
 
 
1
+ web: gunicorn app.app:app
app/agent.py ADDED
@@ -0,0 +1,60 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ from utils import preprocess_logs
2
+ from langchain_openai import ChatOpenAI
3
+ from config import examples, example_template, template_v2
4
+ from langchain_core.prompts import PromptTemplate, FewShotPromptTemplate
5
+
6
+
7
class Agent:
    """LLM agent that extracts fact summaries from call logs via few-shot prompting."""

    def __init__(self, model):
        """Build the chat model client and the few-shot prompt pipeline.

        Args:
            model: OpenAI chat model name forwarded to ChatOpenAI.
        """
        self.llm = ChatOpenAI(model=model)

        # Template used to render each few-shot example.
        self.example_prompt = PromptTemplate(
            template=example_template,
            input_variables=['question', 'logs', 'answer']
        )

        # Few-shot prompt: worked examples followed by the instruction template.
        self.prompt = FewShotPromptTemplate(
            examples=examples,
            example_prompt=self.example_prompt,
            suffix=template_v2,
            input_variables=['question', 'logs']
        )

        # State captured by the most recent summarize() call.
        self.question = None
        self.logs = None
        self.response = None

    def summarize(self, question, logs, retriever=None):
        """Run the LLM over the logs for `question`; result stored in self.response.

        Args:
            question: user question to extract facts for.
            logs: raw log text (preprocessed and used directly when no retriever).
            retriever: optional retriever; when given, retrieved chunks are used
                instead of the raw logs.
        """
        self.question = question
        if retriever:
            # BUG FIX: record the retrieved chunks in self.logs so get_logs()
            # reflects what was actually sent to the model (previously the
            # retriever branch left self.logs stale from an earlier call).
            self.logs = self.retrieve_logs(retriever)
        else:
            self.logs = preprocess_logs(logs)

        prompt_formatted = self.prompt.format(
            question=question,
            logs=self.logs
        )

        self.response = self.llm.predict(prompt_formatted)

    def retrieve_logs(self, retriever):
        """Retrieve log chunks relevant to self.question, highest node id first."""
        retriever_nodes = retriever.retrieve(self.question)
        # NOTE(review): descending node-id order presents later chunks first —
        # confirm this is the intended ordering for the prompt.
        retriever_nodes = sorted(retriever_nodes, key=lambda n: n.node_id, reverse=True)

        return '\n'.join([node.text for node in retriever_nodes])

    def get_question(self):
        """Return the question from the last summarize() call."""
        return self.question

    def get_logs(self):
        """Return the logs (preprocessed or retrieved) last sent to the model."""
        return self.logs

    def get_response_list(self):
        """Return the model response split into lines (one fact per bullet)."""
        return self.response.split('\n')
app/app.py ADDED
@@ -0,0 +1,107 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ from agent import Agent
2
+ from flask import Flask, jsonify, request
3
+ from config import MODEL, CHUNK_SIZE, CHUNK_OVERLAP, RETRIEVE_TOP_K
4
+ from utils import read_documents, validate_request_logs, preprocess_logs
5
+ from models import GetQuestionAndFactsResponse, SubmitQuestionAndDocumentsResponse, SubmitQuestionAndDocumentRequest
6
+
7
+ from llama_index.core import VectorStoreIndex, Document
8
+ from llama_index.core.node_parser import SentenceSplitter
9
+ from llama_index.core.retrievers import VectorIndexRetriever
10
+
11
# Flask application and a single shared Agent instance, created at import time.
app = Flask(__name__)
agent = Agent(model=MODEL)
# Module-level request state shared by the two routes below.
# NOTE(review): mutable globals are not safe across multiple gunicorn
# workers/threads — confirm the deployment runs a single worker.
processing = False
submitted_data = None
16
+
17
@app.route('/get_question_and_facts', methods=['GET'])
def get_response():
    """Report the state of the last submission and, once done, its extracted facts."""
    global submitted_data, processing, agent

    # Nothing has been submitted yet.
    if not submitted_data:
        empty = GetQuestionAndFactsResponse(
            question='',
            facts=[],
            status='No data found, please submit data'
        )
        return jsonify(empty.dict()), 200

    # A submission exists but the agent is still working on it.
    if processing:
        pending = GetQuestionAndFactsResponse(
            question=submitted_data.question,
            facts=[],
            status='processing'
        )
        return jsonify(pending.dict()), 200

    # Finished: surface the agent's fact list.
    done = GetQuestionAndFactsResponse(
        question=submitted_data.question,
        facts=agent.get_response_list(),
        status='done'
    )
    return jsonify(done.dict()), 200
47
+
48
+
49
@app.route('/submit_question_and_documents', methods=['POST'])
def submit_question():
    """Validate a submission, load its documents, index them, and run the agent.

    Always responds 200 with a SubmitQuestionAndDocumentsResponse whose status
    describes success or the specific validation/read failure.
    """
    global submitted_data, processing, agent
    processing = True
    request_content = request.get_json()

    try:
        # Submit payload read and validation.
        try:
            submitted_data = SubmitQuestionAndDocumentRequest(**request_content)
        except ValueError as e:
            response = SubmitQuestionAndDocumentsResponse(status=f'Request payload does not match expected schema: {str(e)}')
            return jsonify(response.dict()), 200

        # Validate request URL formats.
        try:
            validate_request_logs(submitted_data.documents)
        except ValueError as e:
            # Respond with URL validation failed error.
            response = SubmitQuestionAndDocumentsResponse(status=f'URL validation failed: {e}')
            return jsonify(response.dict()), 200

        # Try loading documents.
        try:
            logs = read_documents(submitted_data.documents)
        except Exception as e:
            # Respond with URL read fail if URL read error.
            response = SubmitQuestionAndDocumentsResponse(status=f'URL read failed: {e}')
            return jsonify(response.dict()), 200

        # No usable content in any of the URLs.
        if len(logs) == 0:
            response = SubmitQuestionAndDocumentsResponse(status='No data found in the URLs')
            return jsonify(response.dict()), 200

        # Chunk the preprocessed logs for retrieval.
        documents = [Document(text=preprocess_logs(logs))]
        parser = SentenceSplitter(chunk_size=CHUNK_SIZE, chunk_overlap=CHUNK_OVERLAP)
        nodes = parser.get_nodes_from_documents(documents)

        # Assign sequential ids so Agent.retrieve_logs can order chunks.
        for i, node in enumerate(nodes):
            node.id_ = i

        index = VectorStoreIndex(nodes)
        retriever = VectorIndexRetriever(index, similarity_top_k=RETRIEVE_TOP_K)

        # Call agent to summarize logs.
        agent.summarize(
            question=submitted_data.question,
            logs=logs,
            retriever=retriever
        )

        response = SubmitQuestionAndDocumentsResponse(status='success')
        return jsonify(response.dict()), 200
    finally:
        # BUG FIX: previously only the success path reset `processing`, so any
        # early-return failure left GET /get_question_and_facts reporting
        # 'processing' forever. The finally clause guarantees the reset.
        processing = False
104
+
105
+
106
# Dev entry point; production serves via gunicorn (see Procfile).
if __name__ == '__main__':
    # NOTE(review): debug=True should not ship to production — confirm.
    app.run(host='0.0.0.0', port=8000, debug=True)
app/config.py ADDED
@@ -0,0 +1,47 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+
2
# LangChain templates
# NOTE(review): `template` appears superseded by `template_v2` (agent.py
# imports only template_v2) — confirm no other importer before removing.
template = """
You are a call log summarization agent. Your job is to extract call summary bulletins only related to the question from a sequence of call logs. Please answer with bullets points only. Do not repeat facts in different bullets, and only response on facts with final decisions, avoid include previous decisions or decision process. Above are some examples of responses.\nGive response to the following question: {question}, according to the meeting logs:\n{logs}
"""

# Instruction suffix appended after the few-shot examples; expects
# {question} and {logs} placeholders (see Agent.prompt).
template_v2 = """
You are a call log fact extraction agent. Your task is to process and extract information from a set of call logs based on a single question provided.

Provide a concise list of facts extracted from the call logs that directly answer the question. Avoid including the conversation process of the facts in your response. Provide only the list, without any other text. Each bullet should only contain one single fact. Please be mindful of the order of the logs and the updated facts/information/decisions and exclude any that have been canceled, including any associated relations.
If the question seems irrelevant to the call logs provided, please just reply "The question seems irrelevant to the call logs provided.".
Above are some response examples.

Question: {question}
List of Call Logs:
{logs}
"""

# Layout used to render each few-shot example ({question}, {logs}, {answer}).
example_template = """Question: {question}
List of Call Logs:
{logs}
Answer:
{answer}"""

# Few-shot examples: each dict supplies logs, question and the expected
# bullet-list answer, demonstrating how superseded decisions are dropped.
examples = [
    {'logs': "00:00:10 - Alex: Let's choose our app's color scheme today.\n00:00:36 - Jordan: I suggest blue for a calm feel.\n00:00:51 - Casey: We need to make sure it's accessible to all users.",
     'question': 'What product design decisions did the team make?',
     'answer': "- The team will use blue for the color scheme of the app.\n- The team will make the app accessible to all users."},
    {'logs': "1\n00:01:11,430 --> 00:01:40,520\n John: Hello, everybody. Let's start with the product design discussion. I think we should go with a modular design for our product. It will allow us to easily add or remove features as needed.\n\n2\n00:01:41,450 --> 00:01:49,190\nSara: I agree with John. A modular design will provide us with the flexibility we need. Also, I suggest we use a responsive design to ensure our product works well on all devices. Finally, I think we should use websockets to improve latency and provide real-time updates.\n\n3\n00:01:49,340 --> 00:01:50,040\nMike: Sounds good to me. I also propose we use a dark theme for the user interface. It's trendy and reduces eye strain for users. Let's hold off on the websockets for now since it's a little bit too much work.",
     'question': 'What are our product design decisions?',
     'answer': "- The team has decided to go with a modular design for the product.\n- The team has decided to use a responsive design to ensure the product works well on all devices.\n- The team has decided to use a dark theme for the user interface."},
    {'logs': "1\n00:01:11,430 --> 00:01:40,520\nJohn: After giving it some more thought, I believe we should also consider a light theme option for the user interface. This will cater to users who prefer a brighter interface.\n\n2\n00:01:41,450 --> 00:01:49,190\nSara: That's a great idea, John. A light theme will provide an alternative to users who find the dark theme too intense.\n\n3\n00:01:49,340 --> 00:01:50,040\nMike: I'm on board with that.",
     'question': 'What are our product design decisions?',
     'answer': "- The team has decided to go with a modular design for the product.\n- The team has decided to use a responsive design to ensure the product works well on all devices.\n- The team has decided to provide both dark and light theme options for the user interface."},
    {'logs': "1\n00:01:11,430 --> 00:01:40,520\nJohn: I've been thinking about our decision on the responsive design. While it's important to ensure our product works well on all devices, I think we should focus on desktop first. Our primary users will be using our product on desktops.\n\n2\n00:01:41,450 --> 00:01:49,190\nSara: I see your point, John. Focusing on desktop first will allow us to better cater to our primary users. I agree with this change.\n\n3\n00:01:49,340 --> 00:01:50,040\nMike: I agree as well. I also think the idea of using a modular design doesn't make sense. Let's not make that decision yet.",
     'question': 'What are our product design decisions?',
     'answer': "- The team has decided to focus on a desktop-first design\n- The team has decided to provide both dark and light theme options for the user interface."},
]

# OPENAI MODEL
MODEL = 'gpt-4'

# LLamaIndex Configs
CHUNK_SIZE = 80  # For parser
CHUNK_OVERLAP = 20

# Number of chunks returned per retrieval query.
RETRIEVE_TOP_K = 10
app/ui.py CHANGED
@@ -1,11 +1,11 @@
 
1
  import time
2
  import requests
3
  import gradio as gr
4
  from utils import get_url_list
5
  from models import SubmitQuestionAndDocumentRequest, GetQuestionAndFactsResponse, SubmitQuestionAndDocumentsResponse
6
 
7
- base_url = 'https://cleric-agent-api-untxx3isja-uc.a.run.app'
8
- # base_url = 'http://localhost:8000'
9
 
10
 
11
  def fetch_facts(question, call_log_urls):
 
1
+ import os
2
  import time
3
  import requests
4
  import gradio as gr
5
  from utils import get_url_list
6
  from models import SubmitQuestionAndDocumentRequest, GetQuestionAndFactsResponse, SubmitQuestionAndDocumentsResponse
7
 
8
+ base_url = os.environ['CLERIC_API_ENDPOINT']
 
9
 
10
 
11
  def fetch_facts(question, call_log_urls):