MitchelHsu committed on
Commit
be41d24
1 Parent(s): f8d7a54

Upload folder using huggingface_hub

Browse files
Files changed (12) hide show
  1. .gitignore +7 -0
  2. Dockerfile +9 -0
  3. Procfile +1 -0
  4. README.md +3 -8
  5. app/agent.py +46 -0
  6. app/app.py +66 -0
  7. app/config.py +40 -0
  8. app/models.py +17 -0
  9. app/ui.py +70 -0
  10. app/utils.py +28 -0
  11. main.py +45 -0
  12. requirements.txt +7 -0
.gitignore ADDED
@@ -0,0 +1,7 @@
 
 
 
 
 
 
 
 
1
+ __pycache__/
2
+
3
+ # PyCharm
4
+ .idea/
5
+
6
+ # test logs
7
+ test_logs/
Dockerfile ADDED
@@ -0,0 +1,9 @@
 
 
 
 
 
 
 
 
 
 
1
+ FROM python:3.10-alpine
2
+
3
+ ARG KEY
4
+
5
+ WORKDIR /app
6
+ COPY . .
7
+ RUN pip3 install -r requirements.txt
8
+ ENV OPENAI_API_KEY=$KEY
9
+ CMD ["python3", "app/app.py"]
Procfile ADDED
@@ -0,0 +1 @@
 
 
1
+ web: gunicorn app.app:app
README.md CHANGED
@@ -1,12 +1,7 @@
1
  ---
2
- title: Cleric Agent Ui
3
- emoji: 🦀
4
- colorFrom: gray
5
- colorTo: yellow
6
  sdk: gradio
7
  sdk_version: 4.27.0
8
- app_file: app.py
9
- pinned: false
10
  ---
11
-
12
- Check out the configuration reference at https://huggingface.co/docs/hub/spaces-config-reference
 
1
  ---
2
+ title: cleric-agent-ui
3
+ app_file: app/ui.py
 
 
4
  sdk: gradio
5
  sdk_version: 4.27.0
 
 
6
  ---
7
+ # Doc-retrieve-agent
 
app/agent.py ADDED
@@ -0,0 +1,46 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ from langchain_openai import ChatOpenAI
2
+ from config import examples, example_template, template_v2
3
+ from langchain_core.prompts import PromptTemplate, FewShotPromptTemplate
4
+
5
+
6
+ class Agent:
7
+ def __init__(self, model):
8
+ self.llm = ChatOpenAI(model=model)
9
+
10
+ # Example template
11
+ self.example_prompt = PromptTemplate(
12
+ template=example_template,
13
+ input_variables=['question', 'logs', 'answer']
14
+ )
15
+
16
+ # Few shot prompt template containing examples and instructions
17
+ self.prompt = FewShotPromptTemplate(
18
+ examples=examples,
19
+ example_prompt=self.example_prompt,
20
+ suffix=template_v2,
21
+ input_variables=['question', 'logs']
22
+ )
23
+
24
+ self.question = None
25
+ self.logs = None
26
+ self.response = None
27
+
28
+ def process_request(self, question, logs):
29
+ self.question = question
30
+ self.logs = logs
31
+
32
+ prompt_formatted = self.prompt.format(
33
+ question=question,
34
+ logs=logs
35
+ )
36
+
37
+ self.response = self.llm.predict(prompt_formatted)
38
+
39
+ def get_question(self):
40
+ return self.question
41
+
42
+ def get_logs(self):
43
+ return self.logs
44
+
45
+ def get_response_list(self):
46
+ return self.response.split('\n')
app/app.py ADDED
@@ -0,0 +1,66 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ import time
2
+ from agent import Agent
3
+ from config import MODEL
4
+ from flask import Flask, jsonify, request
5
+ from utils import read_documents, preprocess_logs
6
+ from models import GetQuestionAndFactsResponse, SubmitQuestionAndDocumentsResponse, SubmitQuestionAndDocumentRequest
7
+
8
+ app = Flask(__name__)
9
+ agent = Agent(model=MODEL)
10
+ processing = False
11
+ submitted_data = None
12
+
13
+
14
+ @app.route('/get_question_and_facts', methods=['GET'])
15
+ def get_response():
16
+ global submitted_data, processing, agent
17
+
18
+ print(submitted_data)
19
+
20
+ if not submitted_data:
21
+ response = GetQuestionAndFactsResponse(
22
+ question='',
23
+ facts=[],
24
+ status='No data found.'
25
+ )
26
+ return jsonify(response.dict()), 200
27
+
28
+ if processing:
29
+ response = GetQuestionAndFactsResponse(
30
+ question=submitted_data.question,
31
+ facts=[],
32
+ status='processing'
33
+ )
34
+ return jsonify(response.dict()), 200
35
+
36
+ response = GetQuestionAndFactsResponse(
37
+ question=submitted_data.question,
38
+ facts=agent.get_response_list(),
39
+ status='done'
40
+ )
41
+
42
+ return jsonify(response.dict()), 200
43
+
44
+
45
+ @app.route('/submit_question_and_documents', methods=['POST'])
46
+ def submit_question():
47
+ global submitted_data, processing, agent
48
+ processing = True
49
+ request_content = request.get_json()
50
+ submitted_data = SubmitQuestionAndDocumentRequest(**request_content)
51
+
52
+ logs = read_documents(submitted_data.urls)
53
+ processed_logs = preprocess_logs(logs)
54
+
55
+ agent.process_request(
56
+ question=submitted_data.question,
57
+ logs=processed_logs
58
+ )
59
+
60
+ processing = False
61
+ response = SubmitQuestionAndDocumentsResponse()
62
+ return jsonify(response.dict()), 200
63
+
64
+
65
+ if __name__ == '__main__':
66
+ app.run(host='0.0.0.0', port=8000, debug=True)
app/config.py ADDED
@@ -0,0 +1,40 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ template = """
2
+ You are a call log summarization agent. Your job is to extract call summary bulletins only related to the question from a sequence of call logs. Please answer with bullets points only. Do not repeat facts in different bullets, and only response on facts with final decisions, avoid include previous decisions or decision process. Above are some examples of responses.\nGive response to the following question: {question}, according to the meeting logs:\n{logs}
3
+ """
4
+
5
+ template_v2 = """
6
+ You are a call log summarization agent. Your task is to process and extract relevant information from a set of call logs based on a single question provided.
7
+
8
+ Provide a concise list of facts extracted from the call logs that directly answer the question.
9
+ Avoid including the conversation process of the facts in your response.
10
+ Provide only the list, without any other text. Each bullet should only contain one single fact.
11
+ Please be mindful of updated facts/information/decisions and exclude any that have been canceled.
12
+ Above are some response examples.
13
+
14
+ Question: {question}
15
+ List of Call Logs:
16
+ {logs}
17
+ """
18
+
19
+ example_template = """Question: {question}
20
+ List of Call Logs:
21
+ {logs}
22
+ Answer:
23
+ {answer}"""
24
+
25
+ examples = [
26
+ {'logs': "00:00:10 - Alex: Let's choose our app's color scheme today.\n00:00:36 - Jordan: I suggest blue for a calm feel.\n00:00:51 - Casey: We need to make sure it's accessible to all users.",
27
+ 'question': 'What product design decisions did the team make?',
28
+ 'answer': "- The team will use blue for the color scheme of the app.\n- The team will make the app accessible to all users."},
29
+ {'logs': "1\n00:01:11,430 --> 00:01:40,520\n John: Hello, everybody. Let's start with the product design discussion. I think we should go with a modular design for our product. It will allow us to easily add or remove features as needed.\n\n2\n00:01:41,450 --> 00:01:49,190\nSara: I agree with John. A modular design will provide us with the flexibility we need. Also, I suggest we use a responsive design to ensure our product works well on all devices. Finally, I think we should use websockets to improve latency and provide real-time updates.\n\n3\n00:01:49,340 --> 00:01:50,040\nMike: Sounds good to me. I also propose we use a dark theme for the user interface. It's trendy and reduces eye strain for users. Let's hold off on the websockets for now since it's a little bit too much work.",
30
+ 'question': 'What are our product design decisions?',
31
+ 'answer': "- The team has decided to go with a modular design for the product.\n- The team has decided to use a responsive design to ensure the product works well on all devices.\n- The team has decided to use a dark theme for the user interface."},
32
+ {'logs': "1\n00:01:11,430 --> 00:01:40,520\nJohn: After giving it some more thought, I believe we should also consider a light theme option for the user interface. This will cater to users who prefer a brighter interface.\n\n2\n00:01:41,450 --> 00:01:49,190\nSara: That's a great idea, John. A light theme will provide an alternative to users who find the dark theme too intense.\n\n3\n00:01:49,340 --> 00:01:50,040\nMike: I'm on board with that.",
33
+ 'question': 'What are our product design decisions?',
34
+ 'answer': "- The team has decided to go with a modular design for the product.\n- The team has decided to use a responsive design to ensure the product works well on all devices.\n- The team has decided to provide both dark and light theme options for the user interface."},
35
+ {'logs': "1\n00:01:11,430 --> 00:01:40,520\nJohn: I've been thinking about our decision on the responsive design. While it's important to ensure our product works well on all devices, I think we should focus on desktop first. Our primary users will be using our product on desktops.\n\n2\n00:01:41,450 --> 00:01:49,190\nSara: I see your point, John. Focusing on desktop first will allow us to better cater to our primary users. I agree with this change.\n\n3\n00:01:49,340 --> 00:01:50,040\nMike: I agree as well. I also think the idea of using a modular design doesn't make sense. Let's not make that decision yet.",
36
+ 'question': 'What are our product design decisions?',
37
+ 'answer': "- The team has decided to focus on a desktop-first design\n- The team has decided to provide both dark and light theme options for the user interface."},
38
+ ]
39
+
40
+ MODEL = 'gpt-4'
app/models.py ADDED
@@ -0,0 +1,17 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ from pydantic import BaseModel
2
+ from typing import Optional, List
3
+
4
+
5
+ class GetQuestionAndFactsResponse(BaseModel):
6
+ question: str
7
+ facts: Optional[List[str]]
8
+ status: str
9
+
10
+
11
+ class SubmitQuestionAndDocumentsResponse(BaseModel):
12
+ pass
13
+
14
+
15
+ class SubmitQuestionAndDocumentRequest(BaseModel):
16
+ question: str
17
+ urls: List[str]
app/ui.py ADDED
@@ -0,0 +1,70 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ import time
2
+ import requests
3
+ import gradio as gr
4
+ from utils import get_url_list
5
+ from models import SubmitQuestionAndDocumentRequest, GetQuestionAndFactsResponse
6
+
7
+ base_url = 'https://cleric-agent-ad76f992e8d8.herokuapp.com/'
8
+
9
+
10
+ def fetch_facts(question, call_log_urls):
11
+ urls = get_url_list(call_log_urls)
12
+ payload = SubmitQuestionAndDocumentRequest(
13
+ question=question,
14
+ urls=urls
15
+ ).dict()
16
+ response = requests.post(f"{base_url}/submit_question_and_documents", json=payload)
17
+
18
+ start_time = time.time()
19
+ while True:
20
+ response = requests.get(f"{base_url}/get_question_and_facts")
21
+ if response.status_code != 200:
22
+ # st.error(f"Unexpected status code when getting question and facts: {response.status_code}")
23
+ return None
24
+ try:
25
+ data = GetQuestionAndFactsResponse(**response.json())
26
+ except ValueError as e:
27
+ # st.error(f"The response data does not match the expected schema: {str(e)}")
28
+ # st.write(response.json()) # Print the invalid data for debugging
29
+ return None
30
+
31
+ if data.status == "done":
32
+ break
33
+ elif time.time() - start_time > 300: # 5 minutes timeout
34
+ # st.error("Timeout: Facts not ready after 5 minutes")
35
+ return None
36
+ time.sleep(1)
37
+
38
+ return '\n'.join(data.facts)
39
+
40
+
41
+ with gr.Blocks() as demo:
42
+ gr.Markdown("""
43
+ # Cleric Call Logs Summarize Agent
44
+
45
+ Please place the URLs in the Call Logs URLs text box, separated by new line.
46
+ Place your question to this call logs, then submit!
47
+ """)
48
+ error_box = gr.Textbox(label="Error", visible=False)
49
+ with gr.Row(equal_height=True):
50
+ call_logs_box = gr.Textbox(label='Call Logs URLs', scale=2)
51
+ facts_box = gr.Textbox(label='Extracted Facts', scale=2)
52
+
53
+ question_box = gr.Textbox(label='Question')
54
+ submit_btn = gr.Button("Submit")
55
+
56
+ submit_btn.click(
57
+ fetch_facts,
58
+ inputs=[call_logs_box, question_box],
59
+ outputs=facts_box
60
+ )
61
+
62
+ # iface = gr.Interface(
63
+ # fn=fetch_facts,
64
+ # inputs=["text", "text"],
65
+ # outputs="text",
66
+ # allow_flagging="never",
67
+ # title="Cleric Call Logs Summarize Agent"
68
+ # )
69
+ demo.launch()
70
+
app/utils.py ADDED
@@ -0,0 +1,28 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ import requests
2
+ from typing import List
3
+
4
+
5
+ def load_logs(log_paths: List) -> str:
6
+ logs = ""
7
+ for i, path in enumerate(log_paths):
8
+ with open(path, 'r') as f:
9
+ logs += f"Log {i}:\n" + f.read() + '\n'
10
+
11
+ return logs
12
+
13
+
14
+ def get_url_list(call_log_urls: str) -> List[str]:
15
+ return call_log_urls.split('\n')
16
+
17
+
18
+ def read_documents(documents: List[str]) -> List[str]:
19
+ logs = []
20
+ for url in documents:
21
+ response = requests.get(url)
22
+ logs.append(response.text)
23
+
24
+ return logs
25
+
26
+
27
+ def preprocess_logs(logs: List[str]):
28
+ return '\n'.join(logs)
main.py ADDED
@@ -0,0 +1,45 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ import os
2
+
3
+ from config import *
4
+ from pydantic import BaseModel
5
+ from langchain_openai import ChatOpenAI
6
+ from utils import load_logs, read_documents, preprocess_logs
7
+ from langchain_core.prompts import FewShotPromptTemplate, PromptTemplate
8
+
9
+ llm = ChatOpenAI(model=MODEL)
10
+
11
+ class SubmitQuestionAndDocumentsResponse(BaseModel):
12
+ pass # The response body doesn't matter for this endpoint
13
+
14
+
15
+ if __name__ == '__main__':
16
+ documents = [
17
+ "https://storage.googleapis.com/cleric-assignment-call-logs/call_log_20240314_104111.txt",
18
+ "https://storage.googleapis.com/cleric-assignment-call-logs/call_log_20240315_104111.txt",
19
+ "https://storage.googleapis.com/cleric-assignment-call-logs/call_log_20240316_104111.txt"
20
+ ]
21
+
22
+ logs = read_documents(documents)
23
+ processed_logs = preprocess_logs(logs)
24
+
25
+ example_prompt = PromptTemplate(
26
+ template=example_template,
27
+ input_variables=["question", "logs", "answer"]
28
+ )
29
+
30
+ prompt = FewShotPromptTemplate(
31
+ examples=examples,
32
+ example_prompt=example_prompt,
33
+ suffix=template,
34
+ input_variables=["question", "logs"]
35
+ )
36
+
37
+ prompt_formatted = prompt.format(
38
+ question='What product design decisions did the team make?',
39
+ logs=processed_logs
40
+ )
41
+
42
+ print(prompt_formatted)
43
+ # bullets = llm.predict(prompt_formatted)
44
+ # print(bullets)
45
+
requirements.txt ADDED
@@ -0,0 +1,7 @@
 
 
 
 
 
 
 
 
1
Flask
gunicorn
gradio
requests
openai
langchain
langchain-openai
pydantic