Spaces:
Running
on
CPU Upgrade
Running
on
CPU Upgrade
import gradio as gr | |
import pandas as pd | |
import numpy as np | |
import os | |
import time | |
import re | |
import json | |
from auditqa.sample_questions import QUESTIONS | |
from auditqa.reports import POSSIBLE_REPORTS | |
from auditqa.engine.prompts import audience_prompts | |
from auditqa.doc_process import process_markdown, process_pdf | |
from auditqa.engine.vectorstore import create_vectorstore | |
# process files | |
# process_markdown() | |
docs = process_pdf() | |
create_vectorstore(docs) | |
async def chat(query,history,audience,sources,reports): | |
"""taking a query and a message history, use a pipeline (reformulation, retriever, answering) to yield a tuple of: | |
(messages in gradio format, messages in langchain format, source documents)""" | |
print(f">> NEW QUESTION : {query}") | |
print(f"history:{history}") | |
print(f"audience:{audience}") | |
print(f"sources:{sources}") | |
print(f"reports:{reports}") | |
if audience == "Children": | |
audience_prompt = audience_prompts["children"] | |
elif audience == "General public": | |
audience_prompt = audience_prompts["general"] | |
elif audience == "Experts": | |
audience_prompt = audience_prompts["experts"] | |
else: | |
audience_prompt = audience_prompts["experts"] | |
# Prepare default values | |
if len(sources) == 0: | |
sources = ["IPCC"] | |
if len(reports) == 0: | |
reports = [] | |
history = [tuple(x) for x in history] | |
docs_html = "" | |
output_query = "" | |
output_language = "ENG" | |
yield history,docs_html,output_query,output_language | |
# -------------------------------------------------------------------- | |
# Gradio | |
# -------------------------------------------------------------------- | |
# Set up Gradio Theme | |
theme = gr.themes.Base( | |
primary_hue="blue", | |
secondary_hue="red", | |
font=[gr.themes.GoogleFont("Poppins"), "ui-sans-serif", "system-ui", "sans-serif"], | |
) | |
init_prompt = """ | |
Hello, I am Audit Q&A, a conversational assistant designed to help you understand audit Reports. I will answer your questions by **crawling through the Audit reports publishsed by Auditor General Office**. | |
❓ How to use | |
- **Language**: You can ask me your questions in any language. | |
- **Audience**: You can specify your audience (children, general public, experts) to get a more adapted answer. | |
- **Sources**: You can choose to search in the Annual or District or Department focused reports, or all. | |
⚠️ Limitations | |
*Please note that the AI is not perfect and may sometimes give irrelevant answers. If you are not satisfied with the answer, please ask a more specific question or report your feedback to help us improve the system.* | |
What do you want to learn ? | |
""" | |
# Setting Tabs | |
with gr.Blocks(title="Audit Q&A", css="style.css", theme=theme,elem_id = "main-component") as demo: | |
# user_id_state = gr.State([user_id]) | |
with gr.Tab("AuditQ&A"): | |
with gr.Row(elem_id="chatbot-row"): | |
with gr.Column(scale=2): | |
# state = gr.State([system_template]) | |
chatbot = gr.Chatbot( | |
value=[(None,init_prompt)], | |
show_copy_button=True,show_label = False,elem_id="chatbot",layout = "panel", | |
avatar_images = (None,"https://i.ibb.co/YNyd5W2/logo4.png"), | |
)#,avatar_images = ("assets/logo4.png",None)) | |
# bot.like(vote,None,None) | |
with gr.Row(elem_id = "input-message"): | |
textbox=gr.Textbox(placeholder="Ask me anything here!",show_label=False,scale=7,lines = 1,interactive = True,elem_id="input-textbox") | |
# submit = gr.Button("",elem_id = "submit-button",scale = 1,interactive = True,icon = "https://static-00.iconduck.com/assets.00/settings-icon-2048x2046-cw28eevx.png") | |
with gr.Column(scale=1, variant="panel",elem_id = "right-panel"): | |
with gr.Tabs() as tabs: | |
with gr.TabItem("Examples",elem_id = "tab-examples",id = 0): | |
examples_hidden = gr.Textbox(visible = False) | |
first_key = list(QUESTIONS.keys())[0] | |
dropdown_samples = gr.Dropdown(QUESTIONS.keys(),value = first_key,interactive = True,show_label = True,label = "Select a category of sample questions",elem_id = "dropdown-samples") | |
samples = [] | |
for i,key in enumerate(QUESTIONS.keys()): | |
examples_visible = True if i == 0 else False | |
with gr.Row(visible = examples_visible) as group_examples: | |
examples_questions = gr.Examples( | |
QUESTIONS[key], | |
[examples_hidden], | |
examples_per_page=8, | |
run_on_click=False, | |
elem_id=f"examples{i}", | |
api_name=f"examples{i}", | |
# label = "Click on the example question or enter your own", | |
# cache_examples=True, | |
) | |
samples.append(group_examples) | |
with gr.Tab("Sources",elem_id = "tab-citations",id = 1): | |
sources_textbox = gr.HTML(show_label=False, elem_id="sources-textbox") | |
docs_textbox = gr.State("") | |
# with Modal(visible = False) as config_modal: | |
with gr.Tab("Configuration",elem_id = "tab-config",id = 2): | |
gr.Markdown("Reminder: You can talk in any language, Audit Q&A is multi-lingual!") | |
dropdown_sources = gr.CheckboxGroup( | |
["Consolidated", "MWTS"], | |
label="Select source", | |
value=["Consolidated"], | |
interactive=True, | |
) | |
dropdown_reports = gr.Dropdown( | |
POSSIBLE_REPORTS, | |
label="Or select specific reports", | |
multiselect=True, | |
value=None, | |
interactive=True, | |
) | |
dropdown_audience = gr.Dropdown( | |
["Children","General public","Experts"], | |
label="Select audience", | |
value="Experts", | |
interactive=True, | |
) | |
output_query = gr.Textbox(label="Query used for retrieval",show_label = True,elem_id = "reformulated-query",lines = 2,interactive = False) | |
output_language = gr.Textbox(label="Language",show_label = True,elem_id = "language",lines = 1,interactive = False) | |
with gr.Tab("About",elem_classes = "max-height other-tabs"): | |
with gr.Row(): | |
with gr.Column(scale=1): | |
gr.Markdown("See more info at [https://www.oag.go.ug/](https://www.oag.go.ug/welcome)") | |
def start_chat(query,history): | |
history = history + [(query,None)] | |
history = [tuple(x) for x in history] | |
return (gr.update(interactive = False),gr.update(selected=1),history) | |
def finish_chat(): | |
return (gr.update(interactive = True,value = "")) | |
(textbox | |
.submit(start_chat, [textbox,chatbot], [textbox,tabs,chatbot],queue = False,api_name = "start_chat_textbox") | |
.then(chat, [textbox,chatbot,dropdown_audience, dropdown_sources,dropdown_reports], [chatbot,sources_textbox,output_query,output_language],concurrency_limit = 8,api_name = "chat_textbox") | |
.then(finish_chat, None, [textbox],api_name = "finish_chat_textbox") | |
) | |
(examples_hidden | |
.change(start_chat, [examples_hidden,chatbot], [textbox,tabs,chatbot],queue = False,api_name = "start_chat_examples") | |
.then(chat, [examples_hidden,chatbot,dropdown_audience, dropdown_sources,dropdown_reports], [chatbot,sources_textbox,output_query,output_language],concurrency_limit = 8,api_name = "chat_examples") | |
.then(finish_chat, None, [textbox],api_name = "finish_chat_examples") | |
) | |
def change_sample_questions(key): | |
index = list(QUESTIONS.keys()).index(key) | |
visible_bools = [False] * len(samples) | |
visible_bools[index] = True | |
return [gr.update(visible=visible_bools[i]) for i in range(len(samples))] | |
dropdown_samples.change(change_sample_questions,dropdown_samples,samples) | |
demo.queue() | |
demo.launch() |