slide-deck-ai / chat_app.py
barunsaha's picture
Add exception handling for JSON parsing and slide deck generation
3919051
raw
history blame
7.3 kB
import datetime
import logging
import pathlib
import random
import tempfile
from typing import List
import json5
import streamlit as st
from langchain_community.chat_message_histories import (
StreamlitChatMessageHistory
)
from langchain_core.prompts import ChatPromptTemplate
from langchain_core.runnables.history import RunnableWithMessageHistory
from global_config import GlobalConfig
from helpers import llm_helper, pptx_helper
APP_TEXT = json5.loads(open(GlobalConfig.APP_STRINGS_FILE, 'r', encoding='utf-8').read())
DOWNLOAD_FILE_KEY = 'download_file_name'
# langchain.debug = True
# langchain.verbose = True
logger = logging.getLogger(__name__)
progress_bar = st.progress(0, text='Setting up SlideDeck AI...')
texts = list(GlobalConfig.PPTX_TEMPLATE_FILES.keys())
captions = [GlobalConfig.PPTX_TEMPLATE_FILES[x]['caption'] for x in texts]
pptx_template = st.sidebar.radio(
'Select a presentation template:',
texts,
captions=captions,
horizontal=True
)
def display_page_header_content():
"""
Display content in the page header.
"""
st.title(APP_TEXT['app_name'])
st.subheader(APP_TEXT['caption'])
st.markdown(
'Powered by'
' [Mistral-7B-Instruct-v0.2](https://huggingface.co/mistralai/Mistral-7B-Instruct-v0.2)'
)
def display_page_footer_content():
"""
Display content in the page footer.
"""
st.text(APP_TEXT['tos'] + '\n\n' + APP_TEXT['tos2'])
# st.markdown(
# '![Visitors](https://api.visitorbadge.io/api/visitors?path=https%3A%2F%2Fhuggingface.co%2Fspaces%2Fbarunsaha%2Fslide-deck-ai&countColor=%23263759)' # noqa: E501
# )
def build_ui():
"""
Display the input elements for content generation.
"""
display_page_header_content()
with st.expander('Usage Policies and Limitations'):
display_page_footer_content()
progress_bar.progress(50, text='Setting up chat interface...')
set_up_chat_ui()
def set_up_chat_ui():
"""
Prepare the chat interface and related functionality.
"""
history = StreamlitChatMessageHistory(key='chat_messages')
llm = llm_helper.get_hf_endpoint()
with open(GlobalConfig.CHAT_TEMPLATE_FILE, 'r', encoding='utf-8') as in_file:
template = in_file.read()
prompt = ChatPromptTemplate.from_template(template)
chain = prompt | llm
chain_with_history = RunnableWithMessageHistory(
chain,
lambda session_id: history, # Always return the instance created earlier
input_messages_key='question',
history_messages_key='chat_history',
)
with st.expander('Usage Instructions'):
st.write(GlobalConfig.CHAT_USAGE_INSTRUCTIONS)
st.chat_message('ai').write(
random.choice(APP_TEXT['ai_greetings'])
)
for msg in history.messages:
# st.chat_message(msg.type).markdown(msg.content)
st.chat_message(msg.type).code(msg.content, language='json')
# The download button disappears on clicking (anywhere) because of app reload
# So, display it again
if DOWNLOAD_FILE_KEY in st.session_state:
_display_download_button(st.session_state[DOWNLOAD_FILE_KEY])
progress_bar.progress(100, text='Done!')
progress_bar.empty()
if prompt := st.chat_input(
placeholder=APP_TEXT['chat_placeholder'],
max_chars=GlobalConfig.LLM_MODEL_MAX_INPUT_LENGTH
):
logger.debug('User input: %s', prompt)
st.chat_message('user').write(prompt)
progress_bar_pptx = st.progress(0, 'Calling LLM...')
# As usual, new messages are added to StreamlitChatMessageHistory when the Chain is called
config = {'configurable': {'session_id': 'any'}}
response: str = chain_with_history.invoke({'question': prompt}, config)
st.chat_message('ai').markdown('```json\n' + response)
# The content has been generated as JSON
# There maybe trailing ``` at the end of the response -- remove them
# To be careful: ``` may be part of the content as well when code is generated
response_cleaned = _clean_json(response)
progress_bar_pptx.progress(50, 'Analyzing response...')
# Now create the PPT file
progress_bar_pptx.progress(75, 'Creating the slide deck...give it a moment')
generate_slide_deck(response_cleaned)
progress_bar_pptx.progress(100, text='Done!')
def generate_slide_deck(json_str: str):
"""
Create a slide deck.
:param json_str: The content in *valid* JSON format.
"""
if DOWNLOAD_FILE_KEY in st.session_state:
path = pathlib.Path(st.session_state[DOWNLOAD_FILE_KEY])
logger.debug('DOWNLOAD_FILE_KEY found in session')
else:
temp = tempfile.NamedTemporaryFile(delete=False, suffix='.pptx')
path = pathlib.Path(temp.name)
st.session_state[DOWNLOAD_FILE_KEY] = str(path)
logger.debug('DOWNLOAD_FILE_KEY not found in session')
logger.debug('Creating PPTX file: %s...', st.session_state[DOWNLOAD_FILE_KEY])
try:
pptx_helper.generate_powerpoint_presentation(
json_str,
slides_template=pptx_template,
output_file_path=path
)
_display_download_button(path)
except ValueError as ve:
st.error(APP_TEXT['json_parsing_error'])
logger.error('%s', APP_TEXT['json_parsing_error'])
logger.error('Additional error info: %s', str(ve))
except Exception as ex:
st.error(APP_TEXT['content_generation_error'])
logger.error('Caught a generic exception: %s', str(ex))
def _clean_json(json_str: str) -> str:
"""
Attempt to clean a JSON response string from the LLM by removing the trailing ```
and any text beyond that. May not be always accurate.
:param json_str: The input string in JSON format.
:return: The "cleaned" JSON string.
"""
str_len = len(json_str)
response_cleaned = json_str
try:
idx = json_str.rindex('```')
logger.debug(
'Fixing JSON response: str_len: %d, idx of ```: %d',
str_len, idx
)
if idx + 3 == str_len:
# The response ends with ``` -- most likely the end of JSON response string
response_cleaned = json_str[:idx]
elif idx + 3 < str_len:
# Looks like there are some more content beyond the last ```
# In the best case, it would be some additional plain-text response from the LLM
# and is unlikely to contain } or ] that are present in JSON
if '}' not in json_str[idx + 3:]: # the remainder of the text
response_cleaned = json_str[:idx]
except ValueError:
# No ``` found
pass
return response_cleaned
def _display_download_button(file_path: pathlib.Path):
"""
Display a download button to download a slide deck.
:param file_path: The path of the .pptx file.
"""
with open(file_path, 'rb') as download_file:
st.download_button(
'Download PPTX file ⬇️',
data=download_file,
file_name='Presentation.pptx',
key=datetime.datetime.now()
)
def main():
"""
Trigger application run.
"""
build_ui()
if __name__ == '__main__':
main()