import datetime import logging import pathlib import random import tempfile from typing import List import json5 import streamlit as st from langchain_community.chat_message_histories import ( StreamlitChatMessageHistory ) from langchain_core.prompts import ChatPromptTemplate from langchain_core.runnables.history import RunnableWithMessageHistory from global_config import GlobalConfig from helpers import llm_helper, pptx_helper APP_TEXT = json5.loads(open(GlobalConfig.APP_STRINGS_FILE, 'r', encoding='utf-8').read()) DOWNLOAD_FILE_KEY = 'download_file_name' # langchain.debug = True # langchain.verbose = True logger = logging.getLogger(__name__) progress_bar = st.progress(0, text='Setting up SlideDeck AI...') texts = list(GlobalConfig.PPTX_TEMPLATE_FILES.keys()) captions = [GlobalConfig.PPTX_TEMPLATE_FILES[x]['caption'] for x in texts] pptx_template = st.sidebar.radio( 'Select a presentation template:', texts, captions=captions, horizontal=True ) def display_page_header_content(): """ Display content in the page header. """ st.title(APP_TEXT['app_name']) st.subheader(APP_TEXT['caption']) st.markdown( 'Powered by' ' [Mistral-7B-Instruct-v0.2](https://huggingface.co/mistralai/Mistral-7B-Instruct-v0.2)' ) def display_page_footer_content(): """ Display content in the page footer. """ st.text(APP_TEXT['tos'] + '\n\n' + APP_TEXT['tos2']) # st.markdown( # '![Visitors](https://api.visitorbadge.io/api/visitors?path=https%3A%2F%2Fhuggingface.co%2Fspaces%2Fbarunsaha%2Fslide-deck-ai&countColor=%23263759)' # noqa: E501 # ) def build_ui(): """ Display the input elements for content generation. """ display_page_header_content() with st.expander('Usage Policies and Limitations'): display_page_footer_content() progress_bar.progress(50, text='Setting up chat interface...') set_up_chat_ui() def set_up_chat_ui(): """ Prepare the chat interface and related functionality. """ history = StreamlitChatMessageHistory(key='chat_messages') llm = llm_helper.get_hf_endpoint() with open(GlobalConfig.CHAT_TEMPLATE_FILE, 'r', encoding='utf-8') as in_file: template = in_file.read() prompt = ChatPromptTemplate.from_template(template) chain = prompt | llm chain_with_history = RunnableWithMessageHistory( chain, lambda session_id: history, # Always return the instance created earlier input_messages_key='question', history_messages_key='chat_history', ) with st.expander('Usage Instructions'): st.write(GlobalConfig.CHAT_USAGE_INSTRUCTIONS) st.chat_message('ai').write( random.choice(APP_TEXT['ai_greetings']) ) for msg in history.messages: # st.chat_message(msg.type).markdown(msg.content) st.chat_message(msg.type).code(msg.content, language='json') # The download button disappears on clicking (anywhere) because of app reload # So, display it again if DOWNLOAD_FILE_KEY in st.session_state: _display_download_button(st.session_state[DOWNLOAD_FILE_KEY]) progress_bar.progress(100, text='Done!') progress_bar.empty() if prompt := st.chat_input( placeholder=APP_TEXT['chat_placeholder'], max_chars=GlobalConfig.LLM_MODEL_MAX_INPUT_LENGTH ): logger.debug('User input: %s', prompt) st.chat_message('user').write(prompt) progress_bar_pptx = st.progress(0, 'Calling LLM...') # As usual, new messages are added to StreamlitChatMessageHistory when the Chain is called config = {'configurable': {'session_id': 'any'}} response: str = chain_with_history.invoke({'question': prompt}, config) st.chat_message('ai').markdown('```json\n' + response) # The content has been generated as JSON # There maybe trailing ``` at the end of the response -- remove them # To be careful: ``` may be part of the content as well when code is generated response_cleaned = _clean_json(response) progress_bar_pptx.progress(50, 'Analyzing response...') # Now create the PPT file progress_bar_pptx.progress(75, 'Creating the slide deck...give it a moment') generate_slide_deck(response_cleaned) progress_bar_pptx.progress(100, text='Done!') def generate_slide_deck(json_str: str): """ Create a slide deck. :param json_str: The content in *valid* JSON format. """ if DOWNLOAD_FILE_KEY in st.session_state: path = pathlib.Path(st.session_state[DOWNLOAD_FILE_KEY]) logger.debug('DOWNLOAD_FILE_KEY found in session') else: temp = tempfile.NamedTemporaryFile(delete=False, suffix='.pptx') path = pathlib.Path(temp.name) st.session_state[DOWNLOAD_FILE_KEY] = str(path) logger.debug('DOWNLOAD_FILE_KEY not found in session') logger.debug('Creating PPTX file: %s...', st.session_state[DOWNLOAD_FILE_KEY]) try: pptx_helper.generate_powerpoint_presentation( json_str, slides_template=pptx_template, output_file_path=path ) _display_download_button(path) except ValueError as ve: st.error(APP_TEXT['json_parsing_error']) logger.error('%s', APP_TEXT['json_parsing_error']) logger.error('Additional error info: %s', str(ve)) except Exception as ex: st.error(APP_TEXT['content_generation_error']) logger.error('Caught a generic exception: %s', str(ex)) def _clean_json(json_str: str) -> str: """ Attempt to clean a JSON response string from the LLM by removing the trailing ``` and any text beyond that. May not be always accurate. :param json_str: The input string in JSON format. :return: The "cleaned" JSON string. """ str_len = len(json_str) response_cleaned = json_str try: idx = json_str.rindex('```') logger.debug( 'Fixing JSON response: str_len: %d, idx of ```: %d', str_len, idx ) if idx + 3 == str_len: # The response ends with ``` -- most likely the end of JSON response string response_cleaned = json_str[:idx] elif idx + 3 < str_len: # Looks like there are some more content beyond the last ``` # In the best case, it would be some additional plain-text response from the LLM # and is unlikely to contain } or ] that are present in JSON if '}' not in json_str[idx + 3:]: # the remainder of the text response_cleaned = json_str[:idx] except ValueError: # No ``` found pass return response_cleaned def _display_download_button(file_path: pathlib.Path): """ Display a download button to download a slide deck. :param file_path: The path of the .pptx file. """ with open(file_path, 'rb') as download_file: st.download_button( 'Download PPTX file ⬇️', data=download_file, file_name='Presentation.pptx', key=datetime.datetime.now() ) def main(): """ Trigger application run. """ build_ui() if __name__ == '__main__': main()