import pathlib import logging import tempfile from typing import List, Tuple import json5 import metaphor_python as metaphor import streamlit as st import llm_helper import pptx_helper from global_config import GlobalConfig APP_TEXT = json5.loads(open(GlobalConfig.APP_STRINGS_FILE, 'r', encoding='utf-8').read()) GB_CONVERTER = 2 ** 30 logging.basicConfig( level=GlobalConfig.LOG_LEVEL, format='%(asctime)s - %(message)s', ) @st.cache_data def get_contents_wrapper(text: str) -> str: """ Fetch and cache the slide deck contents on a topic by calling an external API. :param text: The presentation topic :return: The slide deck contents or outline in JSON format """ logging.info('LLM call because of cache miss...') return llm_helper.generate_slides_content(text).strip() @st.cache_resource def get_metaphor_client_wrapper() -> metaphor.Metaphor: """ Create a Metaphor client for semantic Web search. :return: Metaphor instance """ return metaphor.Metaphor(api_key=GlobalConfig.METAPHOR_API_KEY) @st.cache_data def get_web_search_results_wrapper(text: str) -> List[Tuple[str, str]]: """ Fetch and cache the Web search results on a given topic. :param text: The topic :return: A list of (title, link) tuples """ results = [] search_results = get_metaphor_client_wrapper().search( text, use_autoprompt=True, num_results=5 ) for a_result in search_results.results: results.append((a_result.title, a_result.url)) return results # def get_disk_used_percentage() -> float: # """ # Compute the disk usage. # # :return: Percentage of the disk space currently used # """ # # total, used, free = shutil.disk_usage(__file__) # total = total // GB_CONVERTER # used = used // GB_CONVERTER # free = free // GB_CONVERTER # used_perc = 100.0 * used / total # # logging.debug(f'Total: {total} GB\n' # f'Used: {used} GB\n' # f'Free: {free} GB') # # logging.debug('\n'.join(os.listdir())) # # return used_perc def build_ui(): """ Display the input elements for content generation. Only covers the first step. """ # get_disk_used_percentage() st.title(APP_TEXT['app_name']) st.subheader(APP_TEXT['caption']) st.markdown( 'Powered by' ' [Mistral-7B-Instruct-v0.2](https://huggingface.co/mistralai/Mistral-7B-Instruct-v0.2).' ) st.markdown( '*If the JSON is generated or parsed incorrectly, try again later by making minor changes' ' to the input text.*' ) with st.form('my_form'): # Topic input try: with open(GlobalConfig.PRELOAD_DATA_FILE, 'r', encoding='utf-8') as in_file: preload_data = json5.loads(in_file.read()) except (FileExistsError, FileNotFoundError): preload_data = {'topic': '', 'audience': ''} topic = st.text_area( APP_TEXT['input_labels'][0], value=preload_data['topic'] ) texts = list(GlobalConfig.PPTX_TEMPLATE_FILES.keys()) captions = [GlobalConfig.PPTX_TEMPLATE_FILES[x]['caption'] for x in texts] pptx_template = st.radio( 'Select a presentation template:', texts, captions=captions, horizontal=True ) st.divider() submit = st.form_submit_button('Generate slide deck') if submit: # st.write(f'Clicked {time.time()}') st.session_state.submitted = True # https://github.com/streamlit/streamlit/issues/3832#issuecomment-1138994421 if 'submitted' in st.session_state: progress_text = 'Generating the slides...give it a moment' progress_bar = st.progress(0, text=progress_text) topic_txt = topic.strip() generate_presentation(topic_txt, pptx_template, progress_bar) st.divider() st.text(APP_TEXT['tos']) st.text(APP_TEXT['tos2']) st.markdown( '![Visitors]' '(https://api.visitorbadge.io/api/visitors?path=https%3A%2F%2Fhuggingface.co%2Fspaces%2Fbarunsaha%2Fslide-deck-ai&countColor=%23263759)' ) def generate_presentation(topic: str, pptx_template: str, progress_bar): """ Process the inputs to generate the slides. :param topic: The presentation topic based on which contents are to be generated :param pptx_template: The PowerPoint template name to be used :param progress_bar: Progress bar from the page :return: """ topic_length = len(topic) logging.debug('Input length:: topic: %s', topic_length) if topic_length >= 10: logging.debug('Topic: %s', topic) target_length = min(topic_length, GlobalConfig.LLM_MODEL_MAX_INPUT_LENGTH) try: # Step 1: Generate the contents in JSON format using an LLM json_str = process_slides_contents(topic[:target_length], progress_bar) logging.debug('Truncated topic: %s', topic[:target_length]) logging.debug('Length of JSON: %d', len(json_str)) # Step 2: Generate the slide deck based on the template specified if len(json_str) > 0: st.info( 'Tip: The generated content doesn\'t look so great?' ' Need alternatives? Just change your description text and try again.', icon="💡️" ) else: st.error( 'Unfortunately, JSON generation failed, so the next steps would lead' ' to nowhere. Try again or come back later.' ) return all_headers = generate_slide_deck(json_str, pptx_template, progress_bar) # Step 3: Bonus stuff: Web references and AI art show_bonus_stuff(all_headers) except ValueError as ve: st.error(f'Unfortunately, an error occurred: {ve}! ' f'Please change the text, try again later, or report it, sharing your inputs.') else: st.error('Not enough information provided! Please be little more descriptive :)') def process_slides_contents(text: str, progress_bar: st.progress) -> str: """ Convert given text into structured data and display. Update the UI. :param text: The topic description for the presentation :param progress_bar: Progress bar for this step :return: The contents as a JSON-formatted string """ json_str = '' try: logging.info('Calling LLM for content generation on the topic: %s', text) json_str = get_contents_wrapper(text) except Exception as ex: st.error( f'An exception occurred while trying to convert to JSON. It could be because of heavy' f' traffic or something else. Try doing it again or try again later.' f'\nError message: {ex}' ) progress_bar.progress(50, text='Contents generated') with st.expander('The generated contents (in JSON format)'): st.code(json_str, language='json') return json_str def generate_slide_deck(json_str: str, pptx_template: str, progress_bar) -> List: """ Create a slide deck. :param json_str: The contents in JSON format :param pptx_template: The PPTX template name :param progress_bar: Progress bar :return: A list of all slide headers and the title """ progress_text = 'Creating the slide deck...give it a moment' progress_bar.progress(75, text=progress_text) # # Get a unique name for the file to save -- use the session ID # ctx = st_sr.get_script_run_ctx() # session_id = ctx.session_id # timestamp = time.time() # output_file_name = f'{session_id}_{timestamp}.pptx' temp = tempfile.NamedTemporaryFile(delete=False, suffix='.pptx') path = pathlib.Path(temp.name) logging.info('Creating PPTX file...') all_headers = pptx_helper.generate_powerpoint_presentation( json_str, as_yaml=False, slides_template=pptx_template, output_file_path=path ) progress_bar.progress(100, text='Done!') with open(path, 'rb') as f: st.download_button('Download PPTX file', f, file_name='Presentation.pptx') return all_headers def show_bonus_stuff(ppt_headers: List[str]): """ Show bonus stuff for the presentation. :param ppt_headers: A list of the slide headings. """ # Use the presentation title and the slide headers to find relevant info online logging.info('Calling Metaphor search...') ppt_text = ' '.join(ppt_headers) search_results = get_web_search_results_wrapper(ppt_text) md_text_items = [] for (title, link) in search_results: md_text_items.append(f'[{title}]({link})') with st.expander('Related Web references'): st.markdown('\n\n'.join(md_text_items)) logging.info('Done!') # # Avoid image generation. It costs time and an API call, so just limit to the text generation. # with st.expander('AI-generated image on the presentation topic'): # logging.info('Calling SDXL for image generation...') # # img_empty.write('') # # img_text.write(APP_TEXT['image_info']) # image = get_ai_image_wrapper(ppt_text) # # if len(image) > 0: # image = base64.b64decode(image) # st.image(image, caption=ppt_text) # st.info('Tip: Right-click on the image to save it.', icon="💡️") # logging.info('Image added') def main(): """ Trigger application run. """ build_ui() if __name__ == '__main__': main()