Spaces:
Running
Running
import datetime | |
import logging | |
import pathlib | |
import random | |
import tempfile | |
from typing import List | |
import json5 | |
import streamlit as st | |
from langchain_community.chat_message_histories import ( | |
StreamlitChatMessageHistory | |
) | |
from langchain_core.prompts import ChatPromptTemplate | |
from langchain_core.runnables.history import RunnableWithMessageHistory | |
from global_config import GlobalConfig | |
from helpers import llm_helper, pptx_helper | |
def _load_strings() -> dict: | |
""" | |
Load various strings to be displayed in the app. | |
:return: The dictionary of strings. | |
""" | |
with open(GlobalConfig.APP_STRINGS_FILE, 'r', encoding='utf-8') as in_file: | |
return json5.loads(in_file.read()) | |
APP_TEXT = _load_strings() | |
DOWNLOAD_FILE_KEY = 'download_file_name' | |
# langchain.debug = True | |
# langchain.verbose = True | |
logger = logging.getLogger(__name__) | |
progress_bar = st.progress(0, text='Setting up SlideDeck AI...') | |
texts = list(GlobalConfig.PPTX_TEMPLATE_FILES.keys()) | |
captions = [GlobalConfig.PPTX_TEMPLATE_FILES[x]['caption'] for x in texts] | |
pptx_template = st.sidebar.radio( | |
'Select a presentation template:', | |
texts, | |
captions=captions, | |
horizontal=True | |
) | |
def display_page_header_content(): | |
""" | |
Display content in the page header. | |
""" | |
st.title(APP_TEXT['app_name']) | |
st.subheader(APP_TEXT['caption']) | |
st.markdown( | |
'Powered by' | |
' [Mistral-7B-Instruct-v0.2](https://huggingface.co/mistralai/Mistral-7B-Instruct-v0.2)' | |
) | |
def display_page_footer_content(): | |
""" | |
Display content in the page footer. | |
""" | |
st.text(APP_TEXT['tos'] + '\n\n' + APP_TEXT['tos2']) | |
# st.markdown( | |
# '' # noqa: E501 | |
# ) | |
def build_ui(): | |
""" | |
Display the input elements for content generation. | |
""" | |
display_page_header_content() | |
with st.expander('Usage Policies and Limitations'): | |
display_page_footer_content() | |
progress_bar.progress(50, text='Setting up chat interface...') | |
set_up_chat_ui() | |
def set_up_chat_ui(): | |
""" | |
Prepare the chat interface and related functionality. | |
""" | |
history = StreamlitChatMessageHistory(key='chat_messages') | |
llm = llm_helper.get_hf_endpoint() | |
with open(GlobalConfig.CHAT_TEMPLATE_FILE, 'r', encoding='utf-8') as in_file: | |
template = in_file.read() | |
prompt = ChatPromptTemplate.from_template(template) | |
chain = prompt | llm | |
chain_with_history = RunnableWithMessageHistory( | |
chain, | |
lambda session_id: history, # Always return the instance created earlier | |
input_messages_key='question', | |
history_messages_key='chat_history', | |
) | |
with st.expander('Usage Instructions'): | |
st.write(GlobalConfig.CHAT_USAGE_INSTRUCTIONS) | |
st.chat_message('ai').write( | |
random.choice(APP_TEXT['ai_greetings']) | |
) | |
for msg in history.messages: | |
# st.chat_message(msg.type).markdown(msg.content) | |
st.chat_message(msg.type).code(msg.content, language='json') | |
# The download button disappears on clicking (anywhere) because of app reload | |
# So, display it again | |
if DOWNLOAD_FILE_KEY in st.session_state: | |
_display_download_button(st.session_state[DOWNLOAD_FILE_KEY]) | |
progress_bar.progress(100, text='Done!') | |
progress_bar.empty() | |
if prompt := st.chat_input( | |
placeholder=APP_TEXT['chat_placeholder'], | |
max_chars=GlobalConfig.LLM_MODEL_MAX_INPUT_LENGTH | |
): | |
logger.info('User input: %s', prompt) | |
st.chat_message('user').write(prompt) | |
progress_bar_pptx = st.progress(0, 'Calling LLM...') | |
# As usual, new messages are added to StreamlitChatMessageHistory when the Chain is called | |
config = {'configurable': {'session_id': 'any'}} | |
response: str = chain_with_history.invoke({'question': prompt}, config) | |
st.chat_message('ai').markdown('```json\n' + response) | |
# The content has been generated as JSON | |
# There maybe trailing ``` at the end of the response -- remove them | |
# To be careful: ``` may be part of the content as well when code is generated | |
response_cleaned = _clean_json(response) | |
progress_bar_pptx.progress(50, 'Analyzing response...') | |
# Now create the PPT file | |
progress_bar_pptx.progress(75, 'Creating the slide deck...give it a moment') | |
generate_slide_deck(response_cleaned) | |
progress_bar_pptx.progress(100, text='Done!') | |
def generate_slide_deck(json_str: str): | |
""" | |
Create a slide deck. | |
:param json_str: The content in *valid* JSON format. | |
""" | |
if DOWNLOAD_FILE_KEY in st.session_state: | |
path = pathlib.Path(st.session_state[DOWNLOAD_FILE_KEY]) | |
logger.debug('DOWNLOAD_FILE_KEY found in session') | |
else: | |
temp = tempfile.NamedTemporaryFile(delete=False, suffix='.pptx') | |
path = pathlib.Path(temp.name) | |
st.session_state[DOWNLOAD_FILE_KEY] = str(path) | |
logger.debug('DOWNLOAD_FILE_KEY not found in session') | |
logger.debug('Creating PPTX file: %s...', st.session_state[DOWNLOAD_FILE_KEY]) | |
try: | |
pptx_helper.generate_powerpoint_presentation( | |
json_str, | |
slides_template=pptx_template, | |
output_file_path=path | |
) | |
_display_download_button(path) | |
except ValueError as ve: | |
st.error(APP_TEXT['json_parsing_error']) | |
logger.error('%s', APP_TEXT['json_parsing_error']) | |
logger.error('Additional error info: %s', str(ve)) | |
except Exception as ex: | |
st.error(APP_TEXT['content_generation_error']) | |
logger.error('Caught a generic exception: %s', str(ex)) | |
def _clean_json(json_str: str) -> str: | |
""" | |
Attempt to clean a JSON response string from the LLM by removing the trailing ``` | |
and any text beyond that. May not be always accurate. | |
:param json_str: The input string in JSON format. | |
:return: The "cleaned" JSON string. | |
""" | |
str_len = len(json_str) | |
response_cleaned = json_str | |
try: | |
idx = json_str.rindex('```') | |
logger.debug( | |
'Fixing JSON response: str_len: %d, idx of ```: %d', | |
str_len, idx | |
) | |
if idx + 3 == str_len: | |
# The response ends with ``` -- most likely the end of JSON response string | |
response_cleaned = json_str[:idx] | |
elif idx + 3 < str_len: | |
# Looks like there are some more content beyond the last ``` | |
# In the best case, it would be some additional plain-text response from the LLM | |
# and is unlikely to contain } or ] that are present in JSON | |
if '}' not in json_str[idx + 3:]: # the remainder of the text | |
response_cleaned = json_str[:idx] | |
except ValueError: | |
# No ``` found | |
pass | |
return response_cleaned | |
def _display_download_button(file_path: pathlib.Path): | |
""" | |
Display a download button to download a slide deck. | |
:param file_path: The path of the .pptx file. | |
""" | |
with open(file_path, 'rb') as download_file: | |
st.download_button( | |
'Download PPTX file ⬇️', | |
data=download_file, | |
file_name='Presentation.pptx', | |
key=datetime.datetime.now() | |
) | |
def main(): | |
""" | |
Trigger application run. | |
""" | |
build_ui() | |
if __name__ == '__main__': | |
main() | |