AutoPresent / app.py
para-lost's picture
fix bug
79a9bd7
raw
history blame
7.55 kB
import gradio as gr
import os
import openai
import subprocess
import base64
def encode_image(image_path):
with open(image_path, 'rb') as image_file:
return base64.b64encode(image_file.read()).decode('utf-8')
def extract_code_pieces(text: str, concat: bool = True) -> list[str]:
"""Extract code pieces from a text string.
Args:
text: str, model prediciton text.
Rets:
code_pieces: list[str], code pieces in the text.
"""
code_pieces = []
while "```python" in text:
st_idx = text.index("```python") + 10
# end_idx = text.index("```", st_idx)
if "```" in text[st_idx:]:
end_idx = text.index("```", st_idx)
else:
end_idx = len(text)
code_pieces.append(text[st_idx:end_idx].strip())
text = text[end_idx+3:].strip()
if concat: return '\n\n'.join(code_pieces)
return code_pieces
SYSTEM_MESSAGE = """* You are an expert presentation slides designer who creates modern, fashionable, and stylish slides using Python code. Your job is to generate the required PPTX slide by writing and executing a Python script. Make sure to follow the guidelines below and do not skip any of them:
1. Ensure your code can successfully execute. If needed, you can also write tests to verify your code.
2. Maintain proper spacing and arrangements of elements in the slide: make sure to keep sufficient spacing between different elements; do not make elements overlap or overflow to the slide page.
3. Carefully select the colors of text, shapes, and backgrounds, to ensure all contents are readable.
4. The slides should not look empty or incomplete. When filling the content in the slides, maintain good design and layout."""
# INSTRUCTION = """Follow the instruction below to create the slide.
# If the instruction is long and specific, follow the instruction carefully and add all elements as required;
# if it is short and concise, you will need to create some content (text, image, layout) and implement it into the slide.
# {}
# Finally, your code should save the pptx file to path "{}"."""
with open('agent_no_image_new_lib.prompt', 'r') as f:
INSTRUCTION = f.read()
import glob
import time
def list_files_in_directory(directory):
"""Lists all files in the given directory."""
return set(glob.glob(os.path.join(directory, "*")))
def cleanup_temp_files(temp_files):
"""Deletes a list of temporary files if they exist."""
for temp_file in temp_files:
try:
if os.path.exists(temp_file):
os.remove(temp_file)
print(f"Deleted temporary file: {temp_file}")
except Exception as e:
print(f"Failed to delete {temp_file}: {e}")
def create_pptx(api_key, instruction, model_name="gpt-4o", max_tokens=4096):
try:
# Set OpenAI API key
openai.api_key = api_key
# Create OpenAI client
client = openai.OpenAI(api_key=api_key)
# Prepare messages for the chat completion
messages = [{"role": "system", "content": SYSTEM_MESSAGE}]
pptx_path = "output.pptx"
instruction_message = INSTRUCTION.replace("INSERT_INSTRUCTION_HERE", instruction)
messages.append({"role": "user", "content": instruction_message})
# Capture the directory state before execution
working_directory = os.getcwd()
files_before = list_files_in_directory(working_directory)
# Retry up to 3 times
for attempt in range(3):
try:
# Call OpenAI's GPT model
response = client.chat.completions.create(
model=model_name,
messages=messages,
max_tokens=max_tokens,
n=1,
)
generated_code = extract_code_pieces(response.choices[0].message.content, concat=True)
generated_code = generated_code.replace("from library import", "from SlidesLib import")
generated_code = generated_code.replace("generate_image(", f"generate_image({repr(api_key)},")
generated_code = "from SlidesLib import *\n\n" + generated_code
# Save the generated code
code_file = "generated_slide_code.py"
with open(code_file, "w") as f:
f.write(generated_code)
# Execute the generated code
result = subprocess.run(["python", code_file], capture_output=True, text=True, check=True)
print(result.stdout)
# Capture the directory state after execution
files_after = list_files_in_directory(working_directory)
temp_files = files_after - files_before # Identify newly created files
# Convert the pptx to jpg for preview
# preview_image = "image_previews/output.jpg"
# command = [
# "libreoffice",
# "--headless",
# "--convert-to", "jpg",
# "--outdir", "image_previews",
# pptx_path
# ]
# subprocess.run(command)
# temp_files.add(preview_image)
# If successful, return the result
return "Slide generated successfully! Download your slide below.", pptx_path
# , preview_image
except subprocess.CalledProcessError as e:
print(f"Attempt {attempt + 1} failed: {e.stderr}")
# Fallback: Use default code if all attempts fail
print("All 3 attempts failed. Running default code.")
default_code = f"""
from pptx import Presentation
ppt = Presentation()
slide = ppt.slides.add_slide(ppt.slide_layouts[5])
title = slide.shapes.title
title.text = "Insert Title Here"
content = slide.placeholders[0]
content.text = "{instruction}"
ppt.save("output.pptx")
"""
code_file = "default_slide_code.py"
with open(code_file, "w") as f:
f.write(default_code)
# Execute the default code
subprocess.run(["python", code_file], capture_output=True, text=True, check=True)
# Convert the pptx to jpg for preview
# preview_image = "image_previews/output.jpg"
# command = [
# "libreoffice",
# "--headless",
# "--convert-to", "jpg",
# "--outdir", "image_previews",
# pptx_path
# ]
# subprocess.run(command)
return "Default slide generated after 3 attempts failed.", pptx_path
except Exception as e:
return f"An error occurred: {str(e)}", None
finally:
# Cleanup temporary files
files_before.add("output.pptx")
temp_files = list_files_in_directory(working_directory) - files_before
cleanup_temp_files(temp_files)
# Create a Gradio interface
def gradio_demo(api_key, instruction):
status, pptx_path = create_pptx(api_key, instruction)
return status, pptx_path
iface = gr.Interface(
fn=gradio_demo,
inputs=[
gr.Textbox(label="OpenAI API Key", type="password"),
gr.Textbox(label="Instruction", placeholder="Enter your slide instruction here...")
],
outputs=[
gr.Textbox(label="Status"),
gr.File(label="Download Slide"),
# gr.Image(label="Slide Preview", type="filepath")
],
title="AutoPresent",
description="Automatically Generate a presentation slide"
)
iface.launch()