Spaces:

sarim
/

ppt

Running

ppt

File size: 3,283 Bytes

5d14cc6
50d1ce2
4ba3023
ec1c0d9
 
 
 
 
d553fab
ec1c0d9
a8e9d4c
ec1c0d9
 
03b4c19
ec1c0d9
 
a8e9d4c
 
ec1c0d9
 
2afa0ec
c5224f2
 
2afa0ec
 
5d14cc6
d553fab
3745704
d553fab
5d14cc6
a8e9d4c
75fbe45
bd94ab4
c276872
5d14cc6
 
bd94ab4
599d94c
 
 
 
823af88
6eb7a8a
03b4c19
 
1ddd219
a8e9d4c
5d14cc6
c5224f2
 
 
c276872
50d1ce2
 
 
 
 
2afa0ec
03b4c19
d5a88b1
60e8e5d
d5a88b1
60e8e5d
5d14cc6
 
 
 
 
ec1c0d9
 
86551a1
ec1c0d9
 
4f86a6f
c5224f2
ec1c0d9
 
a91875b
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
a5f868b
ec1c0d9
 
4ba3023

import asyncio
from pydantic_ai.result import ResultData, RunResult
import streamlit as st
from pydantic_ai import Agent
from pydantic_ai.models.groq import GroqModel
import nest_asyncio
import pdfplumber
import os
import presentation as customClass


# API key handed to GroqModel below; read from the API_KEY environment
# variable (os.getenv returns None when the variable is unset).
api_key = os.getenv("API_KEY")
# Module-level buffer of extracted page text: extract_data() appends to it
# and main() passes it on to ai_ppt().
data = []
# NOTE(review): not referenced anywhere else in the visible code — confirm
# whether this is still needed.
last_message = ''




# Shared model instance used by the Agent built in ppt_content().
model = GroqModel('llama-3.1-70b-versatile', api_key = api_key)

def split_long_string(long_string, chunk_size=6000):
    """Join the input into one string and cut it into fixed-size chunks.

    Args:
        long_string: Either a single string or an iterable of strings
            (for example one entry per PDF page). ``None`` entries in an
            iterable are skipped instead of raising ``TypeError``.
        chunk_size: Maximum number of characters per chunk; must be >= 1.

    Returns:
        A list of consecutive substrings of the joined text. Every chunk is
        ``chunk_size`` characters long except possibly the last one. Empty
        input yields an empty list.

    Raises:
        ValueError: If ``chunk_size`` is smaller than 1. A zero step would
            make ``range`` fail and a negative one would silently drop all
            of the text.
    """
    if chunk_size < 1:
        raise ValueError(
            f"chunk_size must be a positive integer, got {chunk_size!r}"
        )

    if isinstance(long_string, str):
        # Already one string; joining it character by character is wasted work.
        string_data = long_string
    else:
        string_data = "".join(
            part for part in long_string if part is not None
        )

    return [
        string_data[start:start + chunk_size]
        for start in range(0, len(string_data), chunk_size)
    ]


async def ppt_content(data):
    """Ask the LLM agent for structured slide content based on the PDF text.

    Builds an ``Agent`` on the module-level ``model`` whose system prompt
    holds the slide-writing instructions followed by the complete PDF text,
    runs it once, prints the structured result and returns it.

    Args:
        data: Iterable of page texts (``main`` passes the module-level
            ``data`` list filled by ``extract_data``). Entries that are
            ``None`` or empty contribute no text.

    Returns:
        The ``data`` attribute of the agent run result; the agent is
        configured with ``result_type=customClass.PPT``.
    """
    # A page without extractable text may be stored as None; a plain
    # "".join(data) would raise TypeError on such an entry.
    pdf_text = "".join(page or "" for page in data)

    # NOTE(review): the prompt wording contains typos (e.g. "sliders",
    # "perssentation"). The strings are kept as they were because they are
    # runtime text sent to the model; only the missing comma after
    # "Each slide should have 4 parts :" is fixed, so that entry is no longer
    # silently concatenated with the following one.
    agent = Agent(
        model,
        result_type=customClass.PPT,
        system_prompt=(
            "You are an expert in making power-point perssentation",
            "Create 6 sliders",
            "Title Slide: short into about the presentation",
            "Methodology Slide: Summarize the methodology in detail",
            "Results Slide: Present key findings in detail in simple text and bullet points.",
            "Discussion Slide: Summarize the implications and limitations.",
            "Conclusion Slide: State the overall conclusion.",
            "Reference Slide: Include all citations used.",
            "Each slide should be seperate",
            "Each slide should have 4 parts :",
            "1. Title : title of the slide ",
            "2. Text: he detailed description or narrative content of the slide. This should include key information, explanations, or supporting arguments. Keep it concise yet informative to avoid overwhelming the audience.",
            "3. Bullet point: A list of bullet points summarizing key information on the slide. Each bullet point should be detail, long, and highlight a specific aspect of the slide's topic. ideally, limit to 3-5 points.",
            "4. Image Suggestion: A prompt for generating an image to complement the slide content. Describe the desired visual in detail, including elements, style, and relevance to the topic. Ensure the prompt is actionable for AI tools.",
            "Below is the text extracted from pdf",
            pdf_text,
        ),
    )

    # Debug output only: the chunks are printed but not sent to the model.
    # TODO: feed the chunks to the agent one by one (carrying the message
    # history forward) if the full text does not fit into a single prompt.
    for i, chunk in enumerate(split_long_string(pdf_text), 1):
        print(f"Chunk {i}:\n{chunk}\n")

    # Await the async API instead of calling the blocking run_sync() from
    # inside a coroutine, which needs a re-entrant event loop to work.
    result_1 = await agent.run(
        user_prompt="Create content for presentation and pdf extracted text is in 'system_prompt'"
    )

    print(result_1.data)
    return result_1.data
    

def ai_ppt(data):
    """Synchronous wrapper that runs ``ppt_content`` to completion.

    Args:
        data: Extracted page texts, forwarded unchanged to ``ppt_content``.
    """
    content_job = ppt_content(data=data)
    asyncio.run(content_job)


def extract_data(feed):
    """Append the text of every page of a PDF to the module-level ``data`` list.

    Args:
        feed: Whatever ``pdfplumber.open`` accepts; ``main`` passes the file
            object returned by the Streamlit uploader.

    Returns:
        None. The page texts are appended to the global ``data`` list, so
        repeated calls in the same process accumulate pages.
    """
    with pdfplumber.open(feed) as pdf:
        # extract_text() can yield None for a page without extractable text
        # (behaviour depends on the pdfplumber version). Store "" instead so
        # that later "".join(data) calls cannot fail with TypeError.
        data.extend(page.extract_text() or "" for page in pdf.pages)
    # Debug output of everything collected so far.
    print(data)
    return None



# if data is not None:
#     st.caption(data)
#     ai_ppt(data=data)

def main():
    """Render the Streamlit page: PDF upload plus a button that starts generation.

    When a file is uploaded its page text is extracted into the module-level
    ``data`` list. Pressing "Search" passes that list to ``ai_ppt``; if
    nothing has been extracted, a warning is shown instead of sending an
    empty document to the model.
    """
    uploaded_file = st.file_uploader('Choose your .pdf file', type="pdf")
    if uploaded_file is not None:
        extract_data(uploaded_file)

    if st.button("Search"):
        if not data:
            # No upload yet (or the PDF had no pages): nothing to summarise.
            st.warning("Please upload a PDF file before searching.")
            return
        ai_ppt(data)

if __name__ == '__main__':
    # asyncio is already imported at the top of the file, so it is not
    # imported again here.
    # nest_asyncio patches asyncio so an event loop can be re-entered, e.g.
    # when a synchronous "run" helper is called while a loop is already
    # running.
    nest_asyncio.apply()
    main()