import gradio as gr
from openai import OpenAI
import os
from PIL import Image
import base64
import io

# Initialize the OpenAI client with the API key (rewritten after the legacy usage raised an error)
api_key = os.getenv("OPENAI_API_KEY")
if api_key is None:
    raise ValueError("OPENAI_API_KEY ํ™˜๊ฒฝ ๋ณ€์ˆ˜๊ฐ€ ์„ค์ •๋˜์ง€ ์•Š์•˜์Šต๋‹ˆ๋‹ค.")
client = OpenAI(api_key=api_key)
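
# Example of providing the key before launch (shell, illustrative placeholder value):
#   export OPENAI_API_KEY=sk-...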


def image_to_base64(image):
    # JPEG cannot store an alpha channel, so normalize to RGB first
    # (PNG uploads may arrive as RGBA and would otherwise fail to save).
    image = image.convert("RGB")
    buffered = io.BytesIO()
    image.save(buffered, format="JPEG")
    img_str = base64.b64encode(buffered.getvalue()).decode()
    return img_str
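
# Illustrative use of the helper above (commented out so nothing runs at import
# time); "./sample1.png" is one of the bundled example images listed below:
#   img = Image.open("./sample1.png")
#   data_url = f"data:image/jpeg;base64,{image_to_base64(img)}"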

def extract_and_summarize(image):
    # Convert image to base64
    image_base64 = image_to_base64(image)
    
    # Build the chat messages. Earlier prompt iterations, kept for reference:
    # v1 (Korean draft): "Here is a document as an image. Look at it and summarize the contents
    #     in 3 lines. For documents that must be submitted, be sure to include the submission period and method."
    # v2: "Summarize the image document in 3 lines. If submission is needed, include the deadline, method, and link. Output in Korean."
    # v3 (current): "Summarize the image document in 3 lines. If submission details are included, add the deadline, method, and link. If there is no link, omit the link information. Output in Korean."

    prompt = [
        {
            "role": "system",
            "content": "You are a helpful assistant. Summarize the text content of the document image provided."
        },
        {
            "role": "user",
            "content": [
                {"type": "text", "text": "Summarize the image document in 3 lines. If submission details are included, add the deadline, method, and link. If there is no link, omit the link information. Output in Korean."},
                {"type": "image_url", "image_url": {"url": f"data:image/jpeg;base64,{image_base64}"}}
            ]
        }
    ]
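    # The "image_url" content part above follows the Chat Completions vision
    # input format; embedding a base64 data URL avoids hosting the image anywhere.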
    
    # Call the OpenAI Chat Completions API (gpt-4o-mini) for summarization
    response = client.chat.completions.create(
        model="gpt-4o-mini",
        messages=prompt,
        temperature=0.0,
        max_tokens=300,
    )
    
    # Extract the summary text from the model response
    summary = response.choices[0].message.content
    
    return summary
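
# Quick manual check of the summarizer without the UI (commented-out sketch;
# assumes the sample image exists next to this script and the API key is set):
#   print(extract_and_summarize(Image.open("./sample1.png")))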

# Sample document images offered as clickable examples in the UI
examples = ["./sample1.png", "./sample2.png", "./sample3.png"]


# Define the Gradio interface
iface = gr.Interface(
    fn=extract_and_summarize,
    inputs=gr.Image(type="pil", label="Upload Document Image"),
    outputs=gr.Textbox(label="Summarized Text"),
    title="๊ณต๋ฌธ์„œ ์š”์•ฝ ์ƒ์„ฑ๊ธฐ",  # "Official document summary generator"
    description="๋ฌธ์„œ์˜ ํ™”๋ฉด์„ ์บก์ฒ˜ํ•˜์—ฌ ์—…๋กœ๋“œํ•˜๋ฉด ์š”์•ฝํ•ด์ค๋‹ˆ๋‹ค.",  # "Capture and upload a document screen to get a summary."
    examples=examples
)

# Launch the interface
iface.launch()
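
# Note: launch() serves the app locally by default. For a temporary public URL
# (e.g., when testing outside a hosted Space), Gradio also accepts
# iface.launch(share=True).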