Every-Text

Running

App Files Community

ginipick committed on Mar 18

Commit

e48aa5a

verified ·

1 Parent(s): f09c591

Update app.py

Browse files

Files changed (1) hide show

app.py +17 -11

app.py CHANGED Viewed

@@ -6,6 +6,7 @@ import uuid
 import base64
 import mimetypes
 import json
 import torch
 from safetensors.torch import load_file
@@ -19,6 +20,9 @@ from diffusers import FluxPipeline
 from google import genai
 from google.genai import types
 #######################################
 # 0. 환경설정
 #######################################
@@ -34,7 +38,7 @@ os.environ["HF_HOME"] = CACHE_PATH
 # (예시) Google GenAI 사용:
 # export GAPI_TOKEN="<YOUR_GOOGLE_GENAI_API_KEY>"
-# 작업 시간 측정을 위한 간단한 타이머 클래스
 class timer:
     def __init__(self, method_name="timed process"):
         self.method = method_name
@@ -164,7 +168,6 @@ def generate_initial_image(prompt, text, height, width, steps, scale, seed):
     prompt: 이미지 배경/장면/스타일 묘사를 위한 프롬프트
     text: 실제로 이미지에 들어가야 할 문구(예: "안녕하세요", "Hello world" 등)
     """
-    # Diffusion 모델에 "이미지 안에 텍스트를 표시하라"는 요청을 넣기 위해
     combined_prompt = f"{prompt} with clear readable text that says '{text}'"
     with torch.inference_mode(), torch.autocast("cuda", dtype=torch.bfloat16), timer("inference"):
@@ -186,29 +189,32 @@ def change_text_in_image(original_image, new_text):
     업로드된 이미지 내부의 문구를 `new_text`로 변경해주는 함수.
     """
     try:
-        # 임시 파일에 먼저 저장
         with tempfile.NamedTemporaryFile(suffix=".png", delete=False) as tmp:
             original_path = tmp.name
             original_image.save(original_path)
-        # Gemini 모델 호출
         image_path, text_response = generate_by_google_genai(
             text=f"Change the text in this image to: '{new_text}'",
             file_name=original_path
         )
-        # 결과가 이미지로 왔다면
         if image_path:
-            modified_img = gr.processing_utils.decode_base64_to_image(
-                base64.b64encode(open(image_path, "rb").read())
-            )
-            return modified_img, ""  # (결과 이미지, 빈 텍스트)
         else:
-            # 이미지가 없이 텍스트만 응답으로 온 경우
             return None, text_response
     except Exception as e:
-        # Gradio 에러 표시를 위해 gr.Error를 사용
         raise gr.Error(f"Error: {e}")

 import base64
 import mimetypes
 import json
+import io
 import torch
 from safetensors.torch import load_file
 from google import genai
 from google.genai import types
+# PIL 이미지 처리를 위해 추가
+from PIL import Image
 #######################################
 # 0. 환경설정
 #######################################
 # (예시) Google GenAI 사용:
 # export GAPI_TOKEN="<YOUR_GOOGLE_GENAI_API_KEY>"
+# 간단한 타이머 클래스
 class timer:
     def __init__(self, method_name="timed process"):
         self.method = method_name
     prompt: 이미지 배경/장면/스타일 묘사를 위한 프롬프트
     text: 실제로 이미지에 들어가야 할 문구(예: "안녕하세요", "Hello world" 등)
     """
     combined_prompt = f"{prompt} with clear readable text that says '{text}'"
     with torch.inference_mode(), torch.autocast("cuda", dtype=torch.bfloat16), timer("inference"):
     업로드된 이미지 내부의 문구를 `new_text`로 변경해주는 함수.
     """
     try:
+        # 이미지를 임시 파일로 저장
         with tempfile.NamedTemporaryFile(suffix=".png", delete=False) as tmp:
             original_path = tmp.name
             original_image.save(original_path)
+        # Gemini 모델 호출하여 텍스트 변경
         image_path, text_response = generate_by_google_genai(
             text=f"Change the text in this image to: '{new_text}'",
             file_name=original_path
         )
+        # 결과가 이미지로 반환된 경우
         if image_path:
+            # Gradio 구버전(4.26.0 이하)에는 decode_base64_to_image가 없으므로 PIL을 직접 사용
+            with open(image_path, "rb") as f:
+                image_data = f.read()
+            # base64를 거치지 않고, PIL Image로 디코딩
+            modified_img = Image.open(io.BytesIO(image_data))
+            return modified_img, ""
         else:
+            # 이미지 없이 텍스트만 응답으로 온 경우
             return None, text_response
     except Exception as e:
         raise gr.Error(f"Error: {e}")