jutor_write

Sleeping

App Files Community

youngtsai committed 18 days ago

Commit

979dcbd

1 Parent(s): fed0398

def extract_text_from_image(image_input):

Browse files

Files changed (1) hide show

app.py +28 -9

app.py CHANGED Viewed

@@ -23,6 +23,9 @@ from google import genai
 from google.genai import types
 import base64
 import io
 # From other files
 from storage_service import GoogleCloudStorage
@@ -2282,19 +2285,35 @@ def download_content(content):
     return word_path
 # OCR
-def extract_text_from_image(image):
-    """從上傳的圖片中提取文字"""
-    # 檢查是否有圖片
-    if image is None:
-        return ""
-    # 將圖片轉換為 base64 編碼
     buffered = io.BytesIO()
     image.save(buffered, format="JPEG")
     img_str = base64.b64encode(buffered.getvalue()).decode()
-    # 準備圖片輸入
     image_part = types.Part.from_bytes(
         data=base64.b64decode(img_str),
         mime_type="image/jpeg",

 from google.genai import types
 import base64
 import io
+from PIL import Image
+import requests
 # From other files
 from storage_service import GoogleCloudStorage
     return word_path
 # OCR
+def extract_text_from_image(image_input):
+    """從上傳的圖片中提取文字，支援：路徑、網址、base64 字串、PIL 圖片"""
+    # 🔍 判斷輸入來源
+    if isinstance(image_input, Image.Image):
+        image = image_input
+    elif isinstance(image_input, str):
+        if image_input.startswith("http"):
+            # 網路圖片
+            response = requests.get(image_input)
+            image = Image.open(io.BytesIO(response.content)).convert("RGB")
+        elif image_input.startswith("data:image"):
+            # base64 with header
+            base64_data = image_input.split(",", 1)[1]
+            image = Image.open(io.BytesIO(base64.b64decode(base64_data))).convert("RGB")
+        elif os.path.exists(image_input):
+            # 本地圖片
+            image = Image.open(image_input).convert("RGB")
+        else:
+            # 純 base64 字串
+            image = Image.open(io.BytesIO(base64.b64decode(image_input))).convert("RGB")
+    else:
+        raise ValueError("❌ 不支援的 image 輸入格式")
+    # ✅ 圖片轉 base64
     buffered = io.BytesIO()
     image.save(buffered, format="JPEG")
     img_str = base64.b64encode(buffered.getvalue()).decode()
+    # 🧠 組成 image_part
     image_part = types.Part.from_bytes(
         data=base64.b64decode(img_str),
         mime_type="image/jpeg",