Spaces:

Hammad712
/

Urdu-OCR-APP

Sleeping

App Files Files Community

Hammad712 committed on Mar 17

Commit

23c697b

verified ·

1 Parent(s): 96f5ea0

Rename app.py to main.py

Browse files

Files changed (2) hide show

app.py +0 -59
main.py +66 -0

app.py DELETED Viewed

@@ -1,59 +0,0 @@
-import streamlit as st
-import os
-import PIL.Image
-from pdf2image import convert_from_bytes
-from google import genai
-from google.genai import types
-# Retrieve the API key from the environment variable.
-API_KEY = os.getenv("API_KEY")
-if API_KEY is None:
-    st.error("API Key not found. Please set the API_KEY environment variable.")
-    st.stop()
-# Initialize the GenAI client.
-client = genai.Client(api_key=API_KEY)
-def extract_text_from_image(img):
-    """
-    Extracts text from a PIL image using the Google GenAI API.
-    """
-    response = client.models.generate_content(
-        model="gemini-2.0-flash",
-        contents=["Extract the text from the image. Do not write anything except the extracted content", img])
-    return response.text
-st.title("PDF/Image Text Extraction using Google GenAI")
-# File uploader (accepts PDF and common image formats).
-uploaded_file = st.file_uploader("Upload a PDF or image file", type=["pdf", "png", "jpg", "jpeg", "webp"])
-if uploaded_file is not None:
-    output_text = ""
-    st.write("**Uploaded File:**", uploaded_file.name)
-    # Process PDF files.
-    if uploaded_file.name.lower().endswith(".pdf"):
-        st.info("Processing PDF file...")
-        with st.spinner("Converting PDF pages to images..."):
-            images = convert_from_bytes(uploaded_file.read(), dpi=200)
-        for idx, img in enumerate(images, start=1):
-            with st.spinner(f"Extracting text from page {idx}..."):
-                page_text = extract_text_from_image(img)
-                output_text += f"### Page {idx}\n\n{page_text}\n\n"
-    else:
-        # Process image files.
-        st.info("Processing image file...")
-        with st.spinner("Extracting text from image..."):
-            img = PIL.Image.open(uploaded_file)
-            output_text += extract_text_from_image(img) + "\n\n"
-    st.success("Extraction complete!")
-    st.markdown("### Extracted Text:")
-    st.markdown(output_text)
-    # Provide a download button for the Markdown file.
-    md_bytes = output_text.encode("utf-8")
-    st.download_button(label="Download Markdown file", data=md_bytes, file_name="output.md", mime="text/markdown")

main.py ADDED Viewed

	@@ -0,0 +1,66 @@

+import os
+import io
+import tempfile
+import PIL.Image
+from fastapi import FastAPI, File, UploadFile, HTTPException
+from fastapi.responses import FileResponse
+from pdf2image import convert_from_bytes
+from google import genai
+from google.genai import types
+app = FastAPI(title="PDF/Image Text Extraction API")
+# Retrieve the API key from an environment variable.
+API_KEY = os.getenv("API_KEY")
+if not API_KEY:
+    raise ValueError("API_KEY environment variable is not set")
+# Initialize the GenAI client.
+client = genai.Client(api_key=API_KEY)
+def extract_text_from_image(img):
+    """
+    Extracts text from a PIL image using the Google GenAI API.
+    """
+    response = client.models.generate_content(
+        model="gemini-2.0-flash",
+        contents=["Extract the text from the image. Do not write anything except the extracted content", img]
+    )
+    return response.text
+@app.post("/upload", summary="Upload a PDF or image file", response_description="Returns a Markdown file with the extracted text")
+async def upload_file(file: UploadFile = File(...)):
+    if not file.filename:
+        raise HTTPException(status_code=400, detail="No file provided")
+    # Read file content.
+    file_contents = await file.read()
+    output_text = ""
+    if file.filename.lower().endswith(".pdf"):
+        try:
+            # Convert PDF bytes to images.
+            images = convert_from_bytes(file_contents, dpi=200)
+        except Exception as e:
+            raise HTTPException(status_code=500, detail=f"Error converting PDF: {str(e)}")
+        # Process each page.
+        for idx, img in enumerate(images, start=1):
+            page_text = extract_text_from_image(img)
+            output_text += f"### Page {idx}\n\n{page_text}\n\n"
+    else:
+        try:
+            # Process the file as an image.
+            img = PIL.Image.open(io.BytesIO(file_contents))
+        except Exception as e:
+            raise HTTPException(status_code=400, detail="Uploaded file is not a valid image")
+        output_text += extract_text_from_image(img) + "\n\n"
+    # Save the extracted text to a temporary Markdown file.
+    temp_md = tempfile.NamedTemporaryFile(delete=False, suffix=".md")
+    with open(temp_md.name, "w", encoding="utf-8") as md_file:
+        md_file.write(output_text)
+    # Return the file as a downloadable response.
+    return FileResponse(temp_md.name, filename="output.md", media_type="text/markdown")