Spaces:

quadranttechnologies
/

Receipt_Image_Analyzer

Sleeping

Dileep7729 committed on Jan 16

Commit

7e5af81

verified ·

1 Parent(s): 235c3b6

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -1,26 +1,40 @@
 import gradio as gr
 from transformers import AutoModelForSequenceClassification, AutoTokenizer
 # Load your fine-tuned model and tokenizer
 model_name = "quadranttechnologies/Receipt_Image_Analyzer"
 model = AutoModelForSequenceClassification.from_pretrained(model_name)
 tokenizer = AutoTokenizer.from_pretrained(model_name)
-# Define a prediction function
-def analyze_receipt(receipt_text):
-    inputs = tokenizer(receipt_text, return_tensors="pt", truncation=True, padding=True)
     outputs = model(**inputs)
     logits = outputs.logits
     predicted_class = logits.argmax(-1).item()
-    return f"Predicted Class: {predicted_class}"
 # Create a Gradio interface
 interface = gr.Interface(
     fn=analyze_receipt,
-    inputs="text",
-    outputs="text",
     title="Receipt Image Analyzer",
-    description="Analyze receipts for relevant information using a fine-tuned LLM model.",
 )
 # Launch the Gradio app

 import gradio as gr
 from transformers import AutoModelForSequenceClassification, AutoTokenizer
+from PIL import Image
+import pytesseract  # Install using `pip install pytesseract` and ensure Tesseract is installed
 # Load the fine-tuned sequence-classification model and its tokenizer once, at
 # module import, so analyze_receipt reuses them on every call.
 model_name = "quadranttechnologies/Receipt_Image_Analyzer"
 model = AutoModelForSequenceClassification.from_pretrained(model_name)
 tokenizer = AutoTokenizer.from_pretrained(model_name)
+# Define a function to preprocess the image and predict
+def analyze_receipt(image):
+    # Perform OCR to extract text from the image
+    extracted_text = pytesseract.image_to_string(image)
+    # Tokenize the extracted text
+    inputs = tokenizer(extracted_text, return_tensors="pt", truncation=True, padding=True)
+    # Get model predictions
     outputs = model(**inputs)
     logits = outputs.logits
     predicted_class = logits.argmax(-1).item()
+    # Optionally return extracted text and prediction as JSON
+    result = {
+        "extracted_text": extracted_text,
+        "predicted_class": predicted_class
+    }
+    return result
 # Create a Gradio interface
 interface = gr.Interface(
     fn=analyze_receipt,
+    inputs=gr.inputs.Image(type="pil"),  # Accept image input
+    outputs="json",  # Return JSON output
     title="Receipt Image Analyzer",
+    description="Upload a receipt image to analyze and classify its contents.",
 )
 # Launch the Gradio app