Spaces:

mashaelalbu
/

ocrsensitive

Sleeping

App Files Files Community

mashaelalbu committed on Apr 6

Commit

1d79ca2

verified ·

1 Parent(s): f726507

Update app/utils.py

Browse files

Files changed (1) hide show

app/utils.py +49 -70

app/utils.py CHANGED Viewed

@@ -1,4 +1,4 @@
-# utils.py
 import os
 import pandas as pd
 from transformers import AutoModel, AutoTokenizer
@@ -13,11 +13,6 @@ from flask import current_app
 import base64
 logger = logging.getLogger(__name__)
-FIXED_ALLERGENS = [
-    "dairy", "eggs", "peanuts", "soy",
-    "tree nuts", "wheat", "fish",
-    "shellfish", "sesame"
-]
 class OCRModel:
     _instance = None
@@ -150,6 +145,46 @@ class AllergyAnalyzer:
                 results.append(allergy)
         return results
     def analyze_image(self, image, user_allergens, claude_api_key=None):
         """تحليل الصورة مباشرة للكشف عن الحساسيات"""
         try:
@@ -175,19 +210,15 @@ class AllergyAnalyzer:
                         database_matches[allergy].append(token)
                 elif claude_api_key:
                     # إذا لم توجد في قاعدة البيانات، نستخدم Claude API
-                    claude_results = []
                     for allergy in user_allergens:
-                        if self.check_claude_allergens(token, allergy, claude_api_key, image):
-                            claude_results.append(allergy)
-                    if claude_results:
-                        for allergy in claude_results:
                             detected_allergens.add(allergy)
                             if allergy not in claude_matches:
                                 claude_matches[allergy] = []
                             claude_matches[allergy].append(token)
             return {
                 "detected_allergens": list(detected_allergens),
                 "database_matches": database_matches,
                 "claude_matches": claude_matches,
@@ -197,65 +228,13 @@ class AllergyAnalyzer:
         except Exception as e:
             logger.error(f"Error analyzing image: {str(e)}", exc_info=True)
             return {
                 "detected_allergens": [],
                 "database_matches": {},
                 "claude_matches": {},
-                "analyzed_tokens": [],
-                "error": str(e)
             }
-    def check_claude_allergens(self, token, allergy, api_key, image):
-        """Ask the Claude API whether an ingredient relates to an allergen.
-
-        Sends the product image together with a text prompt that names the
-        ingredient ``token`` and the allergen ``allergy``, and asks for a
-        bare 'Yes' or 'No' answer.
-
-        Args:
-            token: Ingredient text interpolated into the prompt.
-            allergy: Allergen name interpolated into the prompt.
-            api_key: Value sent in the ``x-api-key`` request header.
-            image: Object whose ``save(fp, format='JPEG')`` method is called
-                (presumably a PIL image; confirm against the caller).
-
-        Returns:
-            True only when the text of the first returned content item,
-            stripped and lower-cased, equals 'yes'. False for any other
-            reply, for a response without a ``content`` list, and for any
-            exception (which is logged).
-        """
-        try:
-            # Prepare the image for the request: serialize it to JPEG bytes in memory.
-            img_byte_arr = io.BytesIO()
-            image.save(img_byte_arr, format='JPEG')
-            img_byte_arr = img_byte_arr.getvalue()
-            prompt = f"""
-    Analyze if this product contains or is derived from {allergy}.
-    Focus on the ingredient: {token}.
-    Respond ONLY with 'Yes' or 'No'. No explanations.
-    """
-            url = "https://api.anthropic.com/v1/messages"
-            headers = {
-                "x-api-key": api_key,
-                "content-type": "application/json",
-                "anthropic-version": "2023-06-01"
-            }
-            # Single user message carrying the base64-encoded JPEG plus the text prompt.
-            data = {
-                "model": "claude-3-opus-20240229",
-                "messages": [
-                    {
-                        "role": "user",
-                        "content": [
-                            {
-                                "type": "image",
-                                "source": {
-                                    "type": "base64",
-                                    "media_type": "image/jpeg",
-                                    "data": base64.b64encode(img_byte_arr).decode('utf-8')
-                                }
-                            },
-                            {
-                                "type": "text",
-                                "text": prompt
-                            }
-                        ]
-                    }
-                ],
-                "max_tokens": 10
-            }
-            # NOTE(review): no timeout is passed and the HTTP status is not checked.
-            response = requests.post(url, json=data, headers=headers)
-            json_response = response.json()
-            if "content" in json_response and isinstance(json_response["content"], list):
-                # Exact match only: a reply such as "Yes." is treated as a negative.
-                return json_response["content"][0]["text"].strip().lower() == 'yes'
-            return False
-        except Exception as e:
-            # Any failure (image encoding, network, JSON shape) is logged and reported as "no match".
-            logger.error(f"Error querying Claude API: {str(e)}")
-            return False

+# utils.py (modified)
 import os
 import pandas as pd
 from transformers import AutoModel, AutoTokenizer
 import base64
 logger = logging.getLogger(__name__)
 class OCRModel:
     _instance = None
                 results.append(allergy)
         return results
+    def check_allergy_risk(self, ingredient, allergy_type, api_key, timeout=30):
+        """Ask the Claude API whether an ingredient is an allergy risk.
+
+        Args:
+            ingredient: Ingredient name to classify (interpolated into the prompt).
+            allergy_type: Allergen category to test against (interpolated into
+                the prompt).
+            api_key: Value sent in the ``x-api-key`` request header.
+            timeout: Seconds to wait for the HTTP request before giving up.
+                Without a timeout a stalled connection would block forever.
+
+        Returns:
+            True only when the model's reply is "yes" once surrounding
+            whitespace, quotes, asterisks and trailing punctuation are
+            removed. False for any other reply, for missing input, for an
+            unexpected response shape, and for any request failure (which is
+            logged).
+        """
+        # Nothing to classify, or no credentials: skip the network call entirely.
+        if not ingredient or not allergy_type or not api_key:
+            return False
+        prompt = f"""
+You are a professional food safety expert specializing in allergen classification and risk assessment. Your task is critical because allergic reactions to {allergy_type} can be severe or even life-threatening.
+Please analyze the ingredient '{ingredient}' and determine whether it contains or is derived from {allergy_type}, posing a potential allergy risk for individuals with {allergy_type} allergies.
+⚠️ *Important Guidelines:*
+- Base your answer strictly on scientific classification and allergen presence.
+- Do NOT rely solely on word similarity—consider actual ingredient composition.
+- If '{ingredient}' contains {allergy_type} proteins or poses a high cross-allergy risk, answer *'Yes'*.
+- If it is completely unrelated and safe for individuals with {allergy_type} allergies, answer *'No'*.
+🚨 *Final Answer:* Only respond with *'Yes'* or *'No'*. Do NOT provide explanations.
+"""
+        url = "https://api.anthropic.com/v1/messages"
+        headers = {
+            "x-api-key": api_key,
+            "content-type": "application/json",
+            "anthropic-version": "2023-06-01"
+        }
+        data = {
+            "model": "claude-3-opus-20240229",
+            "messages": [{"role": "user", "content": prompt}],
+            "max_tokens": 10
+        }
+        try:
+            response = requests.post(url, json=data, headers=headers, timeout=timeout)
+            # Surface HTTP errors (bad key, rate limit, ...) in the log instead of
+            # silently treating the error payload as a "No".
+            response.raise_for_status()
+            json_response = response.json()
+            content = json_response.get("content") if isinstance(json_response, dict) else None
+            if not isinstance(content, list) or not content:
+                return False
+            first_item = content[0]
+            answer = first_item.get("text", "") if isinstance(first_item, dict) else ""
+            if not isinstance(answer, str):
+                return False
+            # The prompt shows the answer as *'Yes'*, so the model may echo the
+            # asterisks/quotes or add a full stop; strip that decoration before
+            # comparing so a genuine "Yes" is never read as a negative.
+            normalized = answer.strip().strip("*'\".!").strip().lower()
+            return normalized == 'yes'
+        except Exception as e:
+            # Best-effort lookup: any failure is logged and reported as "no match".
+            logger.error(f"Error querying Claude API: {str(e)}")
+            return False
     def analyze_image(self, image, user_allergens, claude_api_key=None):
         """تحليل الصورة مباشرة للكشف عن الحساسيات"""
         try:
                         database_matches[allergy].append(token)
                 elif claude_api_key:
                     # إذا لم توجد في قاعدة البيانات، نستخدم Claude API
                     for allergy in user_allergens:
+                        if self.check_allergy_risk(token, allergy, claude_api_key):
                             detected_allergens.add(allergy)
                             if allergy not in claude_matches:
                                 claude_matches[allergy] = []
                             claude_matches[allergy].append(token)
             return {
+                "extracted_text": extracted_text,
                 "detected_allergens": list(detected_allergens),
                 "database_matches": database_matches,
                 "claude_matches": claude_matches,
         except Exception as e:
             logger.error(f"Error analyzing image: {str(e)}", exc_info=True)
             return {
+                "error": str(e),
                 "detected_allergens": [],
                 "database_matches": {},
                 "claude_matches": {},
+                "analyzed_tokens": []
             }
+    def get_allergen_list(self):
+        """Return the known allergens: the keys of ``self.allergy_dict`` as a new list."""
+        known_allergens = self.allergy_dict.keys()
+        return [*known_allergens]