Spaces:
Sleeping
Sleeping
Update main.py
Browse files
main.py
CHANGED
@@ -67,6 +67,17 @@ def receipt_radar_prompt(raw_text:str)->str:
|
|
67 |
travel_type(bus,train,airplane,taxi,bike,rickshaw classify in these categories only strictly),travel_company_name , departure_destination , arrival_destination , arrival_city(if you are not able to find the arrival city add the arrival destination into this field strictly. ), departure_date,arrival_date .If the arrival and departure dates are the same from receipt text given to you analyse it properly to check that, then only use the same date in both the fields .if you don't find any field mark it as null.
|
68 |
"""
|
69 |
hotel_data_points = """ hotel_type(hotel_stay , dine_in , dine_in + stay(use both keyword strictly)), hotel_brand_name , hotel_location , hotel_checkin_date , hotel_checkout_date. if you don't find any field mark it as null """
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
70 |
system_prompt = f"""Extract information from the following receipt OCR text and return a JSON object with these exact keys: brand, total_cost, location, purchase_category, brand_category, Date, currency, filename, payment_method, metadata.
|
71 |
Rules:
|
72 |
1. For total_cost, use the highest monetary value in the text.
|
@@ -75,11 +86,12 @@ def receipt_radar_prompt(raw_text:str)->str:
|
|
75 |
4. metadata: For insurance receipts extract the data points given in the JSON and return the JSON with structure: \n """ + insurance_response_structure + """
|
76 |
5.metadata : For travel receipts(flight ,bus,train) extract these data points as a JSON object exactly""" + travel_response_structure + """
|
77 |
6. metadata : For hotel receipts extract these data points as a JSON object exactly""" + hotel_data_points + f"""
|
|
|
78 |
For non-insurance and non-travel , non-hotel receipts, return metadata as null.
|
79 |
-
|
80 |
-
|
81 |
-
|
82 |
-
|
83 |
Ensure the strictly that output is a valid JSON object containing strictly the above keys, without any explanations.
|
84 |
Here's the OCR text below analyse it and convert into json using keys provided in first line and using the rules provided in rules section:
|
85 |
Generate a JSON response in the following format without using the ```json block. Ensure the output is properly formatted as plain text JSON.
|
|
|
67 |
travel_type(bus,train,airplane,taxi,bike,rickshaw classify in these categories only strictly),travel_company_name , departure_destination , arrival_destination , arrival_city(if you are not able to find the arrival city add the arrival destination into this field strictly. ), departure_date,arrival_date .If the arrival and departure dates are the same from receipt text given to you analyse it properly to check that, then only use the same date in both the fields .if you don't find any field mark it as null.
|
68 |
"""
|
69 |
hotel_data_points = """ hotel_type(hotel_stay , dine_in , dine_in + stay(use both keyword strictly)), hotel_brand_name , hotel_location , hotel_checkin_date , hotel_checkout_date. if you don't find any field mark it as null """
|
70 |
+
coupon_data_points = """
|
71 |
+
{
|
72 |
+
"brand_name": "Extract the brand_name from where the coupon is sent",
|
73 |
+
"validity": {
|
74 |
+
"start_date": "Date the coupon is valid from, if provided.other wise mark it as null",
|
75 |
+
"expiration_date": "Date the coupon expires. Leave blank if not mentioned."
|
76 |
+
},
|
77 |
+
"coupon_code": "Extract the unique code found in the email. If unavailable, leave it blank.",
|
78 |
+
"description": "Provide the discount details (amount/percentage), minimum purchase, eligible products, retailer, any terms or restrictions, usage limit (single-use/multi-use), and where the coupon applies (in-store/online)."
|
79 |
+
}
|
80 |
+
"""
|
81 |
system_prompt = f"""Extract information from the following receipt OCR text and return a JSON object with these exact keys: brand, total_cost, location, purchase_category, brand_category, Date, currency, filename, payment_method, metadata.
|
82 |
Rules:
|
83 |
1. For total_cost, use the highest monetary value in the text.
|
|
|
86 |
4. metadata: For insurance receipts extract the data points given in the JSON and return the JSON with structure: \n """ + insurance_response_structure + """
|
87 |
5.metadata : For travel receipts(flight ,bus,train) extract these data points as a JSON object exactly""" + travel_response_structure + """
|
88 |
6. metadata : For hotel receipts extract these data points as a JSON object exactly""" + hotel_data_points + f"""
|
89 |
+
7. metadata : For coupon receipts extract these data points as a JSON object exactly""" + coupon_data_points + f"""
|
90 |
For non-insurance and non-travel , non-hotel receipts, return metadata as null.
|
91 |
+
8. Use currency codes (e.g., USD, EUR) instead of symbols.
|
92 |
+
9. Generate filename as 'PURCHASE_TYPE_BRAND_DATE' (e.g., 'clothing_gucci_20230715').
|
93 |
+
10. If a value is not found, return null.
|
94 |
+
11. If all values are null, return null.
|
95 |
Ensure the strictly that output is a valid JSON object containing strictly the above keys, without any explanations.
|
96 |
Here's the OCR text below analyse it and convert into json using keys provided in first line and using the rules provided in rules section:
|
97 |
Generate a JSON response in the following format without using the ```json block. Ensure the output is properly formatted as plain text JSON.
|