testing-groq

Sleeping

App Files Files Community

khurrameycon committed on Dec 2, 2024

Commit

db40c74

verified ·

1 Parent(s): fddb1a0

prompt improved

Browse files

Files changed (1) hide show

app.py +70 -7

app.py CHANGED Viewed

@@ -214,7 +214,47 @@ PROMPT_SKILLS = (
 )
-PROMPT_IMAGE = (
     "You are a highly intelligent assistant designed to analyze images and extract structured information from them. "
     "Your task is to analyze the given image of a student's academic record and generate a response in the exact JSON format provided below. "
     "If any specific information is missing or unavailable in the image, replace the corresponding field with null. "
@@ -229,7 +269,23 @@ PROMPT_IMAGE = (
     '    "cumulative_gpa": "string",\n'
     '    "program": "string",\n'
     '    "status": "string"\n'
-    '  },\n'
     '  "courses": [\n'
     '    {\n'
     '      "transfer_institution": "string",\n'
@@ -246,14 +302,15 @@ PROMPT_IMAGE = (
     "  ]\n"
     "}\n\n"
     "Instructions:\n\n"
-    "1. Extract the student information and course details as displayed in the image.\n"
     "2. Use null for any missing or unavailable information.\n"
     "3. Format the extracted data exactly as shown above. Do not deviate from this structure.\n"
-    "4. Use accurate field names and ensure proper nesting of data (e.g., 'student' and 'courses' sections).\n"
-    "5. The values for numeric fields like credits_attempted, credits_earned, and quality_points should be numbers (not strings).\n"
 )
 @app.route("/", methods=["GET"])
 def home():
     """Handle GET requests to the root URL.

     Returns the result of ``jsonify`` applied to a single-key dict whose
     ``"message"`` value is a welcome string pointing callers at the
     ``/extract`` endpoint.
     """
     return jsonify({"message": "Welcome to the PDF Extraction API. Use the /extract endpoint to extract information."})
@@ -287,10 +344,16 @@ def extract_info():
             response_skills = ''
         if data["img_url"] is not None:
-            prompt_skills = f"{PROMPT_IMAGE}\n"
             img_url = data["img_url"]
             file_pref = data["file_pref"]
-            response_image = predict_image(img_url, prompt_skills, file_pref)
         else:
             response_image = ''

 )
+# PROMPT_IMAGE = (
+#     "You are a highly intelligent assistant designed to analyze images and extract structured information from them. "
+#     "Your task is to analyze the given image of a student's academic record and generate a response in the exact JSON format provided below. "
+#     "If any specific information is missing or unavailable in the image, replace the corresponding field with null. "
+#     "Ensure the format is consistent, strictly adhering to the structure shown below.\n\n"
+#     "Required JSON Format:\n\n"
+#     "{\n"
+#     '  "student": {\n'
+#     '    "name": "string",\n'
+#     '    "id": "string",\n'
+#     '    "dob": "string",\n'
+#     '    "original_start_date": "string",\n'
+#     '    "cumulative_gpa": "string",\n'
+#     '    "program": "string",\n'
+#     '    "status": "string"\n'
+#     '  },\n'
+#     '  "courses": [\n'
+#     '    {\n'
+#     '      "transfer_institution": "string",\n'
+#     '      "course_code": "string",\n'
+#     '      "course_name": "string",\n'
+#     '      "credits_attempted": number,\n'
+#     '      "credits_earned": number,\n'
+#     '      "grade": "string",\n'
+#     '      "quality_points": number,\n'
+#     '      "semester_code": "string",\n'
+#     '      "semester_dates": "string"\n'
+#     '    }\n'
+#     "    // Additional courses can be added here\n"
+#     "  ]\n"
+#     "}\n\n"
+#     "Instructions:\n\n"
+#     "1. Extract the student information and course details as displayed in the image.\n"
+#     "2. Use null for any missing or unavailable information.\n"
+#     "3. Format the extracted data exactly as shown above. Do not deviate from this structure.\n"
+#     "4. Use accurate field names and ensure proper nesting of data (e.g., 'student' and 'courses' sections).\n"
+#     "5. The values for numeric fields like credits_attempted, credits_earned, and quality_points should be numbers (not strings).\n"
+# )
+PROMPT_IMAGE_STUDENT = (
     "You are a highly intelligent assistant designed to analyze images and extract structured information from them. "
     "Your task is to analyze the given image of a student's academic record and generate a response in the exact JSON format provided below. "
     "If any specific information is missing or unavailable in the image, replace the corresponding field with null. "
     '    "cumulative_gpa": "string",\n'
     '    "program": "string",\n'
     '    "status": "string"\n'
+    '  }\n'
+    "}\n\n"
+    "Instructions:\n\n"
+    "1. Extract the student's general information as displayed in the image.\n"
+    "2. Use null for any missing or unavailable information.\n"
+    "3. Format the extracted data exactly as shown above. Do not deviate from this structure.\n"
+    "4. Ensure accurate field names and proper nesting.\n"
+    "5. Return only the 'student' section as JSON.\n"
+)
+PROMPT_IMAGE_COURSES = (
+    "You are a highly intelligent assistant designed to analyze images and extract structured information from them. "
+    "Your task is to analyze the given image of a student's academic record and generate a response in the exact JSON format provided below. "
+    "If any specific information is missing or unavailable in the image, replace the corresponding field with null. "
+    "Ensure the format is consistent, strictly adhering to the structure shown below.\n\n"
+    "Required JSON Format:\n\n"
+    "{\n"
     '  "courses": [\n'
     '    {\n'
     '      "transfer_institution": "string",\n'
     "  ]\n"
     "}\n\n"
     "Instructions:\n\n"
+    "1. Extract the course details as displayed in the image.\n"
     "2. Use null for any missing or unavailable information.\n"
     "3. Format the extracted data exactly as shown above. Do not deviate from this structure.\n"
+    "4. Ensure accurate field names and proper nesting.\n"
+    "5. Return only the 'courses' section as JSON.\n"
 )
 @app.route("/", methods=["GET"])
 def home():
     """Handle GET requests to the root URL.

     Returns the result of ``jsonify`` applied to a single-key dict whose
     ``"message"`` value is a welcome string pointing callers at the
     ``/extract`` endpoint.
     """
     return jsonify({"message": "Welcome to the PDF Extraction API. Use the /extract endpoint to extract information."})
             response_skills = ''
         if data["img_url"] is not None:
+            prompt_student = f"{PROMPT_IMAGE_STUDENT}\n"
+            prompt_courses = f"{PROMPT_IMAGE_COURSES}\n"
             img_url = data["img_url"]
             file_pref = data["file_pref"]
+            response_student = predict_image(img_url, prompt_student, file_pref)
+            response_courses = predict_image(img_url, prompt_courses, file_pref)
+            # response_image = response_student + response_courses
+            response_image = {"student": response_student.get("student", {}), "courses": response_courses.get("courses", [])}
         else:
             response_image = ''