math-exams-symvp-duo

Sleeping

App Files Files Community

joshuarauh committed on Feb 5

Commit

1a27daf

verified ·

1 Parent(s): 5fc9baf

Update app.py

Browse files

Files changed (1) hide show

app.py +146 -1

app.py CHANGED Viewed

@@ -24,6 +24,11 @@ anthropic = Anthropic(
     api_key=os.environ.get('ANTHROPIC_API_KEY')
 )
 # Request tracking
 MAX_REQUESTS_PER_DAY = 500
 request_history = deque(maxlen=1000)
@@ -509,6 +514,136 @@ The computation question MAY NOT:
     }
     return problem_type_additions.get(question_type, "")
 def generate_question(subject, difficulty, question_type, use_enhancement=False):
     """Generate a single math question with additional verification"""
     try:
@@ -552,7 +687,8 @@ def generate_question(subject, difficulty, question_type, use_enhancement=False)
         system_prompt = f"""You are an expert mathematics professor creating a {difficulty_params['description']} exam question.
 STRICT REQUIREMENTS:
 1. Write exactly 1 {question_type} question on {subject} covering {selected_topic} that can be solved analytically without numerical methods.
-   A question where any part of the solution must resort to numerical methdos is invalid.
 2. Difficulty Level Guidelines:
    {difficulty_params['description'].upper()}
    Follow these specific constraints:
@@ -570,6 +706,7 @@ STRICT REQUIREMENTS:
    - When writing questions involving currency expressed in dollars NEVER use the `$` symbol as it will be interepreted as math mode. ALWAYS write out the word dollars.
       * Example: 1000 dollars
 5. Include a detailed solution
    - If the question involves geometry make sure to identify any general geometric formulas that apply, For example:
         * Areas/volumes of common shapes and solids
         * Cross-sectional areas of geometric figures
@@ -676,6 +813,14 @@ j. **Concluding and Intuitive Explanations**
                     final_verification = perform_final_verification(revised_solution, sympy_correct)
                     response_text += "\n\nFinal Expert Verification:\n" + final_verification
         # Create LaTeX content
         questions_latex = create_latex_document(response_text, questions_only=True)
         full_latex = create_latex_document(response_text, questions_only=False)

     api_key=os.environ.get('ANTHROPIC_API_KEY')
 )
+openai.api_key = os.getenv("My_MathTest_key")
+if openai.api_key is None:
+    raise ValueError("OpenAI API key not found.")
 # Request tracking
 MAX_REQUESTS_PER_DAY = 500
 request_history = deque(maxlen=1000)
     }
     return problem_type_additions.get(question_type, "")
def get_solution_for_verification(response_text, sympy_correct, final_verification=None):
    """
    Build the "question + solution" text that is handed to the external grader.

    The question is always the span of ``response_text`` between the question
    marker ("Here is a test question") and the solution marker
    ("Here is a detailed solution to the test question"). The solution part is
    chosen as follows:

    * ``sympy_correct`` is truthy or ``None`` (no SymPy check was run): the
      original solution from ``response_text``, cut off before the first
      '```python' fence so the SymPy code is left out.
    * ``sympy_correct`` is falsy and ``final_verification`` is non-empty: the
      text after "Here is the complete verified solution:" in
      ``final_verification``, or all of ``final_verification`` when that
      marker is absent.
    * otherwise: the original solution from ``response_text``, untruncated.

    Args:
        response_text: Full generated text containing question and solution.
        sympy_correct: Result of the SymPy check; ``None`` is treated as correct.
        final_verification: Optional text of the final verification pass.

    Returns:
        ``"<question>\\n\\nSolution:\\n<solution>"``, or ``response_text.strip()``
        unchanged when the markers cannot be located.
    """
    question_start = "Here is a test question"
    solution_start = "Here is a detailed solution to the test question"
    verified_marker = "Here is the complete verified solution:"

    # Look for the solution marker only after the question marker, so an
    # out-of-order match cannot produce an empty question slice.
    q_start = response_text.find(question_start)
    q_end = -1 if q_start == -1 else response_text.find(solution_start, q_start)
    if q_start == -1 or q_end == -1:
        logger.error("Could not find question markers")
        return response_text.strip()

    question = response_text[q_start:q_end].strip()

    # Everything after the solution marker is the original solution. The
    # marker sentence normally ends with "." (or ":"), which is dropped here
    # so the solution does not start with stray punctuation.
    original_solution = response_text[q_end + len(solution_start):].lstrip(".:").strip()

    if sympy_correct is None or sympy_correct:
        # Original solution is trusted: keep it, minus the SymPy code block.
        code_start = original_solution.find('```python')
        if code_start != -1:
            solution = original_solution[:code_start].strip()
        else:
            solution = original_solution
    elif final_verification:
        # Prefer the explicitly marked verified solution when available.
        _, found, after_marker = final_verification.partition(verified_marker)
        solution = after_marker.strip() if found else final_verification.strip()
    else:
        # No final verification available: fall back to the original solution.
        solution = original_solution

    return f"{question}\n\nSolution:\n{solution}"
def verify_with_chatgpt(question_and_solution):
    """
    Ask the OpenAI chat model to verify and grade a question/solution pair.

    Args:
        question_and_solution: Text containing the question and its solution;
            it is embedded verbatim in the grading prompt.

    Returns:
        The content of the first choice in the chat completion, or a string
        starting with "Error in ChatGPT verification:" if anything raised
        (the failure is also logged).
    """
    try:
        # Grading rubric; the question/solution text is interpolated into it.
        prompt = f"""As an expert mathematician, please verify and grade this mathematics solution.
Analyze the following aspects:
1. Mathematical Correctness (50 points):
   - Are all calculations correct?
   - Are proofs logically sound?
   - Are all steps properly justified?
2. Completeness (20 points):
   - Are all necessary cases considered?
   - Are edge cases addressed?
   - Are all required steps shown?
3. Clarity and Presentation (20 points):
   - Is the solution well-organized?
   - Are steps clearly explained?
   - Is mathematical notation used correctly?
4. Mathematical Sophistication (10 points):
   - Is the approach elegant?
   - Are efficient methods used?
   - Is mathematical insight demonstrated?
Question and Solution to Verify:
{question_and_solution}
Please provide:
1. A brief point-by-point analysis of the solution
2. Specific comments on any errors or oversights
3. Suggestions for improvement (if any)
4. A numerical score out of 100 based on the criteria above
Format your response with clear headers and bullet points."""

        chat_messages = [
            {"role": "system", "content": "You are an expert mathematics professor grading student solutions."},
            {"role": "user", "content": prompt},
        ]
        completion = openai.ChatCompletion.create(
            model="gpt-4o",
            messages=chat_messages,
            temperature=0.3,
        )
        # Only the first choice's message text is used.
        return completion.choices[0].message.content
    except Exception as e:
        # Best-effort: report the failure as text instead of raising.
        failure = f"Error in ChatGPT verification: {str(e)}"
        logger.error(failure)
        return failure
def append_chatgpt_verification(initial_response, sympy_correct, final_verification=None):
    """
    Run the ChatGPT grading step and attach its output to the response.

    Args:
        initial_response: The generated response text to be graded.
        sympy_correct: SymPy check result, forwarded to
            ``get_solution_for_verification``.
        final_verification: Optional final verification text, forwarded to
            ``get_solution_for_verification``.

    Returns:
        ``initial_response`` followed by a "ChatGPT Verification and Grading:"
        section. If an exception is raised along the way it is logged and
        ``initial_response`` is returned with an error note appended instead.
    """
    try:
        # Select the question/solution text, then have it graded.
        text_to_grade = get_solution_for_verification(
            initial_response, sympy_correct, final_verification
        )
        grading = verify_with_chatgpt(text_to_grade)
        return f"{initial_response}\n\nChatGPT Verification and Grading:\n{grading}"
    except Exception as e:
        logger.error(f"Error in verification process: {str(e)}")
        error_note = f"\n\nError in ChatGPT verification: {str(e)}"
        return initial_response + error_note
 def generate_question(subject, difficulty, question_type, use_enhancement=False):
     """Generate a single math question with additional verification"""
     try:
         system_prompt = f"""You are an expert mathematics professor creating a {difficulty_params['description']} exam question.
 STRICT REQUIREMENTS:
 1. Write exactly 1 {question_type} question on {subject} covering {selected_topic} that can be solved analytically without numerical methods.
+   - A question where any part of the solution must resort to numerical methods is invalid.
+   - Begin the output with the text "Here is a test question that is a {question_type} question on {subject} covering {selected_topic}."
 2. Difficulty Level Guidelines:
    {difficulty_params['description'].upper()}
    Follow these specific constraints:
    - When writing questions involving currency expressed in dollars NEVER use the `$` symbol as it will be interepreted as math mode. ALWAYS write out the word dollars.
       * Example: 1000 dollars
 5. Include a detailed solution
+   - Begin the solution with "Here is a detailed solution to the test question."
    - If the question involves geometry make sure to identify any general geometric formulas that apply, For example:
         * Areas/volumes of common shapes and solids
         * Cross-sectional areas of geometric figures
                     final_verification = perform_final_verification(revised_solution, sympy_correct)
                     response_text += "\n\nFinal Expert Verification:\n" + final_verification
+        # add the ChatGPT verification
+        if sympy_output:
+            response_text = append_chatgpt_verification(
+                response_text,
+                sympy_correct,
+                final_verification if has_discrepancy else None
+            )
         # Create LaTeX content
         questions_latex = create_latex_document(response_text, questions_only=True)
         full_latex = create_latex_document(response_text, questions_only=False)