math-exams-symvp-duo

Sleeping

App Files Community

joshuarauh committed on Jan 12

Commit

7983613

verified ·

1 Parent(s): fbc3848

Update app.py

Browse files

Files changed (1) hide show

app.py +50 -16

app.py CHANGED Viewed

@@ -605,7 +605,10 @@ def check_and_resolve_discrepancy(initial_response, sympy_output):
         If the two answers are inconsistent with each other then please:
         1. Identify which solution is correct
         2. Explain the error in the incorrect solution
-        3. Provide a revised complete solution that fixes any errors and does not refer to SymPy
 Original solution:
 {initial_response}
@@ -634,26 +637,58 @@ Please maintain the same LaTeX formatting as the original solution."""
             resolution_text += "\n\nNew SymPy Verification Results:\n```\n" + new_sympy_output + "\n```"
         # Determine if there was a discrepancy that required a revised solution
-        # First check if there's an inconsistency mentioned
-        has_discrepancy = "inconsistent" in resolution_text.lower() or "inconsistency" in resolution_text.lower()
-        # Look for the exact phrase we required in the prompt
         revised_solution = None
         if has_discrepancy:
-            marker = "Here is the revised complete solution:"
-            parts = resolution_text.split(marker, maxsplit=1)
-            if len(parts) > 1:
-                revised_solution = parts[1].strip()
             if not revised_solution:
-                # Fallback check for common revision phrases
-                revision_phrases = ["revised complete solution:", "revised solution:", "correct solution:", "corrected solution:"]
-                for phrase in revision_phrases:
-                    if phrase in resolution_text.lower():
-                        parts = resolution_text.split(phrase, maxsplit=1)
                         if len(parts) > 1:
                             revised_solution = parts[1].strip()
-                            break
         return resolution_text, has_discrepancy, revised_solution
@@ -712,8 +747,7 @@ Please ensure any corrected solution maintains proper LaTeX formatting with $ fo
     except Exception as e:
         logger.error(f"Error in final verification: {str(e)}")
         return f"Error in final verification: {str(e)}"
 # Create Gradio interface
 with gr.Blocks() as interface:
     gr.Markdown("# Advanced Mathematics Question Generator")

         If the two answers are inconsistent with each other then please:
         1. Identify which solution is correct
         2. Explain the error in the incorrect solution
+        3. Write "Here is the revised complete solution:" and then write out the ENTIRE solution from beginning
+           to end, including all parts that were correct and the corrections for any incorrect parts.
+           Do not refer to the original solution or say things like "the rest remains the same" - write
+           out everything in full.
 Original solution:
 {initial_response}
             resolution_text += "\n\nNew SymPy Verification Results:\n```\n" + new_sympy_output + "\n```"
         # Determine if there was a discrepancy that required a revised solution
+        # Check for any indication of inconsistency or error
+        inconsistency_phrases = [
+            "inconsistent", "inconsistency", "incorrect", "error", "wrong",
+            "differs", "different", "discrepancy", "mistaken", "mistake"
+        ]
+        has_discrepancy = any(phrase in resolution_text.lower() for phrase in inconsistency_phrases)
+        # Look for the required marker phrase and extract the solution after it
+        marker = "Here is the revised complete solution:"
         revised_solution = None
         if has_discrepancy:
+            # Split at the marker
+            if marker in resolution_text:
+                parts = resolution_text.split(marker, maxsplit=1)
+                if len(parts) > 1:
+                    revised_solution = parts[1].strip()
+                    # If the solution seems too short (might be partial), don't accept it
+                    if len(revised_solution) < 100:  # Rough minimum length for a complete solution
+                        revised_solution = None
+            # If we didn't find a complete solution, force a recheck
             if not revised_solution:
+                logger.debug("Initial solution extraction failed, requesting a complete solution")
+                # Make a new API call specifically requesting a complete solution
+                complete_solution_prompt = f"""The previous solution had inconsistencies. Please provide a complete solution
+                from beginning to end. Start your response with exactly this phrase:
+                "Here is the revised complete solution:"
+                Then write out the entire solution, including all parts both correct and corrected.
+                Do not refer to the original solution or say any parts remain the same.
+                Original problem and verification results:
+                {initial_response}
+                SymPy Results:
+                {sympy_output}"""
+                try:
+                    message = anthropic.messages.create(
+                        model="claude-3-5-sonnet-20241022",
+                        max_tokens=4096,
+                        temperature=0.2,
+                        messages=[{"role": "user", "content": complete_solution_prompt}]
+                    )
+                    new_response = message.content[0].text
+                    if marker in new_response:
+                        parts = new_response.split(marker, maxsplit=1)
                         if len(parts) > 1:
                             revised_solution = parts[1].strip()
+                except Exception as e:
+                    logger.error(f"Error in solution recheck: {str(e)}")
         return resolution_text, has_discrepancy, revised_solution
     except Exception as e:
         logger.error(f"Error in final verification: {str(e)}")
         return f"Error in final verification: {str(e)}"
 # Create Gradio interface
 with gr.Blocks() as interface:
     gr.Markdown("# Advanced Mathematics Question Generator")