math-exams-symvp-duo

Running

App Files Files Community

joshuarauh committed on Nov 18, 2024

Commit

109daa0

verified ·

1 Parent(s): ef21c2f

Update app.py

Browse files

Files changed (1) hide show

app.py +48 -14

app.py CHANGED Viewed

@@ -1,15 +1,51 @@
-# app.py
 import os
 import gradio as gr
 from anthropic import Anthropic
 import wolframalpha
 from datetime import datetime, timedelta
 from collections import deque
 # Initialize clients
 anthropic = Anthropic(api_key=os.environ.get('ANTHROPIC_API_KEY'))
 wolfram_client = wolframalpha.Client(os.environ.get('WOLFRAM_APPID'))
 def verify_solution(problem, claimed_solution):
     """Verify a mathematical solution using Wolfram Alpha"""
     try:
@@ -37,9 +73,13 @@ def verify_solution(problem, claimed_solution):
 def compare_solutions(wolfram_sol, claude_sol):
     """Compare two solutions for mathematical equivalence"""
-    # This would need sophisticated parsing based on your problem types
-    # Basic example:
-    return abs(float(wolfram_sol) - float(claude_sol)) < 0.001
 def generate_test(subject):
     """Generate and verify a math test"""
@@ -49,7 +89,7 @@ def generate_test(subject):
         For each question:
         1. State the problem clearly
         2. Provide your step-by-step solution
-        3. Give the final answer in a format that can be verified
         Use simple $$ for all math expressions."""
         message = anthropic.messages.create(
@@ -68,8 +108,7 @@ def generate_test(subject):
         # Add verification results
         verification_results = []
-        # For each question/solution pair (you'll need to parse the content)
-        # Example structure:
         verification_note = "\n\n## Solution Verification:\n"
         for i, (problem, solution) in enumerate(parse_questions(content)):
             result = verify_solution(problem, solution)
@@ -80,6 +119,7 @@ def generate_test(subject):
                 verification_note += "⚠️ Solution needs verification\n"
                 if result['wolfram_solution']:
                     verification_note += f"Wolfram Alpha got: {result['wolfram_solution']}\n"
         # Add usage statistics
         usage_stats = f"""
@@ -98,13 +138,7 @@ def generate_test(subject):
     except Exception as e:
         return f"Error: {str(e)}"
-# Update requirements.txt to include:
-# wolframalpha==5.0.0
-# Update environment variables to include WOLFRAM_APPID
-# Rest of your Gradio interface code remains the same...
-# Subject choices
 subjects = [
     "Single Variable Calculus",
     "Multivariable Calculus",

 import os
 import gradio as gr
 from anthropic import Anthropic
 import wolframalpha
 from datetime import datetime, timedelta
 from collections import deque
+import re
 # Initialize clients
 anthropic = Anthropic(api_key=os.environ.get('ANTHROPIC_API_KEY'))
 wolfram_client = wolframalpha.Client(os.environ.get('WOLFRAM_APPID'))
def parse_questions(content):
    """Parse questions and their final numerical answers from Claude's output.

    The text is split on question markers of the form ``N)``. Each resulting
    chunk is divided at the first ``"Solution:"`` into a problem statement and
    a solution, and a final numeric answer is extracted from the solution.

    Args:
        content: The generated exam text. Empty or ``None`` yields ``[]``.

    Returns:
        A list of ``(problem, final_answer)`` tuples, one per chunk that
        contains ``"Solution:"``. ``final_answer`` is the matched number as a
        string, or ``"Not found"`` when no number could be extracted.
    """
    if not content:
        return []

    # A question marker must start a line (optionally after markdown
    # decoration such as "**" or "#"). Matching a bare r'\d+\)' anywhere would
    # also split on math like "f(2)" or "(x + 3)" inside a problem.
    question_marker = re.compile(
        r'^[ \t]*(?:[#*_>]+[ \t]*)?\d+\)', re.MULTILINE
    )
    number = r'([-+]?\d*\.?\d+)'
    # Preferred form: "Final answer = <number>", optionally wrapped in "$".
    labelled_answer = re.compile(
        r'final\s+answer\s*[:=]\s*\$*\s*' + number, re.IGNORECASE
    )
    # Fallback form: any "= <number>" appearing in the solution text.
    any_equation = re.compile(r'=\s*' + number)

    parts = question_marker.split(content)
    if len(parts) > 1:
        # Everything before the first marker is preamble, not a question.
        parts = parts[1:]

    questions = []
    for part in parts:
        problem, separator, solution = part.partition("Solution:")
        if not separator:
            # No solution section in this chunk, so there is nothing to verify.
            continue
        solution = solution.strip()
        # Intermediate steps come first, so the LAST match is the final answer.
        answers = (
            labelled_answer.findall(solution)
            or any_equation.findall(solution)
        )
        final_answer = answers[-1] if answers else "Not found"
        questions.append((problem.strip(), final_answer))
    return questions
 def verify_solution(problem, claimed_solution):
     """Verify a mathematical solution using Wolfram Alpha"""
     try:
 def compare_solutions(wolfram_sol, claude_sol):
     """Compare two solutions for mathematical equivalence"""
+    try:
+        # Convert both solutions to floats for comparison
+        w_val = float(wolfram_sol)
+        c_val = float(claude_sol)
+        return abs(w_val - c_val) < 0.001
+    except (ValueError, TypeError):
+        return False
 def generate_test(subject):
     """Generate and verify a math test"""
         For each question:
         1. State the problem clearly
         2. Provide your step-by-step solution
+        3. End each solution with a clear final numerical answer in the format: "Final answer = [number]"
         Use simple $$ for all math expressions."""
         message = anthropic.messages.create(
         # Add verification results
         verification_results = []
+        # Parse and verify each question
         verification_note = "\n\n## Solution Verification:\n"
         for i, (problem, solution) in enumerate(parse_questions(content)):
             result = verify_solution(problem, solution)
                 verification_note += "⚠️ Solution needs verification\n"
                 if result['wolfram_solution']:
                     verification_note += f"Wolfram Alpha got: {result['wolfram_solution']}\n"
+            verification_results.append(result)
         # Add usage statistics
         usage_stats = f"""
     except Exception as e:
         return f"Error: {str(e)}"
+# Subject choices and interface configuration remain the same...
 subjects = [
     "Single Variable Calculus",
     "Multivariable Calculus",