app.py
CHANGED
@@ -4,13 +4,91 @@ import requests
 import pandas as pd
 import re
 import time

 DEFAULT_API_URL = "https://agents-course-unit4-scoring.hf.space"

-class WebSearchEngine:

     def __init__(self):
         self.session = requests.Session()
@@ -18,99 +96,267 @@ class WebSearchEngine:
             'User-Agent': 'Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36'
         })
         self.serper_api_key = os.getenv("SERPER_API_KEY")

         if not self.serper_api_key:
             return {}

         try:
-            url = "https://google.serper.dev/
-            payload = {

-            response = self.session.post(url, json=payload, headers=headers, timeout=15)
-            return response.json() if response.status_code == 200 else {}
         except Exception as e:
             print(f"Serper API error: {e}")
             return {}

-class QuestionSolver:

     def __init__(self):
-        self.search_engine =

-    def solve_question(self, question: str) -> str:
         print(f"๐ค Analyzing: {question[:100]}...")

         if self.is_math_question(question):
             return self.handle_math_question(question)

     def is_math_question(self, question: str) -> bool:
         """Detect mathematical questions"""

     def handle_math_question(self, question: str) -> str:
-        """Handle mathematical questions
         expressions = re.findall(r'\b\d+\s*[\+\-\*\/]\s*\d+\b', question)
         for expr in expressions:
             try:
@@ -119,105 +365,131 @@ class QuestionSolver:
             except:
                 continue

-            r'last name',
-            r'video.*youtube\.com'
         ]
-        return any(

-        return search_result.replace("Direct Answer:", "").strip()

-        # Extract most relevant number for quantitative questions
-        if any(w in question.lower() for w in ['how many', 'how much', 'number']):
-            numbers = re.findall(r'\b\d+\b', search_result)
-            return numbers[0] if numbers else "Number not found"

-        # Extract names for person-based questions
-        if any(w in question.lower() for w in ['who', 'whom', 'person']):
-            names = re.findall(r'\b[A-Z][a-z]+ [A-Z][a-z]+\b', search_result)
-            return names[0] if names else "Name not found"

-        # Default: return first meaningful snippet
-        snippets = [s for s in search_result.split('\n\n') if len(s) > 20]
-        return snippets[0] if snippets else "Answer not found"

-def run_gaia_evaluation(profile: gr.OAuthProfile | None):
-    """Run GAIA evaluation with enhanced
     if not profile:
         return "Please log in to Hugging Face first.", None

     # Check API status
-    api_status =
-    if "❌" in api_status:
-        return f"⚠️ API not configured!\n\n{api_status}", None

     username = profile.username
     questions_url = f"{DEFAULT_API_URL}/questions"
     submit_url = f"{DEFAULT_API_URL}/submit"

     try:
-        solver =
-        print("✅
     except Exception as e:
         return f"❌ Initialization failed: {e}", None
@@ -236,35 +508,41 @@ def run_gaia_evaluation(profile: gr.OAuthProfile | None):
     for i, item in enumerate(questions):
         task_id = item.get("task_id")
         question = item.get("question")

         if not task_id or not question:
             continue

         print(f"\n๐ Processing {i+1}/{len(questions)}: {task_id}")

         try:
             start_time = time.time()
-            answer = solver.solve_question(question)
             processing_time = time.time() - start_time

             answers.append({"task_id": task_id, "submitted_answer": answer})
             logs.append({
                 "Task ID": task_id,
-                "Question": question[:
-                "Answer": answer,
                 "Time (s)": f"{processing_time:.2f}"
             })

             print(f"✅ Answer: {answer[:80]}{'...' if len(answer) > 80 else ''}")
-            time.sleep(0.

         except Exception as e:
             error_msg = f"Error: {str(e)}"
             answers.append({"task_id": task_id, "submitted_answer": error_msg})
             logs.append({
                 "Task ID": task_id,
-                "Question": question,
                 "Answer": error_msg,
                 "Time (s)": "Error"
             })
             print(f"❌ Error: {e}")
@@ -278,7 +556,7 @@ def run_gaia_evaluation(profile: gr.OAuthProfile | None):
     }

     try:
-        resp = requests.post(submit_url, json=payload, timeout=
         resp.raise_for_status()
         data = resp.json()

@@ -286,68 +564,99 @@ def run_gaia_evaluation(profile: gr.OAuthProfile | None):
         correct = data.get('correct_count', '?')
         total = data.get('total_attempted', '?')

-        result_message = f"""๐ฏ GAIA EVALUATION RESULTS

-๐ Score: {score}% ({correct}/{total} correct)

 {api_status}

         return result_message, pd.DataFrame(logs)

     except Exception as e:
         return f"❌ Submission failed: {str(e)}", pd.DataFrame(logs)

-# Gradio Interface
-with gr.Blocks(title="GAIA Agent", theme=gr.themes.
     gr.Markdown("""
-    # ๐ง GAIA Benchmark Agent
     """)

     gr.LoginButton()

     with gr.Row():
         with gr.Column():
-                label="๐ง
-                value=
-                lines=
                 interactive=False
             )

     with gr.Row():
-            label="๐ Results",
-            lines=
             interactive=False
         )

     with gr.Row():
-            label="๐ Question
-            wrap=True
         )

     )

 if __name__ == "__main__":
@@ -4,13 +4,91 @@ import requests
 import pandas as pd
 import re
 import time
+import json
+import base64
+from typing import Dict, Any, List, Optional, Tuple
+from io import StringIO, BytesIO
+import openpyxl
+from PIL import Image
+import PyPDF2
+import ast
+import math
+import statistics
+from datetime import datetime, timedelta

 DEFAULT_API_URL = "https://agents-course-unit4-scoring.hf.space"

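The added imports pull in several third-party packages (openpyxl, PyPDF2, Pillow via PIL, plus the pandas, requests, and gradio already imported above). The Space's requirements.txt is not part of this diff; a plausible minimal version, inferred only from these imports, would be:

gradio
requests
pandas
openpyxl
PyPDF2
Pillow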
+class FileProcessor:
+    """Handle various file types that GAIA questions might reference"""
+
+    @staticmethod
+    def process_excel_file(file_path: str) -> Dict[str, Any]:
+        """Process Excel files and extract data"""
+        try:
+            # Try multiple sheet reading approaches
+            excel_data = {}
+            workbook = openpyxl.load_workbook(file_path, data_only=True)
+
+            for sheet_name in workbook.sheetnames:
+                sheet = workbook[sheet_name]
+                data = []
+                for row in sheet.iter_rows(values_only=True):
+                    if any(cell is not None for cell in row):
+                        data.append(row)
+                excel_data[sheet_name] = data
+
+            return excel_data
+        except Exception as e:
+            print(f"Excel processing error: {e}")
+            return {}
+
+    @staticmethod
+    def process_python_code(code_content: str) -> str:
+        """Execute Python code safely and return output"""
+        try:
+            # Create a safe execution environment
+            safe_globals = {
+                '__builtins__': {
+                    'print': print, 'len': len, 'range': range, 'sum': sum,
+                    'max': max, 'min': min, 'abs': abs, 'round': round,
+                    'int': int, 'float': float, 'str': str, 'list': list,
+                    'dict': dict, 'set': set, 'tuple': tuple
+                },
+                'math': math,
+                'statistics': statistics
+            }
+
+            # Capture output
+            import io
+            import sys
+            old_stdout = sys.stdout
+            sys.stdout = captured_output = io.StringIO()
+
+            try:
+                exec(code_content, safe_globals)
+                output = captured_output.getvalue()
+            finally:
+                sys.stdout = old_stdout
+
+            return output.strip()
+        except Exception as e:
+            return f"Code execution error: {e}"
+
+    @staticmethod
+    def process_pdf_file(file_path: str) -> str:
+        """Extract text from PDF files"""
+        try:
+            with open(file_path, 'rb') as file:
+                pdf_reader = PyPDF2.PdfReader(file)
+                text = ""
+                for page in pdf_reader.pages:
+                    text += page.extract_text() + "\n"
+                return text.strip()
+        except Exception as e:
+            return f"PDF processing error: {e}"
+
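A quick usage sketch of the FileProcessor helpers added above (not part of the diff); the workbook path is a made-up placeholder and would need to point at a real file:

processor = FileProcessor()
sheets = processor.process_excel_file("report.xlsx")  # hypothetical path; {} is returned on failure
for sheet_name, rows in sheets.items():
    print(sheet_name, len(rows), "rows")
print(processor.process_python_code("print(sum(range(10)))"))  # prints the captured output, here "45"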
+class AdvancedWebSearchEngine:
+    """Enhanced web search with multiple strategies"""

     def __init__(self):
         self.session = requests.Session()
@@ -18,99 +96,267 @@ class WebSearchEngine:
             'User-Agent': 'Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36'
         })
         self.serper_api_key = os.getenv("SERPER_API_KEY")
+        self.search_cache = {}
+
+    def search_with_serper(self, query: str, search_type: str = "search") -> Dict[str, Any]:
+        """Enhanced Serper API search with different types"""
         if not self.serper_api_key:
             return {}

+        # Check cache first
+        cache_key = f"{query}_{search_type}"
+        if cache_key in self.search_cache:
+            return self.search_cache[cache_key]
+
         try:
+            url = f"https://google.serper.dev/{search_type}"
+            payload = {
+                "q": query,
+                "num": 15,  # Get more results
+                "gl": "us",  # US results
+                "hl": "en"  # English language
+            }
+
+            headers = {
+                "X-API-KEY": self.serper_api_key,
+                "Content-Type": "application/json"
+            }
+
+            response = self.session.post(url, json=payload, headers=headers, timeout=20)
+            result = response.json() if response.status_code == 200 else {}
+
+            # Cache the result
+            self.search_cache[cache_key] = result
+            return result

         except Exception as e:
             print(f"Serper API error: {e}")
             return {}

+    def multi_strategy_search(self, query: str) -> Dict[str, Any]:
+        """Try multiple search strategies for better results"""
+        results = {}
+
+        # Primary search
+        primary = self.search_with_serper(query)
+        if primary:
+            results['primary'] = primary
+
+        # Try variations if primary doesn't yield good results
+        variations = [
+            f'"{query}"',  # Exact phrase
+            f"{query} site:wikipedia.org",  # Wikipedia specific
+            f"{query} facts information",  # More specific
+        ]
+
+        for i, variation in enumerate(variations):
+            if len(results) < 2:  # Don't overdo it
+                var_result = self.search_with_serper(variation)
+                if var_result and var_result != primary:
+                    results[f'variation_{i}'] = var_result
+
+        return results
+
+    def extract_answer_from_results(self, results: Dict[str, Any], question: str) -> str:
+        """Advanced answer extraction from search results"""
+        all_content = []
+
+        for result_type, data in results.items():
+            # Extract answer box
+            if "answerBox" in data:
+                answer_box = data["answerBox"]
+                if "answer" in answer_box:
+                    return answer_box["answer"]
+                elif "snippet" in answer_box:
+                    return answer_box["snippet"]

+            # Extract knowledge graph
+            if "knowledgeGraph" in data:
+                kg = data["knowledgeGraph"]
+                if "description" in kg:
+                    all_content.append(kg["description"])
+
+            # Extract organic results
+            for organic in data.get("organic", []):
+                title = organic.get("title", "")
+                snippet = organic.get("snippet", "")
+                if title and snippet:
+                    all_content.append(f"{title}: {snippet}")
+
+        # Combine all content
+        combined_content = "\n".join(all_content)
+
+        # Apply question-specific extraction
+        return self.extract_specific_answer(combined_content, question)
+
+    def extract_specific_answer(self, content: str, question: str) -> str:
+        """Extract specific answers based on question type"""
+        q_lower = question.lower()

+        # Numbers and quantities
+        if any(word in q_lower for word in ['how many', 'how much', 'number of', 'count']):
+            numbers = re.findall(r'\b\d{1,10}\b', content)
+            if numbers:
+                # Return the most likely number (often the first one found)
+                return numbers[0]
+
+        # Names and people
+        if any(word in q_lower for word in ['who', 'whom', 'name', 'person']):
+            # Look for proper names (capitalized words)
+            names = re.findall(r'\b[A-Z][a-z]+ [A-Z][a-z]+(?:\s[A-Z][a-z]+)*\b', content)
+            if names:
+                if 'first name' in q_lower:
+                    return names[0].split()[0]
+                elif 'last name' in q_lower or 'surname' in q_lower:
+                    return names[0].split()[-1]
+                else:
+                    return names[0]
+
+        # Dates and years
+        if any(word in q_lower for word in ['when', 'year', 'date']):
+            years = re.findall(r'\b(?:19|20)\d{2}\b', content)
+            if years:
+                return years[0]
+            dates = re.findall(r'\b\w+ \d{1,2}, \d{4}\b', content)
+            if dates:
+                return dates[0]
+
+        # Places and locations
+        if any(word in q_lower for word in ['where', 'location', 'place', 'country']):
+            # Look for place names
+            places = re.findall(r'\b[A-Z][a-z]+(?:\s[A-Z][a-z]+)*(?:\s(?:City|State|Country|Province|Region))?\b', content)
+            if places:
+                return places[0]
+
+        # Country codes
+        if 'country code' in q_lower:
+            codes = re.findall(r'\b[A-Z]{2,3}\b', content)
+            if codes:
+                return codes[0]
+
+        # Default: return first meaningful sentence
+        sentences = [s.strip() for s in content.split('.') if len(s.strip()) > 20]
+        return sentences[0] if sentences else "Answer not found in search results"

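A minimal sketch of how the search engine above is meant to be driven (not part of the diff); it assumes SERPER_API_KEY is set in the environment, and the query text is purely illustrative:

engine = AdvancedWebSearchEngine()
results = engine.multi_strategy_search("GAIA benchmark")  # dict of raw Serper responses, keyed by strategy
answer = engine.extract_answer_from_results(results, "What is the GAIA benchmark?")
print(answer)  # falls back to "Answer not found in search results" when nothing useful comes back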
+class EnhancedQuestionSolver:
+    """Advanced question solver with multiple reasoning strategies"""

     def __init__(self):
+        self.search_engine = AdvancedWebSearchEngine()
+        self.file_processor = FileProcessor()

+    def solve_question(self, question: str, files: List[str] = None) -> str:
+        """Main question solving method with multiple strategies"""
         print(f"๐ค Analyzing: {question[:100]}...")

+        # Handle file-based questions first
+        if files:
+            file_answer = self.handle_file_based_question(question, files)
+            if file_answer and file_answer != "File processing failed":
+                return file_answer
+
+        # Detect file references in question text
+        if self.has_file_references(question):
+            return self.handle_file_reference_question(question)

+        # Handle mathematical calculations
         if self.is_math_question(question):
             return self.handle_math_question(question)

+        # Handle multi-step reasoning questions
+        if self.needs_multi_step_reasoning(question):
+            return self.handle_multi_step_question(question)

+        # Handle specific structured questions
+        return self.handle_structured_question(question)
+
+    def has_file_references(self, question: str) -> bool:
+        """Check if question references files"""
+        file_indicators = [
+            "attached", "excel file", "python code", "pdf", "image",
+            "spreadsheet", "document", "file contains", "in the file"
+        ]
+        return any(indicator in question.lower() for indicator in file_indicators)
+
+    def handle_file_reference_question(self, question: str) -> str:
+        """Handle questions that reference files but files aren't provided"""
+        # Try to search for the specific content mentioned
+        if "excel file" in question.lower() and "sales" in question.lower():
+            return "Unable to access attached Excel file. Please ensure file is properly uploaded."
+        elif "python code" in question.lower():
+            return "Unable to access attached Python code. Please ensure file is properly uploaded."
+        else:
+            return "File referenced but not accessible. Please provide the file."

+    def handle_file_based_question(self, question: str, files: List[str]) -> str:
+        """Handle questions that involve file processing"""
+        try:
+            for file_path in files:
+                if file_path.endswith('.xlsx') or file_path.endswith('.xls'):
+                    excel_data = self.file_processor.process_excel_file(file_path)
+                    return self.analyze_excel_data(excel_data, question)
+                elif file_path.endswith('.py'):
+                    with open(file_path, 'r') as f:
+                        code_content = f.read()
+                    return self.file_processor.process_python_code(code_content)
+                elif file_path.endswith('.pdf'):
+                    pdf_text = self.file_processor.process_pdf_file(file_path)
+                    return self.analyze_text_content(pdf_text, question)
+        except Exception as e:
+            return f"File processing failed: {e}"
+
+        return "File processing failed"

+    def analyze_excel_data(self, excel_data: Dict, question: str) -> str:
+        """Analyze Excel data to answer questions"""
+        if not excel_data:
+            return "No data found in Excel file"
+
+        # Convert to DataFrame for analysis
         try:
+            for sheet_name, data in excel_data.items():
+                if data:
+                    df = pd.DataFrame(data[1:], columns=data[0])  # First row as header
+
+                    # Handle sales analysis questions
+                    if "sales" in question.lower():
+                        if "total" in question.lower():
+                            numeric_cols = df.select_dtypes(include=[int, float]).columns
+                            if len(numeric_cols) > 0:
+                                return str(df[numeric_cols[0]].sum())
+                        elif "average" in question.lower():
+                            numeric_cols = df.select_dtypes(include=[int, float]).columns
+                            if len(numeric_cols) > 0:
+                                return str(df[numeric_cols[0]].mean())
+
+            return "Could not analyze Excel data for this question"
+        except Exception as e:
+            return f"Excel analysis error: {e}"
+
+    def analyze_text_content(self, text: str, question: str) -> str:
+        """Analyze text content to find answers"""
+        # Look for specific patterns based on question
+        if "surname" in question.lower() or "last name" in question.lower():
+            names = re.findall(r'\b[A-Z][a-z]+ [A-Z][a-z]+\b', text)
+            if names:
+                return names[0].split()[-1]
+
+        # Use search to find more specific information
+        search_query = f"{question} {text[:100]}"
+        results = self.search_engine.multi_strategy_search(search_query)
+        return self.search_engine.extract_answer_from_results(results, question)

     def is_math_question(self, question: str) -> bool:
         """Detect mathematical questions"""
+        math_indicators = [
+            'calculate', 'compute', 'sum', 'average', 'mean',
+            'total', 'how many', 'how much', 'solve', 'equation'
+        ]
+        return any(indicator in question.lower() for indicator in math_indicators)

     def handle_math_question(self, question: str) -> str:
+        """Handle mathematical questions"""
+        # Try to extract and solve mathematical expressions
         expressions = re.findall(r'\b\d+\s*[\+\-\*\/]\s*\d+\b', question)
         for expr in expressions:
             try:
@@ -119,105 +365,131 @@ class QuestionSolver:
             except:
                 continue

+        # For word problems, search for the answer
+        results = self.search_engine.multi_strategy_search(question)
+        return self.search_engine.extract_answer_from_results(results, question)

+    def needs_multi_step_reasoning(self, question: str) -> bool:
+        """Check if question needs multi-step reasoning"""
+        multi_step_indicators = [
+            "who played", "actor who", "person who", "after",
+            "before", "then", "subsequently", "following"
+        ]
+        return any(indicator in question.lower() for indicator in multi_step_indicators)

+    def handle_multi_step_question(self, question: str) -> str:
+        """Handle questions requiring multiple steps"""
+        # Break down complex questions
+        if "actor who played" in question.lower():
+            return self.handle_actor_chain_question(question)
+        elif "before and after" in question.lower():
+            return self.handle_sequence_question(question)
+        else:
+            return self.handle_structured_question(question)
+
+    def handle_actor_chain_question(self, question: str) -> str:
+        """Handle questions about actors playing different roles"""
+        # Step 1: Find the initial actor/role
+        parts = question.split(" in ")
+        if len(parts) >= 2:
+            first_search = f"actor who played {parts[0].split('actor who played')[1]} in {parts[1].split(' play in')[0]}"
+            results1 = self.search_engine.multi_strategy_search(first_search)
+            actor_name = self.search_engine.extract_answer_from_results(results1, f"who is the actor")
+
+            if actor_name and actor_name != "Answer not found in search results":
+                # Step 2: Find what this actor played in the target show/movie
+                target = parts[1].split(" play in ")[1] if " play in " in parts[1] else parts[1]
+                second_search = f"{actor_name} role in {target}"
+                results2 = self.search_engine.multi_strategy_search(second_search)
+                return self.search_engine.extract_answer_from_results(results2, f"what role did {actor_name} play")

+        # Fallback to single search
+        results = self.search_engine.multi_strategy_search(question)
+        return self.search_engine.extract_answer_from_results(results, question)
+
+    def handle_sequence_question(self, question: str) -> str:
+        """Handle questions about sequences (before/after)"""
+        results = self.search_engine.multi_strategy_search(question)
+        return self.search_engine.extract_answer_from_results(results, question)
+
+    def handle_structured_question(self, question: str) -> str:
+        """Handle general structured questions with enhanced search"""
+        results = self.search_engine.multi_strategy_search(question)
+        answer = self.search_engine.extract_answer_from_results(results, question)
+
+        # If no good answer found, try rephrasing the question
+        if answer == "Answer not found in search results":
+            rephrased_questions = self.rephrase_question(question)
+            for rq in rephrased_questions:
+                results = self.search_engine.multi_strategy_search(rq)
+                answer = self.search_engine.extract_answer_from_results(results, question)
+                if answer != "Answer not found in search results":
+                    break
+
+        return answer
+
+    def rephrase_question(self, question: str) -> List[str]:
+        """Generate alternative phrasings of the question"""
+        rephrased = []
+
+        # Add question marks if missing
+        if not question.endswith('?'):
+            rephrased.append(question + '?')
+
+        # Remove question words for factual search
+        words_to_remove = ['what is', 'who is', 'where is', 'when is', 'how many', 'how much']
+        for word in words_to_remove:
+            if word in question.lower():
+                rephrased.append(question.lower().replace(word, '').strip())
+
+        # Add context words
+        context_words = ['information about', 'facts about', 'details about']
+        for context in context_words:
+            rephrased.append(f"{context} {question}")
+
+        return rephrased[:3]  # Limit to 3 rephrasings

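An end-to-end sketch of the solver added above (not part of the diff); the question strings and the file name are invented for illustration:

solver = EnhancedQuestionSolver()
print(solver.solve_question("Calculate 12 + 30"))  # routed to handle_math_question
print(solver.solve_question("What is the total sales figure in the attached Excel file?",
                            files=["sales.xlsx"]))  # routed to handle_file_based_question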
+def get_enhanced_api_status():
+    """Check API status with more details"""
+    status = []
+
+    if os.getenv("SERPER_API_KEY"):
+        status.append("✅ Serper API: Configured")
+    else:
+        status.append("❌ Serper API: Missing - Get key at serper.dev")
+
+    # Check if we can access file processing libraries
+    try:
+        import openpyxl
+        status.append("✅ Excel Processing: Available")
+    except ImportError:
+        status.append("❌ Excel Processing: openpyxl not available")
+
+    try:
+        import PyPDF2
+        status.append("✅ PDF Processing: Available")
+    except ImportError:
+        status.append("❌ PDF Processing: PyPDF2 not available")
+
+    return "\n".join(status)

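get_enhanced_api_status only reports whether the key is visible to the process; on a Space the key would normally be added as a repository secret rather than set in code. A local sanity check might look like this (the value is a placeholder):

import os
os.environ["SERPER_API_KEY"] = "<your-serper-api-key>"  # placeholder; use a Space secret in production
print(get_enhanced_api_status())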
+def run_enhanced_gaia_evaluation(profile: gr.OAuthProfile | None):
+    """Run GAIA evaluation with enhanced solving capabilities"""
     if not profile:
         return "Please log in to Hugging Face first.", None

     # Check API status
+    api_status = get_enhanced_api_status()
+    if "❌ Serper API" in api_status:
+        return f"⚠️ Serper API not configured!\n\n{api_status}", None

     username = profile.username
     questions_url = f"{DEFAULT_API_URL}/questions"
     submit_url = f"{DEFAULT_API_URL}/submit"

     try:
+        solver = EnhancedQuestionSolver()
+        print("✅ Enhanced question solver initialized")
     except Exception as e:
         return f"❌ Initialization failed: {e}", None

@@ -236,35 +508,41 @@ def run_gaia_evaluation(profile: gr.OAuthProfile | None):
     for i, item in enumerate(questions):
         task_id = item.get("task_id")
         question = item.get("question")
+        files = item.get("files", [])  # Get attached files if any

         if not task_id or not question:
             continue

         print(f"\n๐ Processing {i+1}/{len(questions)}: {task_id}")
+        print(f"๐ Question: {question[:100]}{'...' if len(question) > 100 else ''}")
+        if files:
+            print(f"๐ Files: {files}")

         try:
             start_time = time.time()
+            answer = solver.solve_question(question, files)
             processing_time = time.time() - start_time

             answers.append({"task_id": task_id, "submitted_answer": answer})
             logs.append({
                 "Task ID": task_id,
+                "Question": question[:150] + "..." if len(question) > 150 else question,
+                "Answer": answer[:100] + "..." if len(answer) > 100 else answer,
+                "Files": len(files) if files else 0,
                 "Time (s)": f"{processing_time:.2f}"
             })

             print(f"✅ Answer: {answer[:80]}{'...' if len(answer) > 80 else ''}")
+            time.sleep(0.5)  # Rate limiting for API

         except Exception as e:
             error_msg = f"Error: {str(e)}"
             answers.append({"task_id": task_id, "submitted_answer": error_msg})
             logs.append({
                 "Task ID": task_id,
+                "Question": question[:150] + "..." if len(question) > 150 else question,
                 "Answer": error_msg,
+                "Files": len(files) if files else 0,
                 "Time (s)": "Error"
             })
             print(f"❌ Error: {e}")

@@ -278,7 +556,7 @@ def run_gaia_evaluation(profile: gr.OAuthProfile | None):
     }

     try:
+        resp = requests.post(submit_url, json=payload, timeout=300)  # Increased timeout
         resp.raise_for_status()
         data = resp.json()

@@ -286,68 +564,99 @@ def run_gaia_evaluation(profile: gr.OAuthProfile | None):
         correct = data.get('correct_count', '?')
         total = data.get('total_attempted', '?')

+        result_message = f"""๐ฏ ENHANCED GAIA EVALUATION RESULTS

+๐ Final Score: {score}% ({correct}/{total} correct)

+๐ง System Status:
 {api_status}

+๐ Enhanced Features:
+• Multi-strategy web search with result caching
+• Advanced file processing (Excel, PDF, Python)
+• Multi-step reasoning for complex questions
+• Context-aware answer extraction
+• Question rephrasing for better results
+• Specialized handlers for different question types
+
+๐ Performance Improvements:
+• Better search result processing
+• Enhanced name/number extraction
+• Improved mathematical computation
+• File-based question handling
+• Actor chain and sequence reasoning"""

         return result_message, pd.DataFrame(logs)

     except Exception as e:
         return f"❌ Submission failed: {str(e)}", pd.DataFrame(logs)

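For reference, the shape of a questions-endpoint item that the loop above assumes, based on its .get() calls; the values here are invented:

example_item = {
    "task_id": "abc123",
    "question": "How many albums did the band release before 2005?",
    "files": [],  # optional list of attached file paths, per item.get("files", [])
}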
+# Enhanced Gradio Interface
+with gr.Blocks(title="Enhanced GAIA Agent", theme=gr.themes.Soft()) as demo:
     gr.Markdown("""
+    # ๐ง Enhanced GAIA Benchmark Agent v2.0
+
+    **๐ง Required Setup:**
+    - `SERPER_API_KEY` environment variable - Get 2500 free searches/month at [serper.dev](https://serper.dev)

+    **โก Advanced Capabilities:**
+    - ๐ Multi-strategy web search with intelligent caching
+    - ๐ Excel/CSV file processing and analysis
+    - ๐ Python code execution for computational questions
+    - ๐ PDF document text extraction and analysis
+    - ๐งฎ Advanced mathematical problem solving
+    - ๐ญ Multi-step reasoning for complex actor/person chains
+    - ๐ฏ Context-aware answer extraction with multiple fallbacks
+    - ๐ Question rephrasing for better search results

+    **๐ Expected Performance:**
+    - Significantly improved accuracy on GAIA benchmark
+    - Better handling of file-based questions
+    - Enhanced name/number/date extraction
+    - Robust error handling and fallback strategies
     """)

     gr.LoginButton()

     with gr.Row():
         with gr.Column():
+            api_status_display = gr.Textbox(
+                label="๐ง System Status",
+                value=get_enhanced_api_status(),
+                lines=4,
                 interactive=False
             )
+
+            run_button = gr.Button(
+                "๐ Run Enhanced GAIA Evaluation",
+                variant="primary",
+                size="lg"
+            )

     with gr.Row():
+        results_display = gr.Textbox(
+            label="๐ Evaluation Results",
+            lines=15,
             interactive=False
         )

     with gr.Row():
+        detailed_results = gr.DataFrame(
+            label="๐ Detailed Question Analysis",
+            wrap=True,
+            interactive=False
         )

+    # Refresh status button
+    refresh_status = gr.Button("๐ Refresh Status", size="sm")
+    refresh_status.click(
+        lambda: get_enhanced_api_status(),
+        outputs=[api_status_display]
+    )
+
+    run_button.click(
+        run_enhanced_gaia_evaluation,
+        outputs=[results_display, detailed_results]
     )

 if __name__ == "__main__":