Spaces:

LamiaYT
/

gaia-llamaindex-agent

Sleeping

App Files Files Community

LamiaYT commited on Jun 25

Commit

72146a4

1 Parent(s): 0fda38b

Fix LLM conflicts and environment issues

Browse files

Files changed (2) hide show

agent/local_llm.py +49 -18
app.py +63 -23

agent/local_llm.py CHANGED Viewed

@@ -1,4 +1,3 @@
-# File: agent/local_llm.py
 try:
     from transformers import AutoModelForCausalLM, AutoTokenizer
     from llama_index.llms.huggingface import HuggingFaceLLM
@@ -9,8 +8,8 @@ except ImportError as e:
 class LocalLLM:
     def __init__(self):
-        # Use smaller model that works reliably
-        self.model_name = "microsoft/DialoGPT-medium"
         print(f"Initializing LocalLLM with model: {self.model_name}")
         self.llm = self._create_llama_index_llm()
@@ -31,15 +30,19 @@ class LocalLLM:
             )
             print("Creating LlamaIndex LLM...")
             llm = HuggingFaceLLM(
                 model=model,
                 tokenizer=tokenizer,
                 generate_kwargs={
                     "do_sample": True,
                     "temperature": 0.7,
-                    "max_new_tokens": 256,
                     "pad_token_id": tokenizer.eos_token_id
-                }
             )
             print("LLM created successfully!")
@@ -54,21 +57,49 @@ class LocalLLM:
         """Fallback to a very basic model"""
         print("Using fallback model: gpt2")
         model_name = "gpt2"
-        tokenizer = AutoTokenizer.from_pretrained(model_name)
-        tokenizer.pad_token = tokenizer.eos_token
-        model = AutoModelForCausalLM.from_pretrained(model_name)
-        return HuggingFaceLLM(
-            model=model,
-            tokenizer=tokenizer,
-            generate_kwargs={
-                "do_sample": True,
-                "temperature": 0.7,
-                "max_new_tokens": 256,
-                "pad_token_id": tokenizer.eos_token_id
-            }
-        )
     def get_llm(self):
         """Return the LlamaIndex LLM instance"""

 try:
     from transformers import AutoModelForCausalLM, AutoTokenizer
     from llama_index.llms.huggingface import HuggingFaceLLM
 class LocalLLM:
     def __init__(self):
+        # Use a simple, reliable model that works well with LlamaIndex
+        self.model_name = "microsoft/DialoGPT-small"  # Changed to smaller model
         print(f"Initializing LocalLLM with model: {self.model_name}")
         self.llm = self._create_llama_index_llm()
             )
             print("Creating LlamaIndex LLM...")
+            # Fix the generate_kwargs to avoid conflicts
             llm = HuggingFaceLLM(
                 model=model,
                 tokenizer=tokenizer,
+                # Simplified generate_kwargs to avoid conflicts
                 generate_kwargs={
                     "do_sample": True,
                     "temperature": 0.7,
                     "pad_token_id": tokenizer.eos_token_id
+                },
+                # Set these parameters at the LLM level instead
+                max_new_tokens=256,
+                device_map="auto" if torch.cuda.is_available() else None
             )
             print("LLM created successfully!")
         """Fallback to a very basic model"""
         print("Using fallback model: gpt2")
         model_name = "gpt2"
+        try:
+            tokenizer = AutoTokenizer.from_pretrained(model_name)
+            tokenizer.pad_token = tokenizer.eos_token
+            model = AutoModelForCausalLM.from_pretrained(model_name)
+            return HuggingFaceLLM(
+                model=model,
+                tokenizer=tokenizer,
+                generate_kwargs={
+                    "do_sample": True,
+                    "temperature": 0.7,
+                    "pad_token_id": tokenizer.eos_token_id
+                },
+                max_new_tokens=256
+            )
+        except Exception as e:
+            print(f"Even fallback model failed: {str(e)}")
+            # Return a mock LLM for testing
+            return self._create_mock_llm()
+    def _create_mock_llm(self):
+        """Create a mock LLM for testing when models fail"""
+        print("Creating mock LLM for testing...")
+        class MockLLM:
+            def chat(self, messages, **kwargs):
+                # Simple mock response
+                class MockResponse:
+                    def __init__(self, text):
+                        self.message = type('obj', (object,), {'content': text})
+                return MockResponse("This is a mock response. The actual LLM failed to load.")
+            def complete(self, prompt, **kwargs):
+                class MockCompletion:
+                    def __init__(self, text):
+                        self.text = text
+                return MockCompletion("Mock completion response.")
+        return MockLLM()
     def get_llm(self):
         """Return the LlamaIndex LLM instance"""

app.py CHANGED Viewed

@@ -5,25 +5,32 @@ import traceback
 from typing import List, Dict
 import gradio as gr
-import nltk
-# --- Environment variable setup to fix permission issues in Spaces or restricted envs ---
 os.environ["NLTK_DATA"] = "/tmp/nltk_data"
 os.environ["MPLCONFIGDIR"] = "/tmp/matplotlib"
-os.environ["TRANSFORMERS_CACHE"] = "/tmp/huggingface_cache"
-# Download required NLTK data upfront
-nltk.download('punkt', download_dir=os.environ["NLTK_DATA"])
 # Add current directory to path for local imports
 sys.path.append(os.path.dirname(os.path.abspath(__file__)))
-# Import GaiaAPI early
 from utils.gaia_api import GaiaAPI
 # Initialize global agent state
 AGENT_READY = False
 agent = None
 # Import agent-related modules and initialize
 try:
@@ -41,28 +48,38 @@ try:
     print("Creating ReAct Agent...")
     memory = ChatMemoryBuffer.from_defaults(token_limit=2000)
-    agent = ReActAgent.from_tools(
-        tools=gaia_tools,
-        llm=llm,
-        memory=memory,
-        verbose=True,
-        max_iterations=3
-    )
-    print("Agent initialized successfully!")
-    AGENT_READY = True
 except Exception as e:
     print(f"Failed to initialize agent: {str(e)}")
     traceback.print_exc()
     AGENT_READY = False
     agent = None
 def process_single_question(question_text: str) -> str:
     """Process a single GAIA question through the agent"""
     if not AGENT_READY:
-        return "❌ Agent not ready. Please check the logs for initialization errors."
     if not question_text.strip():
         return "❌ Please enter a question."
@@ -73,7 +90,16 @@ Answer the following question directly and concisely. Do not include "FINAL ANSW
 Question: {question_text}
 """
-        response = agent.query(enhanced_prompt)
         answer = str(response).strip()
         # Remove common prefixes from the answer
@@ -84,7 +110,7 @@ Question: {question_text}
         return answer
     except Exception as e:
-        return f"❌ Error: {str(e)}\n\n{traceback.format_exc()}"
 def process_all_questions() -> str:
@@ -108,6 +134,7 @@ def process_all_questions() -> str:
             json.dump(processed_answers, f, indent=2)
         summary = f"✅ Processed {len(processed_answers)} questions.\n"
         summary += "First 3 answers:\n"
         for ans in processed_answers[:3]:
             summary += f"- {ans['task_id']}: {ans['submitted_answer'][:50]}...\n"
@@ -115,7 +142,7 @@ def process_all_questions() -> str:
         return summary
     except Exception as e:
-        return f"❌ Error: {str(e)}\n\n{traceback.format_exc()}"
 def submit_to_gaia(username: str, code_url: str) -> str:
@@ -152,13 +179,14 @@ def get_sample_question() -> str:
 # ---------- Gradio UI ----------
-with gr.Blocks(title="🦙 GAIA LlamaIndex Agent") as demo:
     gr.Markdown(f"""
 # 🦙 GAIA Benchmark Agent with LlamaIndex
 This agent uses LlamaIndex with a local LLM to tackle GAIA benchmark questions.
 **Status:** {"✅ Ready" if AGENT_READY else "❌ Not Ready"}
 """)
     with gr.Tab("🔬 Test Single Question"):
@@ -219,13 +247,25 @@ Submit your processed answers to the GAIA benchmark for official scoring.
 This agent uses:
 - **LlamaIndex** (ReAct Agent + Tools)
-- **Local LLM** (e.g., DialoGPT or fallback GPT2)
 - **GAIA Tools** (question fetch, file reader, math, etc.)
 ## Current Status
 - Agent Ready: {"✅ Yes" if AGENT_READY else "❌ No"}
 - Tools Loaded: {len(gaia_tools) if 'gaia_tools' in globals() else 0}
 """)
 if __name__ == "__main__":
-    demo.launch(server_name="0.0.0.0", server_port=7860, show_error=True)

 from typing import List, Dict
 import gradio as gr
+# --- Environment variable setup to fix permission issues ---
 os.environ["NLTK_DATA"] = "/tmp/nltk_data"
 os.environ["MPLCONFIGDIR"] = "/tmp/matplotlib"
+os.environ["HF_HOME"] = "/tmp/huggingface_cache"  # Updated from TRANSFORMERS_CACHE
+os.environ["TORCH_HOME"] = "/tmp/torch_cache"
+# Import nltk AFTER setting environment variables
+try:
+    import nltk
+    # Download required NLTK data upfront
+    nltk.download('punkt', download_dir=os.environ["NLTK_DATA"], quiet=True)
+    nltk.download('stopwords', download_dir=os.environ["NLTK_DATA"], quiet=True)
+except Exception as e:
+    print(f"NLTK setup warning: {e}")
 # Add current directory to path for local imports
 sys.path.append(os.path.dirname(os.path.abspath(__file__)))
+# Import GaiaAPI early (this fixes the undefined error)
 from utils.gaia_api import GaiaAPI
 # Initialize global agent state
 AGENT_READY = False
 agent = None
+initialization_error = None
 # Import agent-related modules and initialize
 try:
     print("Creating ReAct Agent...")
     memory = ChatMemoryBuffer.from_defaults(token_limit=2000)
+    # Only create ReAct agent if we have a proper LLM
+    if hasattr(llm, 'chat') and not llm.__class__.__name__ == 'MockLLM':
+        agent = ReActAgent.from_tools(
+            tools=gaia_tools,
+            llm=llm,
+            memory=memory,
+            verbose=True,
+            max_iterations=3
+        )
+        print("Agent initialized successfully!")
+        AGENT_READY = True
+    else:
+        print("Using mock mode - agent partially ready")
+        agent = llm  # Use the mock LLM directly
+        AGENT_READY = True
 except Exception as e:
     print(f"Failed to initialize agent: {str(e)}")
     traceback.print_exc()
     AGENT_READY = False
     agent = None
+    initialization_error = str(e)
 def process_single_question(question_text: str) -> str:
     """Process a single GAIA question through the agent"""
     if not AGENT_READY:
+        error_msg = "❌ Agent not ready. "
+        if initialization_error:
+            error_msg += f"Error: {initialization_error}"
+        return error_msg
     if not question_text.strip():
         return "❌ Please enter a question."
 Question: {question_text}
 """
+        # Handle both ReAct agent and mock LLM
+        if hasattr(agent, 'query'):
+            response = agent.query(enhanced_prompt)
+        elif hasattr(agent, 'chat'):
+            response = agent.chat([{"role": "user", "content": enhanced_prompt}])
+            response = response.message.content if hasattr(response, 'message') else str(response)
+        else:
+            response = "Mock response: I would analyze this question and provide an answer."
         answer = str(response).strip()
         # Remove common prefixes from the answer
         return answer
     except Exception as e:
+        return f"❌ Error: {str(e)}"
 def process_all_questions() -> str:
             json.dump(processed_answers, f, indent=2)
         summary = f"✅ Processed {len(processed_answers)} questions.\n"
+        summary += "Answers saved to gaia_answers.json\n"
         summary += "First 3 answers:\n"
         for ans in processed_answers[:3]:
             summary += f"- {ans['task_id']}: {ans['submitted_answer'][:50]}...\n"
         return summary
     except Exception as e:
+        return f"❌ Error: {str(e)}"
 def submit_to_gaia(username: str, code_url: str) -> str:
 # ---------- Gradio UI ----------
+with gr.Blocks(title="🦙 GAIA LlamaIndex Agent", theme=gr.themes.Soft()) as demo:
     gr.Markdown(f"""
 # 🦙 GAIA Benchmark Agent with LlamaIndex
 This agent uses LlamaIndex with a local LLM to tackle GAIA benchmark questions.
 **Status:** {"✅ Ready" if AGENT_READY else "❌ Not Ready"}
+{f"**Error:** {initialization_error}" if initialization_error else ""}
 """)
     with gr.Tab("🔬 Test Single Question"):
 This agent uses:
 - **LlamaIndex** (ReAct Agent + Tools)
+- **Local LLM** (DialoGPT-small with fallback to GPT2 or mock)
 - **GAIA Tools** (question fetch, file reader, math, etc.)
 ## Current Status
 - Agent Ready: {"✅ Yes" if AGENT_READY else "❌ No"}
 - Tools Loaded: {len(gaia_tools) if 'gaia_tools' in globals() else 0}
+- Initialization Error: {initialization_error or "None"}
+## Environment Variables Set
+- NLTK_DATA: {os.environ.get('NLTK_DATA', 'Not set')}
+- HF_HOME: {os.environ.get('HF_HOME', 'Not set')}
+- MPLCONFIGDIR: {os.environ.get('MPLCONFIGDIR', 'Not set')}
+## Usage Tips
+1. Start with the "Test Single Question" tab
+2. Try the sample question first
+3. If agent works, proceed to "Full Evaluation"
+4. Submit to GAIA when ready
 """)
 if __name__ == "__main__":
+    demo.launch(server_name="0.0.0.0", server_port=7860, show_error=True)