Spaces:

palbha
/

websearch_agent

Running

App Files Files Community

palbha commited on Mar 8

Commit

9a894d2

verified ·

1 Parent(s): 59a00f5

Update app.py

Browse files

Files changed (1) hide show

app.py +83 -61

app.py CHANGED Viewed

@@ -1,72 +1,94 @@
 import gradio as gr
-from smolagents import CodeAgent, HfApiModel  # adjust the import to your actual smolagents module
-# Step 1: Set up your smolagents agent.
-def create_agent():
     """
-    Initialize and return the agent.
-    Adjust parameters like model type or configuration as needed.
     """
-    # For example, we initialize a CodeAgent with a sample model.
-    agent = CodeAgent(
-        tools=[],
-        model=HfApiModel(model_id='https://pflgm2locj2t89co.us-east-1.aws.endpoints.huggingface.cloud/')
     )
-    return agent
-# Create the agent instance once so that it persists across user interactions.
-agent = create_agent()
-def combine_messages(messages: list[dict]) -> str:
-    """
-    Helper function to combine a list of message dictionaries into a single string.
-    Each message is prefixed with its role.
-    """
-    conversation = ""
-    for msg in messages:
-        # Capitalize the role (e.g., 'User' instead of 'user') for clarity.
-        conversation += f"{msg['role'].capitalize()}: {msg['content']}\n"
-    return conversation.strip()
-def respond(message, history: list[tuple[str, str]], system_message, max_tokens, temperature, top_p):
-    """
-    Build the conversation history, combine messages into a single string prompt,
-    call the smolagents agent, and stream the response back to Gradio.
-    """
-    # Build the conversation messages list, starting with the system prompt.
-    messages = [{"role": "system", "content": system_message}]
-    for user_msg, assistant_msg in history:
-        if user_msg:
-            messages.append({"role": "user", "content": user_msg})
-        if assistant_msg:
-            messages.append({"role": "assistant", "content": assistant_msg})
-    # Add the latest user input.
-    messages.append({"role": "user", "content": message})
-    # Combine the list of messages into a single string prompt.
-    prompt = combine_messages(messages)
-    # Now call the agent with the prompt.
-    complete_response = agent.run(prompt)
-    yield complete_response
-# Step 3: Create the Gradio ChatInterface.
-demo = gr.ChatInterface(
-    fn=respond,
-    additional_inputs=[
-        gr.Textbox(value="You are a friendly Chatbot.", label="System message"),
-        gr.Slider(minimum=1, maximum=2048, value=512, step=1, label="Max new tokens"),
-        gr.Slider(minimum=0.1, maximum=4.0, value=0.7, step=0.1, label="Temperature"),
-        gr.Slider(
-            minimum=0.1,
-            maximum=1.0,
-            value=0.95,
-            step=0.05,
-            label="Top-p (nucleus sampling)"
-        ),
-    ],
-)
-# Step 4: Launch the Gradio app.
-if __name__ == "__main__":
-    demo.launch()

 import gradio as gr
+from smolagents import CodeAgent,HfApiModel DuckDuckGoSearchTool, tool
+from smolagents.agents import ActionStep
+from time import sleep
+import helium
+from PIL import Image
+from io import BytesIO
+import os
+# Define a function to search images and return the image path for display
+@tool
+def search_images_for_presentation(query: str):
     """
+    Searches for images related to the given query on the web (using DuckDuckGo search).
+    Args:
+        query: The query to search for images or logos.
     """
+    helium.go_to("https://duckduckgo.com/")
+    search_box = helium.find(S("input[type='text']"))
+    search_box.write(query)
+    search_box.press(Keys.ENTER)
+    # Wait for search results to load
+    sleep(3)
+    # Scroll down and search for images related to the query
+    search_item_ctrl_f("image", nth_result=1)
+    # Simulate an image being found (as example)
+    image_path = "path/to/some_image.png"  # Replace with actual image capture logic
+    return image_path
+# Modified tool to capture screenshots and return image path
+def save_image_from_browser(memory_step: ActionStep, agent: CodeAgent) -> None:
+    sleep(1.0)  # Allow browser elements to load
+    driver = helium.get_driver()
+    current_step = memory_step.step_number
+    if driver is not None:
+        # Capture browser screenshot
+        png_bytes = driver.get_screenshot_as_png()
+        image = Image.open(BytesIO(png_bytes))
+        image_dir = "images"
+        os.makedirs(image_dir, exist_ok=True)
+        image_path = f"{image_dir}/captured_image_{current_step}.png"
+        # Save image locally
+        image.save(image_path)
+        print(f"Captured and saved an image: {image_path}")
+        memory_step.observations_images = [image.copy()]
+    # Update observations with the current URL for reference:
+    url_info = f"Current url: {driver.current_url}"
+    memory_step.observations = (
+        url_info if memory_step.observations is None else memory_step.observations + "\n" + url_info
     )
+    return image_path
+# Initialize agent (same as before)
+def initialize_agent(model):
+    return CodeAgent(
+        tools=[DuckDuckGoSearchTool(), save_image_from_browser, search_images_for_presentation],
+        model=model,
+        max_steps=20,
+        verbosity_level=2,
+    )
+def run_agent(query: str):
+    model = HfApiModel(model_id='https://pflgm2locj2t89co.us-east-1.aws.endpoints.huggingface.cloud/')
+    agent = initialize_agent(model)
+    result = agent.run(find_images_for_presentation_prompt + query)
+    return result
+# Gradio interface to show images
+def gradio_interface(query: str):
+    # Call the agent to run the query and return the image
+    image_path = run_agent(query)
+    # Return the image to Gradio for display
+    return image_path
+# Set up Gradio interface
+gr.Interface(
+    fn=gradio_interface,
+    inputs="text",  # Text input for the search query
+    outputs=gr.Image(),  # Image output to display the fetched image
+    title="Figure, Image & Logo Finder",
+    description="Enter a query to search for relevant images, logos, or figures for your presentation."
+).launch()