Spaces:

mozilla-ai
/

surf-spot-finder

Running

App Files Files Community

github-actions[bot] committed 24 days ago

Commit

178738b

1 Parent(s): 89845e5

Sync with https://github.com/mozilla-ai/surf-spot-finder

Browse files

Files changed (3) hide show

components/agent_status.py +47 -0
constants.py +5 -5
services/agent.py +63 -19

components/agent_status.py ADDED Viewed

	@@ -0,0 +1,47 @@

+from any_agent import AnyAgent
+from opentelemetry.sdk.trace.export import SimpleSpanProcessor
+from collections.abc import Sequence
+from typing import TYPE_CHECKING, Callable
+from opentelemetry.sdk.trace.export import (
+    SpanExporter,
+    SpanExportResult,
+)
+from any_agent import AgentFramework
+from any_agent.tracing import TracingProcessor
+from any_agent.tracing.trace import AgentSpan
+if TYPE_CHECKING:
+    from opentelemetry.sdk.trace import ReadableSpan
+class StreamlitExporter(SpanExporter):  # span exporter that forwards each exported span to a caller-supplied callback
+    """Build an `AgentTrace` and export to the different outputs."""  # NOTE(review): export() below builds no AgentTrace; it converts spans one by one and calls `callback`
+    def __init__(  # noqa: D107
+        self, agent_framework: AgentFramework, callback: Callable
+    ):
+        self.agent_framework = agent_framework
+        self.processor: TracingProcessor | None = TracingProcessor.create(  # may be None per the annotation; export() then forwards nothing
+            agent_framework
+        )
+        self.callback = callback  # called once per exported span with the converted AgentSpan
+    def export(self, spans: Sequence["ReadableSpan"]) -> SpanExportResult:  # noqa: D102
+        if not self.processor:  # processor is falsy (e.g. None): skip the callback but still report success
+            return SpanExportResult.SUCCESS
+        for readable_span in spans:
+            # Convert the span to an AgentSpan and hand it to the callback (no per-run filtering is done here)
+            span = AgentSpan.from_readable_span(readable_span)
+            self.callback(span)
+        return SpanExportResult.SUCCESS  # success is returned on every non-raising path
+def export_logs(agent: AnyAgent, callback: Callable) -> None:  # attach a span processor so `callback` receives the agent's spans
+    exporter = StreamlitExporter(agent.framework, callback)
+    span_processor = SimpleSpanProcessor(exporter)  # presumably hands each span to the exporter as it ends — confirm against the OTel SDK docs
+    agent._tracer_provider.add_span_processor(span_processor)  # NOTE(review): relies on a private AnyAgent attribute; every call adds one more processor

constants.py CHANGED Viewed

@@ -31,7 +31,11 @@ DEFAULT_EVALUATION_CASE = EvaluationCase(
             "points": 1,
         },
         {
-            "criteria": "Check if the agent gathered wind and wave forecasts for each surf spot being evaluated.",
             "points": 1,
         },
         {
@@ -50,10 +54,6 @@ DEFAULT_EVALUATION_CASE = EvaluationCase(
             "criteria": "Check if the final answer includes information about some alternative surf spots if the user is not satisfied with the chosen one",
             "points": 1,
         },
-        {
-            "criteria": "Check that the agent completed in fewer than 10 calls",
-            "points": 1,
-        },
     ],
 )

             "points": 1,
         },
         {
+            "criteria": "Check if the agent gathered wind forecasts for each surf spot being evaluated.",
+            "points": 1,
+        },
+        {
+            "criteria": "Check if the agent gathered wave forecasts for each surf spot being evaluated.",
             "points": 1,
         },
         {
             "criteria": "Check if the final answer includes information about some alternative surf spots if the user is not satisfied with the chosen one",
             "points": 1,
         },
     ],
 )

services/agent.py CHANGED Viewed

@@ -1,11 +1,12 @@
 import json
 from components.inputs import UserInputs
 from constants import DEFAULT_TOOLS
 import streamlit as st
 import time
 from surf_spot_finder.config import Config
 from any_agent import AgentConfig, AnyAgent, TracingConfig, AgentFramework
-from any_agent.tracing.trace import AgentTrace, TotalTokenUseAndCost
 from any_agent.tracing.otel_types import StatusCode
 from any_agent.evaluation import evaluate, TraceEvaluationResult
@@ -102,18 +103,6 @@ async def configure_agent(user_inputs: UserInputs) -> tuple[AnyAgent, Config]:
 async def display_output(agent_trace: AgentTrace, execution_time: float):
-    cost: TotalTokenUseAndCost = agent_trace.get_total_cost()
-    with st.expander("### 🏄 Results", expanded=True):
-        time_col, cost_col, tokens_col = st.columns(3)
-        with time_col:
-            st.info(f"⏱️ Execution Time: {execution_time:.2f} seconds")
-        with cost_col:
-            st.info(f"💰 Estimated Cost: ${cost.total_cost:.6f}")
-        with tokens_col:
-            st.info(f"📦 Total Tokens: {cost.total_tokens:,}")
-        st.markdown("#### Final Output")
-        st.info(agent_trace.final_output)
     # Display the agent trace in a more organized way
     with st.expander("### 🧩 Agent Trace"):
         for span in agent_trace.spans:
@@ -150,6 +139,18 @@ async def display_output(agent_trace: AgentTrace, execution_time: float):
                     unsafe_allow_html=True,
                 )
 async def run_agent(agent, config) -> tuple[AgentTrace, float]:
     st.markdown("#### 🔍 Running Surf Spot Finder with query")
@@ -178,11 +179,54 @@ async def run_agent(agent, config) -> tuple[AgentTrace, float]:
         kwargs["run_config"] = RunConfig(max_llm_calls=20)
-    start_time = time.time()
-    with st.spinner("🤔 Analyzing surf spots..."):
         agent_trace: AgentTrace = await agent.run_async(query, **kwargs)
-        agent.exit()
-    end_time = time.time()
-    execution_time = end_time - start_time
-    return agent_trace, execution_time

 import json
 from components.inputs import UserInputs
 from constants import DEFAULT_TOOLS
+from components.agent_status import export_logs
 import streamlit as st
 import time
 from surf_spot_finder.config import Config
 from any_agent import AgentConfig, AnyAgent, TracingConfig, AgentFramework
+from any_agent.tracing.trace import AgentTrace, TotalTokenUseAndCost, AgentSpan
 from any_agent.tracing.otel_types import StatusCode
 from any_agent.evaluation import evaluate, TraceEvaluationResult
 async def display_output(agent_trace: AgentTrace, execution_time: float):
     # Display the agent trace in a more organized way
     with st.expander("### 🧩 Agent Trace"):
         for span in agent_trace.spans:
                     unsafe_allow_html=True,
                 )
+    cost: TotalTokenUseAndCost = agent_trace.get_total_cost()
+    with st.expander("### 🏄 Results", expanded=True):
+        time_col, cost_col, tokens_col = st.columns(3)
+        with time_col:
+            st.info(f"⏱️ Execution Time: {execution_time:.2f} seconds")
+        with cost_col:
+            st.info(f"💰 Estimated Cost: ${cost.total_cost:.6f}")
+        with tokens_col:
+            st.info(f"📦 Total Tokens: {cost.total_tokens:,}")
+        st.markdown("#### Final Output")
+        st.info(agent_trace.final_output)
 async def run_agent(agent, config) -> tuple[AgentTrace, float]:
     st.markdown("#### 🔍 Running Surf Spot Finder with query")
         kwargs["run_config"] = RunConfig(max_llm_calls=20)
+    with st.status("Agent is running...", expanded=False, state="running") as status:
+        def update_span(span: AgentSpan):  # span callback: summarise one span into the status widget's label
+            # Process input value
+            input_value = span.attributes.get("input.value", "")
+            if input_value:
+                try:
+                    parsed_input = json.loads(input_value)
+                    if isinstance(parsed_input, list) and len(parsed_input) > 0:
+                        input_value = str(parsed_input[-1])  # for a non-empty JSON list, show only its last element
+                except Exception:  # best effort: on any failure the raw value is kept as-is
+                    pass
+            # Process output value
+            output_value = span.attributes.get("output.value", "")
+            if output_value:
+                try:
+                    parsed_output = json.loads(output_value)
+                    if isinstance(parsed_output, list) and len(parsed_output) > 0:
+                        output_value = str(parsed_output[-1])  # same last-element rule as for the input
+                except Exception:  # best effort: on any failure the raw value is kept as-is
+                    pass
+            # Truncate long values
+            max_length = 800
+            if len(input_value) > max_length:
+                input_value = f"[Truncated]...{input_value[-max_length:]}"  # keeps the LAST max_length characters, not the first
+            if len(output_value) > max_length:
+                output_value = f"[Truncated]...{output_value[-max_length:]}"  # keeps the LAST max_length characters, not the first
+            # Create a cleaner message format
+            if input_value or output_value:
+                message = f"Step: {span.name}\n"
+                if input_value:
+                    message += f"Input: {input_value}\n"
+                if output_value:
+                    message += f"Output: {output_value}"
+            else:
+                message = f"Step: {span.name}\n{span}"  # nothing to show: fall back to the span's own string form
+            status.update(label=message, expanded=False, state="running")  # `status` is bound by the enclosing `with st.status(...)`
+        export_logs(agent, update_span)
+        start_time = time.time()
         agent_trace: AgentTrace = await agent.run_async(query, **kwargs)
+        status.update(label="Finished!", expanded=False, state="complete")
+        end_time = time.time()
+        agent.exit()
+        execution_time = end_time - start_time
+        return agent_trace, execution_time