chatfed_orchestrator

Sleeping

App Files Files Community

ppsingh commited on Jul 15

Commit

fcc054f

verified ·

1 Parent(s): 1b0f717

Create app.py

Browse files

Files changed (1) hide show

app.py +231 -0

app.py ADDED Viewed

	@@ -0,0 +1,231 @@

+import gradio as gr
+from gradio_client import Client
+from langgraph.graph import StateGraph, START, END
+from typing import TypedDict, Optional
+import io
+from PIL import Image
+import os
+#OPEN QUESTION: SHOULD WE PASS ALL PARAMS FROM THE ORCHESTRATOR TO THE NODES INSTEAD OF SETTING IN EACH MODULE?
+HF_TOKEN = os.environ.get("HF_TOKEN")
+import configparser
+import logging
+import os
+import ast
+import re
+from dotenv import load_dotenv
+# Local .env file
+load_dotenv()
+def getconfig(configfile_path: str):
+    """
+    Read the config file
+    Params
+    ----------------
+    configfile_path: file path of .cfg file
+    """
+    config = configparser.ConfigParser()
+    try:
+        config.read_file(open(configfile_path))
+        return config
+    except:
+        logging.warning("config file not found")
+def get_auth(provider: str) -> dict:
+    """Get authentication configuration for different providers"""
+    auth_configs = {
+        "huggingface": {"api_key": os.getenv("HF_TOKEN")},
+        "qdrant": {"api_key": os.getenv("QDRANT_API_KEY")},
+    }
+    provider = provider.lower()  # Normalize to lowercase
+    if provider not in auth_configs:
+        raise ValueError(f"Unsupported provider: {provider}")
+    auth_config = auth_configs[provider]
+    api_key = auth_config.get("api_key")
+    if not api_key:
+        logging.warning(f"No API key found for provider '{provider}'. Please set the appropriate environment variable.")
+        auth_config["api_key"] = None
+    return auth_config
+# Define the state schema
+class GraphState(TypedDict):
+    query: str
+    context: str
+    result: str
+    # Add orchestrator-level parameters (addressing your open question)
+    reports_filter: str
+    sources_filter: str
+    subtype_filter: str
+    year_filter: str
+# node 2: retriever
+def retrieve_node(state: GraphState) -> GraphState:
+    client = Client("giz/chatfed_retriever", hf_token=HF_TOKEN)  # HF repo name
+    context = client.predict(
+        query=state["query"],
+        reports_filter=state.get("reports_filter", ""),
+        sources_filter=state.get("sources_filter", ""),
+        subtype_filter=state.get("subtype_filter", ""),
+        year_filter=state.get("year_filter", ""),
+        api_name="/retrieve"
+    )
+    return {"context": context}
+# node 3: generator
+def generate_node(state: GraphState) -> GraphState:
+    client = Client("giz/chatfed_generator", hf_token=HF_TOKEN)
+    result = client.predict(
+        query=state["query"],
+        context=state["context"],
+        api_name="/generate"
+    )
+    return {"result": result}
+# build the graph
+workflow = StateGraph(GraphState)
+# Add nodes
+workflow.add_node("retrieve", retrieve_node)
+workflow.add_node("generate", generate_node)
+# Add edges
+workflow.add_edge(START, "retrieve")
+workflow.add_edge("retrieve", "generate")
+workflow.add_edge("generate", END)
+# Compile the graph
+graph = workflow.compile()
+# Single tool for processing queries
+def process_query(
+    query: str,
+    reports_filter: str = "",
+    sources_filter: str = "",
+    subtype_filter: str = "",
+    year_filter: str = ""
+) -> str:
+    """
+    Execute the ChatFed orchestration pipeline to process a user query.
+    This function orchestrates a two-step workflow:
+    1. Retrieve relevant context using the ChatFed retriever service with optional filters
+    2. Generate a response using the ChatFed generator service with the retrieved context
+    Args:
+        query (str): The user's input query/question to be processed
+        reports_filter (str, optional): Filter for specific report types. Defaults to "".
+        sources_filter (str, optional): Filter for specific data sources. Defaults to "".
+        subtype_filter (str, optional): Filter for document subtypes. Defaults to "".
+        year_filter (str, optional): Filter for specific years. Defaults to "".
+    Returns:
+        str: The generated response from the ChatFed generator service
+    """
+    initial_state = {
+        "query": query,
+        "context": "",
+        "result": "",
+        "reports_filter": reports_filter or "",
+        "sources_filter": sources_filter or "",
+        "subtype_filter": subtype_filter or "",
+        "year_filter": year_filter or ""
+    }
+    final_state = graph.invoke(initial_state)
+    return final_state["result"]
+# Simple testing interface
+ui = gr.Interface(
+    fn=process_query,
+    inputs=gr.Textbox(lines=2, placeholder="Enter query here"),
+    outputs="text",
+    flagging_mode="never"
+)
+# Add a function to generate the graph visualization
+def get_graph_visualization():
+    """Generate and return the LangGraph workflow visualization as a PIL Image."""
+    # Generate the graph as PNG bytes
+    graph_png_bytes = graph.get_graph().draw_mermaid_png()
+    # Convert bytes to PIL Image for Gradio display
+    graph_image = Image.open(io.BytesIO(graph_png_bytes))
+    return graph_image
+# Guidance for ChatUI - can be removed later. Questionable whether front end even necessary. Maybe nice to show the graph.
+with gr.Blocks(title="ChatFed Orchestrator") as demo:
+    gr.Markdown("# ChatFed Orchestrator")
+    gr.Markdown("This LangGraph server exposes MCP endpoints for the ChatUI module to call (which triggers the graph).")
+    with gr.Row():
+        # Left column - Graph visualization
+        with gr.Column(scale=1):
+            gr.Markdown("**Workflow Visualization**")
+            graph_display = gr.Image(
+                value=get_graph_visualization(),
+                label="LangGraph Workflow",
+                interactive=False,
+                height=300
+            )
+            # Add a refresh button for the graph
+            refresh_graph_btn = gr.Button("🔄 Refresh Graph", size="sm")
+            refresh_graph_btn.click(
+                fn=get_graph_visualization,
+                outputs=graph_display
+            )
+        # Right column - Interface and documentation
+        with gr.Column(scale=2):
+            gr.Markdown("**Available MCP Tools:**")
+            with gr.Accordion("MCP Endpoint Information", open=True):
+                gr.Markdown(f"""
+                **MCP Server Endpoint:** https://giz-chatfed-orchestrator.hf.space/gradio_api/mcp/sse
+                **For ChatUI Integration:**
+                ```python
+                from gradio_client import Client
+                # Connect to orchestrator
+                orchestrator_client = Client("https://giz-chatfed-orchestrator.hf.space")
+                # Basic usage (no filters)
+                response = orchestrator_client.predict(
+                    query="query",
+                    api_name="/process_query"
+                )
+                # Advanced usage with any combination of filters
+                response = orchestrator_client.predict(
+                    query="query",
+                    reports_filter="annual_reports",
+                    sources_filter="internal",
+                    year_filter="2024",
+                    api_name="/process_query"
+                )
+                ```
+                """)
+    with gr.Accordion("Quick Testing Interface", open=True):
+        ui.render()
+if __name__ == "__main__":
+    demo.launch(
+        server_name="0.0.0.0",
+        server_port=7860,
+        mcp_server=True,
+        show_error=True
+    )