Implement Phase 4: tools, God Mode, and missing features

Backend: - Add Tavily web search tool wrapper (tools/web_search.py) - Add PDF reader + ChromaDB vector store tool (tools/pdf_reader.py) - Bind tools to LLM calls via .bind_tools() in dynamic_graph_builder - Implement God Mode using LangGraph interrupt_before + MemorySaver - Add approve/reject/modify API endpoints for God Mode - Add PDF upload endpoint with ingestion pipeline - Add persistent run history (CouncilRun model + run_service + API) - Add Alembic migration for council_runs table - Enhance WebSocket to emit run_paused and run_resumed events - Add tests for tools, God Mode, and run history Frontend: - Add God Mode approval UI (GodModePanel component) - Add Auto-Pilot / God Mode toggle in Konferenzzimmer - Add functional PDF upload handler - Add Conditional Edge editor (EdgeSettingsPanel component) - Add edge click selection in ArchitectCanvas - Update Zustand store with edge selection and update actions - Update types for God Mode, execution modes, and WS events - Update API client with God Mode, PDF upload, and blueprint run endpoints - Update WebSocket hook for paused/resumed events - Add Vitest config and frontend tests (store, parser, types, API) https://claude.ai/code/session_017U6idFgaqnYTXzPxA7mxMv
2026-02-21 10:53:12 +00:00 · 2026-02-21 10:53:12 +00:00 · 001649a364
commit 001649a364
parent c6d0c4a636
31 changed files with 2502 additions and 81 deletions
--- a/backend/services/dynamic_graph_builder.py
+++ b/backend/services/dynamic_graph_builder.py
@ -5,6 +5,11 @@ This is the Phase 3 replacement for the hard-coded graph in graph_builder.py.
 It reads a CouncilBlueprint JSON (as produced by the frontend parser) and
 dynamically constructs the LangGraph StateGraph with the correct nodes,
 edges, and conditional routing.
+
+Phase 4 additions:
+- Tool binding: agents with tools enabled (webSearch, pdfReader) get
+  LangChain tools bound to their LLM via .bind_tools().
+- God Mode: supports interrupt_before for human-in-the-loop approval.
 """

 import asyncio
@ -17,6 +22,8 @@ from langchain_openai import ChatOpenAI
 from langgraph.graph import END, StateGraph

 from state import CouncilState, APPROVAL_THRESHOLD, MAX_ITERATIONS
+from tools.web_search import web_search
+from tools.pdf_reader import pdf_search


 # ---------------------------------------------------------------------------
@ -50,6 +57,78 @@ def _get_llm(model_name: str) -> Any:
    return factory()


+# ---------------------------------------------------------------------------
+# Tool resolution
+# ---------------------------------------------------------------------------
+
+def _resolve_tools(tools_config: Optional[dict]) -> list:
+    """
+    Resolve a node's tools config to a list of LangChain tool objects.
+
+    Args:
+        tools_config: Dict like {"webSearch": true, "pdfReader": true}
+
+    Returns:
+        A list of LangChain tool objects to bind to the LLM.
+    """
+    if not tools_config:
+        return []
+
+    resolved = []
+    if tools_config.get("webSearch"):
+        resolved.append(web_search)
+    if tools_config.get("pdfReader"):
+        resolved.append(pdf_search)
+    return resolved
+
+
+def _invoke_with_tools(llm: Any, messages: list, tools: list) -> Any:
+    """
+    Invoke an LLM, optionally with tools bound. If the LLM returns tool
+    calls, execute them and feed results back for a final answer.
+
+    Args:
+        llm: A LangChain chat model instance.
+        messages: The message list to send.
+        tools: List of LangChain tools (may be empty).
+
+    Returns:
+        The final LLM response message.
+    """
+    if not tools:
+        return llm.invoke(messages)
+
+    llm_with_tools = llm.bind_tools(tools)
+    response = llm_with_tools.invoke(messages)
+
+    # If no tool calls, return directly
+    if not response.tool_calls:
+        return response
+
+    # Execute tool calls and collect results
+    from langchain_core.messages import ToolMessage
+
+    tool_map = {t.name: t for t in tools}
+    tool_messages = [response]
+
+    for tc in response.tool_calls:
+        tool_fn = tool_map.get(tc["name"])
+        if tool_fn:
+            try:
+                result = tool_fn.invoke(tc["args"])
+            except Exception as exc:  # noqa: BLE001
+                result = f"[Tool Error] {exc}"
+        else:
+            result = f"[Tool Error] Unknown tool: {tc['name']}"
+
+        tool_messages.append(
+            ToolMessage(content=str(result), tool_call_id=tc["id"])
+        )
+
+    # Final LLM call with tool results
+    return llm_with_tools.invoke(messages + tool_messages)
+
+
 # ---------------------------------------------------------------------------
 # Generic agent node factory
 # ---------------------------------------------------------------------------
@ -59,6 +138,7 @@ def _make_agent_node(
    label: str,
    system_prompt: str,
    model_name: str,
+    tools_config: Optional[dict] = None,
 ) -> Callable[[CouncilState], dict]:
    """
    Create a LangGraph node function for a user-defined agent.
@ -71,10 +151,12 @@ def _make_agent_node(
        label:         Display name of the agent (used in prompts).
        system_prompt: The persona / role definition for this agent.
        model_name:    Which LLM to use ("claude-3-5-sonnet" | "gpt-4o").
+        tools_config:  Optional dict like {"webSearch": true, "pdfReader": true}.

    Returns:
        A callable (CouncilState) -> dict suitable for StateGraph.add_node().
    """
+    node_tools = _resolve_tools(tools_config)

    def agent_node(state: CouncilState) -> dict:
        llm = _get_llm(model_name)
@ -105,7 +187,7 @@ def _make_agent_node(

        system_msg = SystemMessage(content=system_prompt)
        user_msg = HumanMessage(content=user_content)
-        response = llm.invoke([system_msg, user_msg])
+        response = _invoke_with_tools(llm, [system_msg, user_msg], node_tools)

        return {
            "current_draft": response.content,
@ -177,6 +259,7 @@ def _make_critic_node(
    label: str,
    system_prompt: str,
    model_name: str,
+    tools_config: Optional[dict] = None,
 ) -> Callable[[CouncilState], dict]:
    """
    Create a critic-style node that scores and routes.
@ -186,6 +269,8 @@ def _make_critic_node(
    """
    import re

+    node_tools = _resolve_tools(tools_config)
+
    critic_system = (
        system_prompt + "\n\n"
        "IMPORTANT: You must respond in EXACTLY this format:\n\n"
@ -219,7 +304,7 @@ def _make_critic_node(
            )
        )

-        response = llm.invoke([system_msg, user_msg])
+        response = _invoke_with_tools(llm, [system_msg, user_msg], node_tools)

        # Parse structured response
        score_match = re.search(r"SCORE:\s*(\d+(?:\.\d+)?)", response.content)
@ -251,7 +336,10 @@ def _make_critic_node(
 # Main: build graph from blueprint JSON
 # ---------------------------------------------------------------------------

-def build_graph_from_blueprint(blueprint: dict) -> Any:
+def build_graph_from_blueprint(
+    blueprint: dict,
+    god_mode: bool = False,
+) -> Any:
    """
    Dynamically construct a compiled LangGraph from a CouncilBlueprint JSON.

@ -263,6 +351,8 @@ def build_graph_from_blueprint(blueprint: dict) -> Any:
                "nodes": [{"id", "label", "systemPrompt", "model", "tools", "position"}],
                "edges": [{"id", "source", "target", "type", "condition?"}]
            }
+        god_mode: If True, compile with interrupt_before on all nodes so the
+                  user can approve/reject at each step (Human-in-the-Loop).

    Returns:
        A compiled LangGraph StateGraph ready for invocation.
@ -295,16 +385,23 @@ def build_graph_from_blueprint(blueprint: dict) -> Any:
    graph = StateGraph(CouncilState)

    # Register all nodes
+    all_node_ids = []
    for node in nodes:
        nid = node["id"]
+        all_node_ids.append(nid)
        label = node.get("label", nid)
        system_prompt = node.get("systemPrompt", f"You are {label}.")
        model_name = node.get("model", "claude-3-5-sonnet")
+        tools_config = node.get("tools")

        if _is_critic_like(system_prompt):
-            node_fn = _make_critic_node(nid, label, system_prompt, model_name)
+            node_fn = _make_critic_node(
+                nid, label, system_prompt, model_name, tools_config
+            )
        else:
-            node_fn = _make_agent_node(nid, label, system_prompt, model_name)
+            node_fn = _make_agent_node(
+                nid, label, system_prompt, model_name, tools_config
+            )

        graph.add_node(nid, node_fn)

@ -349,6 +446,10 @@ def build_graph_from_blueprint(blueprint: dict) -> Any:
        if tid not in edges_by_source:
            graph.add_edge(tid, END)

+    # God Mode: interrupt before every node so the user can approve/reject
+    if god_mode:
+        return graph.compile(interrupt_before=all_node_ids)
+
    return graph.compile()


@ -356,20 +457,65 @@ async def run_blueprint_council_async(
    blueprint: dict,
    input_topic: str,
    run_id: str,
+    god_mode: bool = False,
    on_node_event: Optional[Callable[[str, str], Any]] = None,
 ) -> CouncilState:
    """
    Execute a council run using a dynamically built graph from a blueprint.

+    In auto-pilot mode, the graph runs to completion.
+    In god mode, the graph pauses before each node via interrupt_before,
+    allowing human approval through the resume mechanism.
+
    Args:
        blueprint:     The CouncilBlueprint JSON dict.
        input_topic:   The user's prompt.
        run_id:        Unique identifier for this run.
+        god_mode:      If True, pause before each node for human approval.
        on_node_event: Optional callback for WebSocket node events.

    Returns:
        The final CouncilState after execution completes.
    """
+    from langgraph.checkpoint.memory import MemorySaver
+
+    if god_mode:
+        checkpointer = MemorySaver()
+        nodes_list = blueprint.get("nodes", [])
+        all_node_ids = [n["id"] for n in nodes_list]
+        compiled_graph = _build_graph_with_checkpointer(
+            blueprint, checkpointer, all_node_ids
+        )
+
+        initial_state = CouncilState(
+            input_topic=input_topic,
+            current_draft="",
+            feedback_history=[],
+            route_decision="",
+            messages=[],
+            iteration_count=0,
+            critic_score=None,
+            run_id=run_id,
+            active_node="",
+        )
+
+        thread_config = {"configurable": {"thread_id": run_id}}
+
+        loop = asyncio.get_event_loop()
+        state = await loop.run_in_executor(
+            None,
+            lambda: compiled_graph.invoke(initial_state, config=thread_config),
+        )
+
+        # Store the graph and checkpointer for later resume
+        _god_mode_sessions[run_id] = {
+            "graph": compiled_graph,
+            "checkpointer": checkpointer,
+            "thread_config": thread_config,
+        }
+
+        return state
+
    compiled_graph = build_graph_from_blueprint(blueprint)

    initial_state = CouncilState(
@ -391,3 +537,153 @@ async def run_blueprint_council_async(
    )

    return final_state
+
+
+# ---------------------------------------------------------------------------
+# God Mode session management
+# ---------------------------------------------------------------------------
+
+# In-memory store for active god mode sessions (graph + checkpointer)
+_god_mode_sessions: Dict[str, dict] = {}
+
+
+def _build_graph_with_checkpointer(
+    blueprint: dict,
+    checkpointer: Any,
+    interrupt_node_ids: List[str],
+) -> Any:
+    """Build a compiled graph with a checkpointer for god mode."""
+    nodes = blueprint.get("nodes", [])
+    edges = blueprint.get("edges", [])
+
+    if not nodes:
+        raise ValueError("Blueprint has no nodes.")
+
+    node_lookup = {n["id"]: n for n in nodes}
+    targets = {e["target"] for e in edges}
+    entry_candidates = [n["id"] for n in nodes if n["id"] not in targets]
+    if not entry_candidates:
+        entry_candidates = [nodes[0]["id"]]
+    entry_node_id = entry_candidates[0]
+
+    sources = {e["source"] for e in edges}
+    terminal_nodes = {n["id"] for n in nodes if n["id"] not in sources}
+
+    graph = StateGraph(CouncilState)
+
+    for node in nodes:
+        nid = node["id"]
+        label = node.get("label", nid)
+        system_prompt = node.get("systemPrompt", f"You are {label}.")
+        model_name = node.get("model", "claude-3-5-sonnet")
+        tools_config = node.get("tools")
+
+        if _is_critic_like(system_prompt):
+            node_fn = _make_critic_node(
+                nid, label, system_prompt, model_name, tools_config
+            )
+        else:
+            node_fn = _make_agent_node(
+                nid, label, system_prompt, model_name, tools_config
+            )
+
+        graph.add_node(nid, node_fn)
+
+    graph.set_entry_point(entry_node_id)
+
+    edges_by_source: Dict[str, Dict[str, list]] = {}
+    for edge in edges:
+        src = edge["source"]
+        if src not in edges_by_source:
+            edges_by_source[src] = {"linear": [], "conditional": []}
+        if edge.get("type") == "conditional":
+            edges_by_source[src]["conditional"].append(edge)
+        else:
+            edges_by_source[src]["linear"].append(edge)
+
+    for source_id, grouped in edges_by_source.items():
+        linear = grouped["linear"]
+        conditional = grouped["conditional"]
+
+        if conditional:
+            linear_target = linear[0]["target"] if linear else None
+            router = _make_conditional_router(source_id, conditional, linear_target)
+            route_map: Dict[str, str] = {}
+            for ce in conditional:
+                route_map[ce["target"]] = ce["target"]
+            if linear_target:
+                route_map[linear_target] = linear_target
+            graph.add_conditional_edges(source_id, router, route_map)
+        elif linear:
+            graph.add_edge(source_id, linear[0]["target"])
+
+    for tid in terminal_nodes:
+        if tid not in edges_by_source:
+            graph.add_edge(tid, END)
+
+    return graph.compile(
+        checkpointer=checkpointer,
+        interrupt_before=interrupt_node_ids,
+    )
+
+
+async def resume_god_mode(
+    run_id: str,
+    action: str = "approve",
+    modified_state: Optional[dict] = None,
+) -> Optional[CouncilState]:
+    """
+    Resume a paused god mode run after human approval.
+
+    Args:
+        run_id:         The run ID of the paused session.
+        action:         "approve" to continue, "reject" to stop.
+        modified_state: Optional partial state override (for "modify" action).
+
+    Returns:
+        The next CouncilState (may be another interrupt or final).
+        None if the run_id is not found.
+    """
+    session = _god_mode_sessions.get(run_id)
+    if not session:
+        return None
+
+    if action == "reject":
+        _god_mode_sessions.pop(run_id, None)
+        return None
+
+    compiled_graph = session["graph"]
+    thread_config = session["thread_config"]
+
+    if modified_state:
+        compiled_graph.update_state(thread_config, modified_state)
+
+    loop = asyncio.get_event_loop()
+    state = await loop.run_in_executor(
+        None,
+        lambda: compiled_graph.invoke(None, config=thread_config),
+    )
+
+    # If state indicates completion, clean up
+    if state and state.get("route_decision") == "done":
+        _god_mode_sessions.pop(run_id, None)
+
+    return state
+
+
+def get_god_mode_state(run_id: str) -> Optional[dict]:
+    """Get the current state of a paused god mode session."""
+    session = _god_mode_sessions.get(run_id)
+    if not session:
+        return None
+
+    graph = session["graph"]
+    thread_config = session["thread_config"]
+    snapshot = graph.get_state(thread_config)
+
+    return {
+        "run_id": run_id,
+        "paused": bool(snapshot.next),
+        "next_nodes": list(snapshot.next) if snapshot.next else [],
+        "current_state": dict(snapshot.values) if snapshot.values else {},
+    }