KI-Konzil/backend/tests/test_god_mode.py
Claude 001649a364
Implement Phase 4: tools, God Mode, and missing features
Backend:
- Add Tavily web search tool wrapper (tools/web_search.py)
- Add PDF reader + ChromaDB vector store tool (tools/pdf_reader.py)
- Bind tools to LLM calls via .bind_tools() in dynamic_graph_builder
- Implement God Mode using LangGraph interrupt_before + MemorySaver
- Add approve/reject/modify API endpoints for God Mode
- Add PDF upload endpoint with ingestion pipeline
- Add persistent run history (CouncilRun model + run_service + API)
- Add Alembic migration for council_runs table
- Enhance WebSocket to emit run_paused and run_resumed events
- Add tests for tools, God Mode, and run history

Frontend:
- Add God Mode approval UI (GodModePanel component)
- Add Auto-Pilot / God Mode toggle in Konferenzzimmer
- Add functional PDF upload handler
- Add Conditional Edge editor (EdgeSettingsPanel component)
- Add edge click selection in ArchitectCanvas
- Update Zustand store with edge selection and update actions
- Update types for God Mode, execution modes, and WS events
- Update API client with God Mode, PDF upload, and blueprint run endpoints
- Update WebSocket hook for paused/resumed events
- Add Vitest config and frontend tests (store, parser, types, API)

https://claude.ai/code/session_017U6idFgaqnYTXzPxA7mxMv
2026-02-21 10:53:12 +00:00

192 lines
6.5 KiB
Python

"""
Tests for God Mode (interrupt_before) functionality.
All LLM calls are mocked — no real API calls are made in these tests.
"""
import sys
import os
sys.path.insert(0, os.path.join(os.path.dirname(__file__), ".."))
import pytest
from unittest.mock import patch, MagicMock
from state import CouncilState
class TestBuildGraphGodMode:
    """Tests for graph compilation with and without god mode (interrupt_before)."""

    def _make_simple_blueprint(self):
        """Return a minimal blueprint: two tool-less nodes joined by one linear edge."""
        return {
            "version": 1,
            "name": "Test Council",
            "nodes": [
                {
                    "id": "master",
                    "label": "Master AI",
                    "systemPrompt": "You are the master writer.",
                    "model": "claude-3-5-sonnet",
                    "tools": {"webSearch": False, "pdfReader": False},
                },
                {
                    "id": "critic",
                    "label": "Critic AI",
                    "systemPrompt": "You are a critic who evaluates and scores drafts.",
                    "model": "claude-3-5-sonnet",
                    "tools": {"webSearch": False, "pdfReader": False},
                },
            ],
            "edges": [
                {"id": "e1", "source": "master", "target": "critic", "type": "linear"},
            ],
        }

    @patch("services.dynamic_graph_builder._get_llm")
    def test_build_graph_with_god_mode_compiles(self, mock_get_llm):
        """God mode graph should compile without error."""
        from services.dynamic_graph_builder import build_graph_from_blueprint

        blueprint = self._make_simple_blueprint()
        # This test must request god mode explicitly; with god_mode=False it
        # would only repeat the non-god-mode test below and never exercise
        # the god mode compilation path.
        graph = build_graph_from_blueprint(blueprint, god_mode=True)
        assert graph is not None

    @patch("services.dynamic_graph_builder._get_llm")
    def test_build_graph_without_god_mode(self, mock_get_llm):
        """Normal graph should compile without interrupt_before."""
        from services.dynamic_graph_builder import build_graph_from_blueprint

        # _get_llm is patched here as well so that neither compile test can
        # construct a real LLM client (the module promises no real API calls).
        blueprint = self._make_simple_blueprint()
        graph = build_graph_from_blueprint(blueprint, god_mode=False)
        assert graph is not None
class TestGodModeSessionManagement:
    """Tests for god mode session management functions."""

    def test_get_god_mode_state_returns_none_for_unknown_run(self):
        """Looking up the state of a run id that was never registered gives None."""
        from services.dynamic_graph_builder import get_god_mode_state

        result = get_god_mode_state("nonexistent-run-id")
        assert result is None

    @pytest.mark.asyncio
    async def test_resume_god_mode_returns_none_for_unknown_run(self):
        """Resuming a run id that was never registered gives None."""
        from services.dynamic_graph_builder import resume_god_mode

        result = await resume_god_mode("nonexistent-run-id", action="approve")
        assert result is None

    @pytest.mark.asyncio
    async def test_resume_god_mode_reject_cleans_up(self):
        """Rejecting a paused run returns None and removes its session entry."""
        from services.dynamic_graph_builder import (
            _god_mode_sessions,
            resume_god_mode,
        )

        # Manually insert a fake session
        _god_mode_sessions["test-run"] = {
            "graph": MagicMock(),
            "checkpointer": MagicMock(),
            "thread_config": {"configurable": {"thread_id": "test-run"}},
        }
        try:
            result = await resume_god_mode("test-run", action="reject")
            assert result is None
            assert "test-run" not in _god_mode_sessions
        finally:
            # _god_mode_sessions is module-level state shared by every test in
            # the process; drop the fake entry even when an assertion above
            # fails so it cannot leak into later tests.
            _god_mode_sessions.pop("test-run", None)
class TestToolResolution:
    """Checks which tools `_resolve_tools` produces for a node's tool config."""

    @staticmethod
    def _resolve(config):
        """Import `_resolve_tools` lazily (inside the running test) and apply it."""
        from services.dynamic_graph_builder import _resolve_tools

        return _resolve_tools(config)

    def test_resolve_tools_none_config(self):
        """A missing (None) config resolves to no tools."""
        assert self._resolve(None) == []

    def test_resolve_tools_empty_config(self):
        """An empty config dict resolves to no tools."""
        assert self._resolve({}) == []

    def test_resolve_tools_web_search_only(self):
        """Only the web search flag set -> exactly the web_search tool."""
        resolved = self._resolve({"webSearch": True, "pdfReader": False})
        assert [tool.name for tool in resolved] == ["web_search"]

    def test_resolve_tools_pdf_only(self):
        """Only the PDF reader flag set -> exactly the pdf_search tool."""
        resolved = self._resolve({"webSearch": False, "pdfReader": True})
        assert [tool.name for tool in resolved] == ["pdf_search"]

    def test_resolve_tools_both(self):
        """Both flags set -> both tools, in any order."""
        resolved = self._resolve({"webSearch": True, "pdfReader": True})
        # Sorting makes the comparison order-independent while still
        # requiring exactly two entries.
        assert sorted(tool.name for tool in resolved) == ["pdf_search", "web_search"]
class TestInvokeWithTools:
    """Exercises the `_invoke_with_tools` helper against mocked LLMs and tools."""

    def test_invoke_without_tools_calls_llm_directly(self):
        """With an empty tool list the LLM itself is invoked once with the messages."""
        from services.dynamic_graph_builder import _invoke_with_tools

        reply = MagicMock(content="Test response")
        llm = MagicMock()
        llm.invoke.return_value = reply

        outcome = _invoke_with_tools(llm, ["msg1", "msg2"], [])

        llm.invoke.assert_called_once_with(["msg1", "msg2"])
        assert outcome == reply

    def test_invoke_with_tools_no_tool_calls(self):
        """A tool-bound reply that requests no tool calls is returned as-is."""
        from services.dynamic_graph_builder import _invoke_with_tools

        reply = MagicMock(tool_calls=[], content="No tools needed")
        bound_llm = MagicMock()
        bound_llm.invoke.return_value = reply
        llm = MagicMock()
        llm.bind_tools.return_value = bound_llm

        # `name` has to be assigned after construction: MagicMock(name=...)
        # names the mock object itself instead of setting a `.name` attribute.
        tool = MagicMock()
        tool.name = "test_tool"

        outcome = _invoke_with_tools(llm, ["msg"], [tool])

        assert outcome == reply

    def test_invoke_with_tools_executes_tool_calls(self):
        """A requested tool call is executed once and the follow-up reply is returned."""
        from services.dynamic_graph_builder import _invoke_with_tools

        # First reply from the bound LLM asks for a tool call ...
        tool_request = MagicMock()
        tool_request.tool_calls = [
            {"name": "web_search", "args": {"query": "test"}, "id": "call-1"}
        ]
        # ... and the second reply carries the final answer.
        final_reply = MagicMock(content="Final answer")

        bound_llm = MagicMock()
        bound_llm.invoke.side_effect = [tool_request, final_reply]
        llm = MagicMock()
        llm.bind_tools.return_value = bound_llm

        search_tool = MagicMock()
        search_tool.name = "web_search"
        search_tool.invoke.return_value = "Search results"

        outcome = _invoke_with_tools(llm, ["msg"], [search_tool])

        search_tool.invoke.assert_called_once_with({"query": "test"})
        assert outcome == final_reply