test(02-02): add failing tool registry and executor unit tests

- Tests for BUILTIN_TOOLS (4 tools present, correct fields, confirmation flags)
- Tests for get_tools_for_agent filtering and to_litellm_format conversion
- Tests for execute_tool: valid args, invalid args, unknown tool, confirmation flow
- Tests that the audit logger is called on every invocation
2026-03-23 14:51:42 -06:00
parent 4047b552a7
commit 420294b8fe
2 changed files with 434 additions and 0 deletions
--- a/tests/unit/test_tool_executor.py
+++ b/tests/unit/test_tool_executor.py
@@ -0,0 +1,285 @@
+"""
+Unit tests for the tool executor.
+
+Tests:
+  - Valid args pass schema validation and handler is called
+  - Invalid args are rejected before the handler is called
+  - Unknown tool name returns an error string instead of raising
+  - requires_confirmation=True returns confirmation message without executing
+  - audit_logger.log_tool_call is called on every invocation
+"""
+
+from __future__ import annotations
+
+import uuid
+from unittest.mock import AsyncMock, MagicMock, patch
+
+
+# ---------------------------------------------------------------------------
+# Helpers
+# ---------------------------------------------------------------------------
+
+
+def make_registry(requires_confirmation: bool = False, handler_return: str = "tool result") -> dict:
+    """Return a one-entry registry mapping "test_tool" to a stub ToolDefinition.
+
+    The stub's async handler ignores its arguments and returns ``handler_return``.
+    """
+    from orchestrator.tools.registry import ToolDefinition
+
+    async def stub_handler(**kwargs: object) -> str:
+        return handler_return
+
+    schema = {
+        "type": "object",
+        "properties": {"query": {"type": "string"}, "count": {"type": "integer"}},
+        "required": ["query"],
+    }
+    definition = ToolDefinition(
+        name="test_tool",
+        description="A test tool",
+        parameters=schema,
+        requires_confirmation=requires_confirmation,
+        handler=stub_handler,
+    )
+    return {"test_tool": definition}
+
+
+def make_audit_logger() -> MagicMock:
+    """Return a stand-in AuditLogger whose ``log_tool_call`` is an AsyncMock."""
+    # Passing the attribute as a keyword configures it on the new mock.
+    audit_double = MagicMock(log_tool_call=AsyncMock())
+    return audit_double
+
+
+# ---------------------------------------------------------------------------
+# Tests
+# ---------------------------------------------------------------------------
+
+
+class TestExecuteToolValidArgs:
+    """Schema-valid arguments: the handler result is returned and the call is audited."""
+
+    async def test_valid_args_returns_result(self):
+        """Schema-valid arguments reach the handler.
+
+        The string the handler returns must come back from execute_tool as-is.
+        """
+        from orchestrator.tools.executor import execute_tool
+
+        expected = "search results here"
+        function_spec = {
+            "name": "test_tool",
+            "arguments": '{"query": "hello world"}',
+        }
+
+        outcome = await execute_tool(
+            tool_call={"function": function_spec},
+            registry=make_registry(handler_return=expected),
+            tenant_id=uuid.uuid4(),
+            agent_id=uuid.uuid4(),
+            audit_logger=make_audit_logger(),
+        )
+
+        assert outcome == expected
+
+    async def test_audit_logger_called_on_success(self):
+        """A successful call is audited exactly once.
+
+        The logged keyword arguments carry the tool name and ``error=None``.
+        """
+        from orchestrator.tools.executor import execute_tool
+
+        audit = make_audit_logger()
+        function_spec = {
+            "name": "test_tool",
+            "arguments": '{"query": "test"}',
+        }
+
+        await execute_tool(
+            tool_call={"function": function_spec},
+            registry=make_registry(),
+            tenant_id=uuid.uuid4(),
+            agent_id=uuid.uuid4(),
+            audit_logger=audit,
+        )
+
+        audit.log_tool_call.assert_called_once()
+        logged = audit.log_tool_call.call_args.kwargs
+        assert logged["tool_name"] == "test_tool"
+        assert logged["error"] is None
+
+
+class TestExecuteToolInvalidArgs:
+    """Schema-violating arguments yield an error result and an audited error."""
+
+    async def test_missing_required_arg_returns_error(self):
+        """Omitting the required 'query' argument is reported in the result.
+
+        The returned text must mention "error", "invalid" or "required".
+        """
+        from orchestrator.tools.executor import execute_tool
+
+        # Only the optional 'count' is supplied.
+        function_spec = {
+            "name": "test_tool",
+            "arguments": '{"count": 5}',
+        }
+
+        outcome = await execute_tool(
+            tool_call={"function": function_spec},
+            registry=make_registry(),
+            tenant_id=uuid.uuid4(),
+            agent_id=uuid.uuid4(),
+            audit_logger=make_audit_logger(),
+        )
+
+        lowered = outcome.lower()
+        assert any(word in lowered for word in ("error", "invalid", "required"))
+
+    async def test_wrong_type_returns_error(self):
+        """A value of the wrong JSON type is reported in the result.
+
+        The returned text must mention "error" or "invalid".
+        """
+        from orchestrator.tools.executor import execute_tool
+
+        # 'count' is declared as an integer but arrives as a string.
+        function_spec = {
+            "name": "test_tool",
+            "arguments": '{"query": "hello", "count": "not_a_number"}',
+        }
+
+        outcome = await execute_tool(
+            tool_call={"function": function_spec},
+            registry=make_registry(),
+            tenant_id=uuid.uuid4(),
+            agent_id=uuid.uuid4(),
+            audit_logger=make_audit_logger(),
+        )
+
+        lowered = outcome.lower()
+        assert "error" in lowered or "invalid" in lowered
+
+    async def test_audit_logger_called_with_error_on_invalid_args(self):
+        """A rejected call is still audited exactly once.
+
+        The logged keyword arguments must carry a non-None ``error``.
+        """
+        from orchestrator.tools.executor import execute_tool
+
+        audit = make_audit_logger()
+        # An empty argument object omits the required 'query'.
+        function_spec = {
+            "name": "test_tool",
+            "arguments": '{}',
+        }
+
+        await execute_tool(
+            tool_call={"function": function_spec},
+            registry=make_registry(),
+            tenant_id=uuid.uuid4(),
+            agent_id=uuid.uuid4(),
+            audit_logger=audit,
+        )
+
+        audit.log_tool_call.assert_called_once()
+        assert audit.log_tool_call.call_args.kwargs["error"] is not None
+
+
+class TestExecuteToolUnknownTool:
+    """A tool name missing from the registry yields an error string."""
+
+    async def test_unknown_tool_returns_error(self):
+        """Calling a name absent from the registry is reported in the result.
+
+        The returned text must mention "unknown", "not found" or "error".
+        """
+        from orchestrator.tools.executor import execute_tool
+
+        function_spec = {
+            "name": "nonexistent_tool",
+            "arguments": "{}",
+        }
+
+        outcome = await execute_tool(
+            tool_call={"function": function_spec},
+            registry=make_registry(),
+            tenant_id=uuid.uuid4(),
+            agent_id=uuid.uuid4(),
+            audit_logger=make_audit_logger(),
+        )
+
+        lowered = outcome.lower()
+        assert any(word in lowered for word in ("unknown", "not found", "error"))
+
+
+class TestExecuteToolConfirmation:
+    """A tool flagged requires_confirmation=True yields a confirmation message, not a run."""
+
+    async def test_confirmation_required_returns_confirmation_message(self):
+        """The returned text must read as a confirmation request.
+
+        It has to mention "confirm", "permission" or "approval".
+        """
+        from orchestrator.tools.executor import execute_tool
+
+        function_spec = {
+            "name": "test_tool",
+            "arguments": '{"query": "confirm this"}',
+        }
+
+        outcome = await execute_tool(
+            tool_call={"function": function_spec},
+            registry=make_registry(requires_confirmation=True),
+            tenant_id=uuid.uuid4(),
+            agent_id=uuid.uuid4(),
+            audit_logger=make_audit_logger(),
+        )
+
+        # Should return a confirmation message, not the tool result
+        lowered = outcome.lower()
+        assert any(word in lowered for word in ("confirm", "permission", "approval"))
+
+    async def test_confirmation_required_does_not_call_handler(self):
+        """Handler must NOT be called when requires_confirmation=True."""
+        from orchestrator.tools.executor import execute_tool
+        from orchestrator.tools.registry import ToolDefinition
+
+        # Flipped by the handler below so any invocation is observable.
+        handler_called = False
+
+        async def tracking_handler(**kwargs: object) -> str:
+            nonlocal handler_called
+            handler_called = True
+            return "should not be called"
+
+        registry = {
+            "test_tool": ToolDefinition(
+                name="test_tool",
+                description="A test tool",
+                parameters={
+                    "type": "object",
+                    "properties": {"query": {"type": "string"}},
+                    "required": ["query"],
+                },
+                requires_confirmation=True,
+                handler=tracking_handler,
+            )
+        }
+
+        function_spec = {
+            "name": "test_tool",
+            "arguments": '{"query": "test"}',
+        }
+
+        # The return value is irrelevant here; only the handler side effect is checked.
+        await execute_tool(
+            tool_call={"function": function_spec},
+            registry=registry,
+            tenant_id=uuid.uuid4(),
+            agent_id=uuid.uuid4(),
+            audit_logger=make_audit_logger(),
+        )
+
+        assert not handler_called, "Handler should not be called when requires_confirmation=True"
--- a/tests/unit/test_tool_registry.py
+++ b/tests/unit/test_tool_registry.py
@@ -0,0 +1,149 @@
+"""
+Unit tests for the tool registry.
+
+Tests:
+  - BUILTIN_TOOLS contains all 4 expected tools
+  - get_tools_for_agent filters correctly based on agent.tool_assignments
+  - to_litellm_format produces valid OpenAI function-calling schema
+  - Built-in ToolDefinition entries carry the expected fields and confirmation flags
+"""
+
+from __future__ import annotations
+
+import uuid
+from unittest.mock import MagicMock
+
+
+# ---------------------------------------------------------------------------
+# Helpers
+# ---------------------------------------------------------------------------
+
+
+def make_agent(tool_list: list[str]) -> MagicMock:
+    """Return a MagicMock standing in for an Agent.
+
+    It gets a fresh random ``id`` and ``tool_assignments`` set to ``tool_list``.
+    """
+    return MagicMock(id=uuid.uuid4(), tool_assignments=tool_list)
+
+
+# ---------------------------------------------------------------------------
+# Tests
+# ---------------------------------------------------------------------------
+
+
+class TestBuiltinTools:
+    """BUILTIN_TOOLS exposes the four expected tools, each with well-formed fields and flags."""
+
+    def test_all_four_tools_present(self):
+        """Each of the four expected tool names is a key of BUILTIN_TOOLS."""
+        from orchestrator.tools.registry import BUILTIN_TOOLS
+
+        for tool_name in ("web_search", "kb_search", "http_request", "calendar_lookup"):
+            assert tool_name in BUILTIN_TOOLS
+
+    def test_tool_definitions_have_required_fields(self):
+        """Every entry is keyed by its own name and has a description, schema and handler."""
+        from orchestrator.tools.registry import BUILTIN_TOOLS
+
+        for name, spec in BUILTIN_TOOLS.items():
+            assert spec.name == name, f"Tool name mismatch for {name}"
+            assert spec.description, f"Tool {name} missing description"
+            assert isinstance(spec.parameters, dict), f"Tool {name} parameters must be dict"
+            assert "type" in spec.parameters, f"Tool {name} parameters missing 'type' key"
+            assert spec.handler is not None, f"Tool {name} has no handler"
+
+    def test_http_request_requires_confirmation(self):
+        """http_request has requires_confirmation set to True."""
+        from orchestrator.tools.registry import BUILTIN_TOOLS
+        assert BUILTIN_TOOLS["http_request"].requires_confirmation is True
+
+    def test_web_search_no_confirmation(self):
+        """web_search has requires_confirmation set to False."""
+        from orchestrator.tools.registry import BUILTIN_TOOLS
+        assert BUILTIN_TOOLS["web_search"].requires_confirmation is False
+
+    def test_kb_search_no_confirmation(self):
+        """kb_search has requires_confirmation set to False."""
+        from orchestrator.tools.registry import BUILTIN_TOOLS
+        assert BUILTIN_TOOLS["kb_search"].requires_confirmation is False
+
+    def test_calendar_lookup_no_confirmation(self):
+        """calendar_lookup has requires_confirmation set to False."""
+        from orchestrator.tools.registry import BUILTIN_TOOLS
+        assert BUILTIN_TOOLS["calendar_lookup"].requires_confirmation is False
+
+
+class TestGetToolsForAgent:
+    """get_tools_for_agent narrows BUILTIN_TOOLS to the names in agent.tool_assignments."""
+
+    def test_filters_to_assigned_tools(self):
+        """Only the tools named in tool_assignments are returned."""
+        from orchestrator.tools.registry import get_tools_for_agent
+
+        selected = get_tools_for_agent(make_agent(["web_search", "kb_search"]))
+
+        assert set(selected.keys()) == {"web_search", "kb_search"}
+
+    def test_empty_tool_list_returns_empty(self):
+        """An agent with no assigned tools gets an empty dict."""
+        from orchestrator.tools.registry import get_tools_for_agent
+
+        unassigned_agent = make_agent([])
+
+        assert get_tools_for_agent(unassigned_agent) == {}
+
+    def test_unknown_tools_ignored_silently(self):
+        """Assigned names that are not built-in tools are left out of the result."""
+        from orchestrator.tools.registry import get_tools_for_agent
+
+        mixed_agent = make_agent(["web_search", "nonexistent_tool"])
+        selected = get_tools_for_agent(mixed_agent)
+
+        assert "web_search" in selected
+        assert "nonexistent_tool" not in selected
+
+    def test_all_tools_accessible(self):
+        """Assigning every built-in name returns an entry for every built-in name."""
+        from orchestrator.tools.registry import BUILTIN_TOOLS, get_tools_for_agent
+
+        every_name = list(BUILTIN_TOOLS.keys())
+        selected = get_tools_for_agent(make_agent(every_name))
+        assert set(selected.keys()) == set(BUILTIN_TOOLS.keys())
+
+
+class TestToLitellmFormat:
+    """to_litellm_format turns a tool mapping into a list of OpenAI function-calling entries."""
+
+    def test_returns_list_of_dicts(self):
+        """One tool in produces a list holding exactly one entry."""
+        from orchestrator.tools.registry import BUILTIN_TOOLS, to_litellm_format
+
+        converted = to_litellm_format({"web_search": BUILTIN_TOOLS["web_search"]})
+        assert isinstance(converted, list)
+        assert len(converted) == 1
+
+    def test_openai_schema_structure(self):
+        """Entry is type='function' with a nested name/description/parameters object."""
+        from orchestrator.tools.registry import BUILTIN_TOOLS, to_litellm_format
+
+        entry = to_litellm_format({"web_search": BUILTIN_TOOLS["web_search"]})[0]
+
+        assert entry["type"] == "function"
+        assert "function" in entry
+
+        function_spec = entry["function"]
+        assert function_spec["name"] == "web_search"
+        for field in ("description", "parameters"):
+            assert field in function_spec
+
+    def test_empty_tools_returns_empty_list(self):
+        """An empty tool mapping converts to an empty list."""
+        from orchestrator.tools.registry import to_litellm_format
+        assert to_litellm_format({}) == []
+
+    def test_multiple_tools_converted(self):
+        """Converting the whole built-in registry yields four entries."""
+        from orchestrator.tools.registry import BUILTIN_TOOLS, to_litellm_format
+
+        assert len(to_litellm_format(BUILTIN_TOOLS)) == 4