feat(agent): emit structured _tool_events progress metadata

Extend the existing on_progress callback to carry structured tool-event
payloads alongside the plain-text hint, so channels can render rich
tool execution state (start/finish/error, arguments, results, file
attachments) rather than only the pre-formatted hint string.

Changes
-------
- AgentLoop._tool_event_start_payload() — builds a version-1 start
  payload from a ToolCallRequest
- AgentLoop._tool_event_result_extras() — extracts files/embeds from a
  tool result dict
- AgentLoop._tool_event_finish_payloads() — maps tool_calls +
  tool_results + tool_events from AgentHookContext into finish payloads
- _LoopHook.before_execute_tools() — passes tool_events=[...] to
  on_progress together with the existing tool_hint flag
- _LoopHook.after_iteration() — emits a second on_progress call with
  the finish payloads once tool results are available
- _bus_progress() — forwards tool_events as _tool_events in OutboundMessage
  metadata so channel implementations can read them
- on_progress type widened to Callable[..., Awaitable[None]] on all
  public entry points; _cli_progress updated to accept and ignore
  tool_events

The contract is additive: callers that only accept (content, *, tool_hint)
continue to work unchanged. Callers that also accept tool_events receive
the structured data.

Co-Authored-By: Claude Sonnet 4.6 <noreply@anthropic.com>
This commit is contained in:
Pablo Cabeza 2026-04-23 00:54:23 +01:00 committed by Xubin Ren
parent 185a8fd34d
commit c23d719780
4 changed files with 194 additions and 6 deletions

View File

@ -103,13 +103,18 @@ class _LoopHook(AgentHook):
if thought: if thought:
await self._on_progress(thought) await self._on_progress(thought)
tool_hint = self._loop._strip_think(self._loop._tool_hint(context.tool_calls)) tool_hint = self._loop._strip_think(self._loop._tool_hint(context.tool_calls))
await self._on_progress(tool_hint, tool_hint=True) tool_events = [self._loop._tool_event_start_payload(tc) for tc in context.tool_calls]
await self._on_progress(tool_hint, tool_hint=True, tool_events=tool_events)
for tc in context.tool_calls: for tc in context.tool_calls:
args_str = json.dumps(tc.arguments, ensure_ascii=False) args_str = json.dumps(tc.arguments, ensure_ascii=False)
logger.info("Tool call: {}({})", tc.name, args_str[:200]) logger.info("Tool call: {}({})", tc.name, args_str[:200])
self._loop._set_tool_context(self._channel, self._chat_id, self._message_id) self._loop._set_tool_context(self._channel, self._chat_id, self._message_id)
async def after_iteration(self, context: AgentHookContext) -> None: async def after_iteration(self, context: AgentHookContext) -> None:
if self._on_progress and context.tool_calls and context.tool_events:
tool_events = self._loop._tool_event_finish_payloads(context)
if tool_events:
await self._on_progress("", tool_events=tool_events)
u = context.usage or {} u = context.usage or {}
logger.debug( logger.debug(
"LLM usage: prompt={} completion={} cached={}", "LLM usage: prompt={} completion={} cached={}",
@ -375,6 +380,58 @@ class AgentLoop:
sub_cancelled = await self.subagents.cancel_by_session(key) sub_cancelled = await self.subagents.cancel_by_session(key)
return cancelled + sub_cancelled return cancelled + sub_cancelled
@staticmethod
def _tool_event_start_payload(tool_call: Any) -> dict[str, Any]:
return {
"version": 1,
"phase": "start",
"call_id": str(getattr(tool_call, "id", "") or ""),
"name": getattr(tool_call, "name", ""),
"arguments": getattr(tool_call, "arguments", {}) or {},
"result": None,
"error": None,
"files": [],
"embeds": [],
}
@staticmethod
def _tool_event_result_extras(result: Any) -> tuple[list[Any], list[Any]]:
if not isinstance(result, dict):
return [], []
files = result.get("files") if isinstance(result.get("files"), list) else []
embeds = result.get("embeds") if isinstance(result.get("embeds"), list) else []
return files, embeds
@classmethod
def _tool_event_finish_payloads(cls, context: AgentHookContext) -> list[dict[str, Any]]:
    """Map executed tool calls onto version-1 finish ("end"/"error") payloads.

    Zips ``context.tool_calls`` / ``tool_results`` / ``tool_events``
    positionally; ``zip`` truncates to the shortest of the three, so a
    partially-recorded iteration never indexes out of range. An event whose
    ``status`` is not ``"ok"`` yields an error-phase payload with a
    human-readable ``error`` string and no ``result``.
    """
    payloads: list[dict[str, Any]] = []
    for tool_call, result, raw_event in zip(
        context.tool_calls, context.tool_results, context.tool_events
    ):
        event = raw_event if isinstance(raw_event, dict) else {}
        succeeded = event.get("status") == "ok"
        files, embeds = cls._tool_event_result_extras(result)
        entry: dict[str, Any] = {
            "version": 1,
            "phase": "end" if succeeded else "error",
            "call_id": str(getattr(tool_call, "id", "") or ""),
            "name": getattr(tool_call, "name", ""),
            "arguments": getattr(tool_call, "arguments", {}) or {},
            "result": result if succeeded else None,
            "error": None,
            "files": files,
            "embeds": embeds,
        }
        if not succeeded:
            # Prefer the raw (stripped) string result as the error text;
            # otherwise fall back to the event's detail or a generic message.
            if isinstance(result, str) and result.strip():
                entry["error"] = result.strip()
            else:
                entry["error"] = str(event.get("detail") or "Tool execution failed")
        payloads.append(entry)
    return payloads
def _effective_session_key(self, msg: InboundMessage) -> str: def _effective_session_key(self, msg: InboundMessage) -> str:
"""Return the session key used for task routing and mid-turn injections.""" """Return the session key used for task routing and mid-turn injections."""
if self._unified_session and not msg.session_key_override: if self._unified_session and not msg.session_key_override:
@ -726,7 +783,7 @@ class AgentLoop:
self, self,
msg: InboundMessage, msg: InboundMessage,
session_key: str | None = None, session_key: str | None = None,
on_progress: Callable[[str], Awaitable[None]] | None = None, on_progress: Callable[..., Awaitable[None]] | None = None,
on_stream: Callable[[str], Awaitable[None]] | None = None, on_stream: Callable[[str], Awaitable[None]] | None = None,
on_stream_end: Callable[..., Awaitable[None]] | None = None, on_stream_end: Callable[..., Awaitable[None]] | None = None,
pending_queue: asyncio.Queue | None = None, pending_queue: asyncio.Queue | None = None,
@ -833,10 +890,17 @@ class AgentLoop:
chat_id=msg.chat_id, chat_id=msg.chat_id,
) )
async def _bus_progress(content: str, *, tool_hint: bool = False) -> None: async def _bus_progress(
content: str,
*,
tool_hint: bool = False,
tool_events: list[dict[str, Any]] | None = None,
) -> None:
meta = dict(msg.metadata or {}) meta = dict(msg.metadata or {})
meta["_progress"] = True meta["_progress"] = True
meta["_tool_hint"] = tool_hint meta["_tool_hint"] = tool_hint
if tool_events:
meta["_tool_events"] = tool_events
await self.bus.publish_outbound( await self.bus.publish_outbound(
OutboundMessage( OutboundMessage(
channel=msg.channel, channel=msg.channel,
@ -1137,7 +1201,7 @@ class AgentLoop:
channel: str = "cli", channel: str = "cli",
chat_id: str = "direct", chat_id: str = "direct",
media: list[str] | None = None, media: list[str] | None = None,
on_progress: Callable[[str], Awaitable[None]] | None = None, on_progress: Callable[..., Awaitable[None]] | None = None,
on_stream: Callable[[str], Awaitable[None]] | None = None, on_stream: Callable[[str], Awaitable[None]] | None = None,
on_stream_end: Callable[..., Awaitable[None]] | None = None, on_stream_end: Callable[..., Awaitable[None]] | None = None,
) -> OutboundMessage | None: ) -> OutboundMessage | None:

View File

@ -1028,7 +1028,7 @@ def agent(
# Shared reference for progress callbacks # Shared reference for progress callbacks
_thinking: ThinkingSpinner | None = None _thinking: ThinkingSpinner | None = None
async def _cli_progress(content: str, *, tool_hint: bool = False) -> None: async def _cli_progress(content: str, *, tool_hint: bool = False, **_kwargs: Any) -> None:
ch = agent_loop.channels_config ch = agent_loop.channels_config
if ch and tool_hint and not ch.send_tool_hints: if ch and tool_hint and not ch.send_tool_hints:
return return

View File

@ -0,0 +1,125 @@
"""Tests for structured tool-event progress metadata emitted by AgentLoop."""
from pathlib import Path
from unittest.mock import AsyncMock, MagicMock
import pytest
from nanobot.agent.loop import AgentLoop
from nanobot.bus.events import InboundMessage
from nanobot.bus.queue import MessageBus
from nanobot.providers.base import LLMResponse, ToolCallRequest
def _make_loop(tmp_path: Path) -> AgentLoop:
    """Construct a minimal AgentLoop: fresh bus, mocked provider, tmp workspace."""
    provider = MagicMock()
    provider.get_default_model.return_value = "test-model"
    return AgentLoop(
        bus=MessageBus(),
        provider=provider,
        workspace=tmp_path,
        model="test-model",
    )
class TestToolEventProgress:
    """_run_agent_loop emits structured tool_events via on_progress."""

    @pytest.mark.asyncio
    async def test_start_and_finish_events_emitted(self, tmp_path: Path) -> None:
        loop = _make_loop(tmp_path)
        tool_call = ToolCallRequest(id="call1", name="custom_tool", arguments={"path": "foo.txt"})
        responses = iter(
            [
                LLMResponse(content="Visible", tool_calls=[tool_call]),
                LLMResponse(content="Done", tool_calls=[]),
            ]
        )
        loop.provider.chat_with_retry = AsyncMock(side_effect=lambda *a, **kw: next(responses))
        loop.tools.get_definitions = MagicMock(return_value=[])
        loop.tools.prepare_call = MagicMock(return_value=(None, {"path": "foo.txt"}, None))
        loop.tools.execute = AsyncMock(return_value="ok")

        seen: list[tuple[str, bool, list[dict] | None]] = []

        async def on_progress(
            content: str,
            *,
            tool_hint: bool = False,
            tool_events: list[dict] | None = None,
        ) -> None:
            seen.append((content, tool_hint, tool_events))

        final_content, _, _, _, _ = await loop._run_agent_loop([], on_progress=on_progress)

        assert final_content == "Done"
        start_payload = {
            "version": 1,
            "phase": "start",
            "call_id": "call1",
            "name": "custom_tool",
            "arguments": {"path": "foo.txt"},
            "result": None,
            "error": None,
            "files": [],
            "embeds": [],
        }
        # Finish payload differs from start only in phase and result.
        finish_payload = {**start_payload, "phase": "end", "result": "ok"}
        assert seen == [
            ("Visible", False, None),
            ('custom_tool("foo.txt")', True, [start_payload]),
            ("", False, [finish_payload]),
        ]

    @pytest.mark.asyncio
    async def test_bus_progress_forwards_tool_events_to_outbound_metadata(self, tmp_path: Path) -> None:
        """When run() handles a bus message, _tool_events lands in OutboundMessage metadata."""
        bus = MessageBus()
        provider = MagicMock()
        provider.get_default_model.return_value = "test-model"
        loop = AgentLoop(bus=bus, provider=provider, workspace=tmp_path, model="test-model")
        tool_call = ToolCallRequest(id="tc1", name="exec", arguments={"command": "ls"})
        responses = iter(
            [
                LLMResponse(content="", tool_calls=[tool_call]),
                LLMResponse(content="Done", tool_calls=[]),
            ]
        )
        loop.provider.chat_with_retry = AsyncMock(side_effect=lambda *a, **kw: next(responses))
        loop.tools.get_definitions = MagicMock(return_value=[])
        loop.tools.prepare_call = MagicMock(return_value=(None, {"command": "ls"}, None))
        loop.tools.execute = AsyncMock(return_value="file.txt")

        await loop.run(InboundMessage(channel="telegram", chat_id="chat1", content="run ls"))

        # Drain every outbound message, then keep only the tool-event carriers.
        outbound = []
        while bus.outbound_size() > 0:
            outbound.append(await bus.consume_outbound())
        carrying = [m for m in outbound if m.metadata and m.metadata.get("_tool_events")]
        assert carrying, "expected at least one outbound message with _tool_events"

        def _phase(m):
            return m.metadata["_tool_events"][0]["phase"]

        starts = [m for m in carrying if _phase(m) == "start"]
        finishes = [m for m in carrying if _phase(m) in ("end", "error")]
        assert starts, "expected a start-phase tool event"
        assert finishes, "expected a finish-phase tool event"

        start = starts[0].metadata["_tool_events"][0]
        assert start["name"] == "exec"
        assert start["call_id"] == "tc1"
        assert start["result"] is None

        finish = finishes[0].metadata["_tool_events"][0]
        assert finish["phase"] == "end"
        assert finish["result"] == "file.txt"

View File

@ -152,7 +152,6 @@ class TestMessageToolSuppressLogic:
('read foo.txt', True), ('read foo.txt', True),
] ]
class TestMessageToolTurnTracking: class TestMessageToolTurnTracking:
def test_sent_in_turn_tracks_same_target(self) -> None: def test_sent_in_turn_tracks_same_target(self) -> None: