fix(runner): narrow workspace_violation fatal classification (#3599, helps #3605 #3597)

PR #3493 promoted every shell `_guard_command` rejection to a turn-fatal RuntimeError. The two heuristic outputs in that list -- `path outside working dir` and `path traversal detected` -- routinely false-positive on benign constructs (e.g. `2>/dev/null`, quoted `..` arguments to sed/find, absolute paths inside inline scripts), so legitimate workspace commands silently kill the user's turn (#3599) and the agent never gets a chance to retry with a different approach (#3605). Two changes, both narrowly scoped: - `ExecTool._guard_command` now skips a small allow-list of kernel device files (`/dev/null`, the standard streams, `/dev/random`, `/dev/fd/N`, ...) before the workspace path check, matched against the pre-resolve string so symlinks like `/dev/stderr -> /proc/self/fd/2` still hit the allow-list. Real outside writes such as `> /etc/issue` remain blocked. - `AgentRunner._WORKSPACE_BLOCK_MARKERS` keeps only the four hard path-resolution errors from filesystem.py / shell.py and the SSRF marker. The two heuristic substrings move out of the fatal list, so the LLM sees them as ordinary tool errors and can self-correct in the next iteration. SSRF stays fatal because retrying an internal URL with a different phrasing would defeat the safety boundary. Tests: - `tests/tools/test_exec_security.py`: parametrized regression for the exact #3599 command sample plus other stdio redirects and device reads; explicit negative case asserts `> /etc/issue` is still blocked. - `tests/agent/test_runner.py`: `_is_workspace_violation` no longer fatals on the two heuristic markers, plus an end-to-end case proving the runner hands the guard error back to the LLM and finalizes the next turn cleanly.
2026-05-07 02:05:51 +00:00 · 2026-05-03 16:34:31 +00:00 · 2026-05-03 16:34:31 +00:00 · 7742f8fbdc
commit 7742f8fbdc
parent 9a9e446f3f
4 changed files with 190 additions and 3 deletions
--- a/nanobot/agent/runner.py
+++ b/nanobot/agent/runner.py
@ -831,14 +831,30 @@ class AgentRunner:
            detail = detail[:120] + "..."
        return result, {"name": tool_call.name, "status": "ok", "detail": detail}, None

-    # Markers identifying tool results that represent a workspace / safety boundary rejection.
+    # Markers identifying tool results that represent a *hard* workspace /
+    # safety boundary rejection -- only these abort the agent loop.
+    #
+    # We deliberately keep this list narrow (#3599 / #3605):
+    # - The first four come from explicit path-resolution checks in
+    #   ``filesystem.py`` and ``shell.py`` that cannot false-positive on user
+    #   payloads -- if you see them, the LLM truly tried to escape the
+    #   workspace.
+    # - "internal/private url detected" stays fatal because SSRF is a real
+    #   security boundary; allowing the LLM to "retry" would just let it
+    #   poke internal infra with a different URL phrasing.
+    # - "path traversal detected" and "path outside working dir" are
+    #   intentionally *not* listed: both come from the heuristic
+    #   ``_guard_command`` checks in ``shell.py`` which scan the raw command
+    #   string and routinely false-positive on legitimate constructs (e.g.
+    #   ``2>/dev/null`` redirects, quoted ``..`` arguments to ``sed`` /
+    #   ``find``, paths inside inline scripts).  Treating them as fatal
+    #   silently kills user turns (#3599) and prevents the agent from
+    #   self-correcting by trying a different approach (#3605).
    _WORKSPACE_BLOCK_MARKERS: tuple[str, ...] = (
        "outside the configured workspace",
        "outside allowed directory",
        "working_dir is outside",
        "working_dir could not be resolved",
-        "path traversal detected",
-        "path outside working dir",
        "internal/private url detected",
    )

--- a/nanobot/agent/tools/shell.py
+++ b/nanobot/agent/tools/shell.py
@ -83,6 +83,22 @@ class ExecTool(Tool):
    _MAX_TIMEOUT = 600
    _MAX_OUTPUT = 10_000

+    # Kernel device files that are universally safe as stdio redirect targets
+    # (e.g. ``cmd 2>/dev/null``).  Without this allow-list the workspace guard
+    # treats them as ``path outside working dir`` and the LLM ends up unable
+    # to silence stderr inside the workspace (#3599).
+    _BENIGN_DEVICE_PATHS: frozenset[str] = frozenset({
+        "/dev/null",
+        "/dev/zero",
+        "/dev/full",
+        "/dev/random",
+        "/dev/urandom",
+        "/dev/stdin",
+        "/dev/stdout",
+        "/dev/stderr",
+        "/dev/tty",
+    })
+
    @property
    def description(self) -> str:
        return (
@ -300,10 +316,18 @@ class ExecTool(Tool):
            for raw in self._extract_absolute_paths(cmd):
                try:
                    expanded = os.path.expandvars(raw.strip())
+                    # Match against the un-resolved path first.  On Linux,
+                    # /dev/stderr is a symlink to /proc/self/fd/2 and
+                    # ``Path.resolve()`` would mask the device-file intent.
+                    if self._is_benign_device_path(expanded):
+                        continue
                    p = Path(expanded).expanduser().resolve()
                except Exception:
                    continue

+                if self._is_benign_device_path(str(p)):
+                    continue
+
                media_path = get_media_dir().resolve()
                if (p.is_absolute()
                    and cwd_path not in p.parents
@ -315,6 +339,21 @@ class ExecTool(Tool):

        return None

+    @classmethod
+    def _is_benign_device_path(cls, path: str) -> bool:
+        """Return True when *path* is a kernel device file we should never block.
+
+        Treats ``/dev/null``, the standard streams, ``/dev/random``, etc. as
+        always-safe targets so that idiomatic stdio plumbing such as
+        ``cmd 2>/dev/null`` or ``echo done >/dev/stderr`` is not flagged as a
+        workspace violation regardless of the configured working directory.
+        Also accepts ``/dev/fd/N`` because those are per-process aliases for
+        already-open file descriptors and never escape the workspace.
+        """
+        if path in cls._BENIGN_DEVICE_PATHS:
+            return True
+        return path.startswith("/dev/fd/")
+
    @staticmethod
    def _extract_absolute_paths(command: str) -> list[str]:
        # Windows: match drive-root paths like `C:\` as well as `C:\path\to\file`
--- a/tests/agent/test_runner.py
+++ b/tests/agent/test_runner.py
@ -373,6 +373,79 @@ def test_is_workspace_violation_recognizes_ssrf_block():
    ) is False


+def test_is_workspace_violation_does_not_fatal_on_shell_guard_heuristics():
+    """#3599 / #3605 regression: shell guard heuristics must NOT be fatal.
+
+    ``path outside working dir`` and ``path traversal detected`` are produced
+    by best-effort string scans inside ``ExecTool._guard_command`` -- they
+    routinely false-positive on idiomatic constructs (``2>/dev/null``,
+    ``sed 's|x|../y|g'``) and should be surfaced to the LLM as recoverable
+    tool errors so it can switch tactics, not abort the whole turn.
+    """
+    from nanobot.agent.runner import AgentRunner
+
+    assert AgentRunner._is_workspace_violation(
+        "Error: Command blocked by safety guard (path outside working dir)"
+    ) is False
+    assert AgentRunner._is_workspace_violation(
+        "Error: Command blocked by safety guard (path traversal detected)"
+    ) is False
+
+
+@pytest.mark.asyncio
+async def test_runner_lets_llm_recover_from_shell_guard_path_outside():
+    """End-to-end: a guard-blocked exec is a soft tool error, not a turn-fatal.
+
+    Reporter scenario: a previous PR turned ``path outside working dir`` into
+    a turn-fatal RuntimeError, so when the false-positive guard fired the
+    user got no further iterations and (depending on channel) a silent hang.
+    After narrowing the marker list, the runner must hand the error back to
+    the LLM and let the next iteration succeed normally.
+    """
+    from nanobot.agent.runner import AgentRunSpec, AgentRunner
+
+    provider = MagicMock()
+    captured_second_call: list[dict] = []
+
+    async def chat_with_retry(*, messages, **kwargs):
+        if provider.chat_with_retry.await_count == 1:
+            return LLMResponse(
+                content="trying noisy cleanup",
+                tool_calls=[ToolCallRequest(
+                    id="call_blocked",
+                    name="exec",
+                    arguments={"command": "rm scratch.txt 2>/dev/null"},
+                )],
+            )
+        captured_second_call[:] = list(messages)
+        return LLMResponse(content="recovered final answer", tool_calls=[])
+
+    provider.chat_with_retry = AsyncMock(side_effect=chat_with_retry)
+    tools = MagicMock()
+    tools.get_definitions.return_value = []
+    tools.execute = AsyncMock(
+        return_value="Error: Command blocked by safety guard (path outside working dir)"
+    )
+
+    runner = AgentRunner(provider)
+    result = await runner.run(AgentRunSpec(
+        initial_messages=[],
+        tools=tools,
+        model="test-model",
+        max_iterations=3,
+        max_tool_result_chars=_MAX_TOOL_RESULT_CHARS,
+    ))
+
+    assert provider.chat_with_retry.await_count == 2, (
+        "guard hit must NOT short-circuit the loop -- LLM should get a second turn"
+    )
+    assert result.stop_reason != "tool_error"
+    assert result.error is None
+    assert result.final_content == "recovered final answer"
+    assert result.tool_events and result.tool_events[0]["status"] == "error"
+    assert "workspace_violation" not in result.tool_events[0]["detail"]
+
+
@pytest.mark.asyncio
 async def test_runner_persists_large_tool_results_for_follow_up_calls(tmp_path):
    from nanobot.agent.runner import AgentRunSpec, AgentRunner
--- a/tests/tools/test_exec_security.py
+++ b/tests/tools/test_exec_security.py
@ -182,3 +182,62 @@ async def test_exec_ignores_workspace_check_when_not_restricted(tmp_path):
    result = await tool.execute(command="echo ok", working_dir=str(other))
    assert "ok" in result
    assert "outside the configured workspace" not in result
+
+
+# --- #3599: stdio redirects to /dev/null must not trip the workspace guard ----
+
+
+@pytest.mark.parametrize(
+    "command",
+    [
+        # The exact command from the #3599 reporter.
+        'rm test_print.txt 2>/dev/null; echo "done"',
+        # Plain redirect of stdout / stderr.
+        "find . -type f >/dev/null",
+        "noisy_cmd 2>/dev/null",
+        "noisy_cmd >/dev/null 2>&1",
+        # Read from /dev/urandom is also a benign device read.
+        "head -c 16 /dev/urandom | xxd",
+        "echo done >/dev/stderr",
+        "echo line </dev/stdin",
+        # Per-process FD aliases never escape the workspace.
+        "cat /dev/fd/3",
+    ],
+)
+def test_exec_allows_benign_device_targets_inside_workspace(tmp_path, command):
+    workspace = tmp_path / "workspace"
+    workspace.mkdir()
+    tool = ExecTool(working_dir=str(workspace), restrict_to_workspace=True)
+    assert tool._guard_command(command, str(workspace)) is None
+
+
+@pytest.mark.asyncio
+async def test_exec_3599_regression_rm_with_dev_null_redirect(tmp_path):
+    """#3599: ``rm <ws-path> 2>/dev/null`` must succeed against the workspace guard."""
+    workspace = tmp_path / "workspace"
+    workspace.mkdir()
+    target = workspace / "test_print.txt"
+    target.write_text("scratch")
+    tool = ExecTool(working_dir=str(workspace), restrict_to_workspace=True, timeout=5)
+    result = await tool.execute(
+        command=f'rm {target} 2>/dev/null; echo "done"',
+        working_dir=str(workspace),
+    )
+    assert "done" in result
+    assert "path outside working dir" not in result
+    assert not target.exists()
+
+
+def test_exec_still_blocks_real_outside_path_via_redirect(tmp_path):
+    """Redirect *targets* outside the workspace (not /dev/...) must still be blocked.
+
+    We only whitelist kernel device files; arbitrary outside redirects such as
+    ``> /etc/issue`` should remain caught by the workspace guard so a buggy
+    LLM cannot exfiltrate data outside the workspace via stderr redirection.
+    """
+    workspace = tmp_path / "workspace"
+    workspace.mkdir()
+    tool = ExecTool(working_dir=str(workspace), restrict_to_workspace=True)
+    blocked = tool._guard_command("echo pwn > /etc/issue", str(workspace))
+    assert blocked is not None
+    assert "path outside working dir" in blocked