From c3ee6391b54d902b9586a23e30416062fef95fa4 Mon Sep 17 00:00:00 2001
From: sena-labs <218400180+sena-labs@users.noreply.github.com>
Date: Tue, 2 Jun 2026 00:35:24 +0200
Subject: [PATCH] test(browser): add regression tests for issue #723 error
 clarity
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

Guard against reintroducing the vague 'Task reached step limit without
completion. Last page: about:blank' message that the removed browser-use
agent produced when the underlying LLM provider rejected structured-output
headers (e.g. 'anthropic-beta: structured-outputs-2025-11-13').

The current Playwright-based browser tool returns specific, actionable
messages for each failure mode:
- Runtime unavailable  → 'Browser runtime unavailable: <reason>'
- Action call failure  → 'Browser <action> failed: <reason>'
- Unknown action       → 'Unknown browser action: <name>'

Three new tests verify these contracts and assert the old confusing
wording is absent.

Closes #723

Co-Authored-By: Claude Sonnet 4.6 <noreply@anthropic.com>
---
 tests/test_browser_agent_regressions.py | 109 ++++++++++++++++++++++++
 1 file changed, 109 insertions(+)
diff --git a/tests/test_browser_agent_regressions.py b/tests/test_browser_agent_regressions.py
index ab39875670..ed4d39f720 100644
--- a/tests/test_browser_agent_regressions.py
+++ b/tests/test_browser_agent_regressions.py
@@ -2940,3 +2940,112 @@ def test_legacy_browser_dependency_is_removed():
     assert ("browser" + "-use") not in (PROJECT_ROOT / "requirements.txt").read_text(
         encoding="utf-8"
     )
+
+
+# ---------------------------------------------------------------------------
+# Regression: issue #723 — browser failures must return clear error messages
+#
+# The removed browser-use agent produced "Task reached step limit without
+# completion. Last page: about:blank" when the underlying LLM provider
+# rejected structured-output headers.  The current Playwright-based tool
+# must return actionable errors instead.
+# ---------------------------------------------------------------------------
+
+
+@pytest.mark.anyio
+async def test_browser_tool_returns_clear_error_when_runtime_unavailable(monkeypatch):
+    """Report a runtime start-up failure as a clear, specific error.
+
+    Regression for issue #723: provider API errors (e.g. an unsupported
+    ``anthropic-beta`` header or a grammar-too-large reply) made the removed
+    browser-use agent exhaust its steps and answer with a vague "about:blank /
+    step limit" message.  The current tool must report the failure directly.
+    """
+    provider_error = "litellm.BadRequestError: structured-outputs-2025-11-13 not supported"
+
+    async def _raise_provider_error(context_id, create=True, agent=None):
+        raise RuntimeError(provider_error)
+
+    monkeypatch.setattr(browser_tool_module, "get_runtime", _raise_provider_error)
+    fake_agent = SimpleNamespace(context=SimpleNamespace(id="ctx"))
+    browser = browser_tool_module.Browser(
+        agent=fake_agent,
+        name="browser",
+        method=None,
+        args={},
+        message="",
+        loop_data=None,
+    )
+
+    result = await browser.execute(action="open", url="https://example.com")
+    lowered = result.message.lower()
+
+    assert result.break_loop is False
+    assert "runtime unavailable" in lowered
+    # The legacy "step limit / about:blank" wording must never come back.
+    assert "step limit" not in lowered
+    assert "about:blank" not in result.message
+
+
+@pytest.mark.anyio
+async def test_browser_action_failure_names_the_failed_action(monkeypatch):
+    """Name the failing action in the error when ``runtime.call`` raises.
+
+    Companion to test_browser_tool_returns_clear_error_when_runtime_unavailable:
+    the runtime starts, but a later call fails (e.g. CDP disconnection, page
+    crash).  The error must name the action so operators can triage quickly.
+    """
+
+    class _BrokenRuntime:
+        async def call(self, method, *args, **kwargs):
+            raise RuntimeError("CDP connection lost")
+
+    async def _provide_broken_runtime(context_id, create=True, agent=None):
+        return _BrokenRuntime()
+
+    monkeypatch.setattr(browser_tool_module, "get_runtime", _provide_broken_runtime)
+    browser = browser_tool_module.Browser(
+        agent=SimpleNamespace(context=SimpleNamespace(id="ctx")),
+        name="browser",
+        method=None,
+        args={},
+        message="",
+        loop_data=None,
+    )
+
+    result = await browser.execute(action="navigate", browser_id=1, url="https://example.com")
+    lowered = result.message.lower()
+
+    assert result.break_loop is False
+    assert "navigate" in result.message
+    assert "failed" in lowered
+    assert "step limit" not in lowered
+    assert "about:blank" not in result.message
+
+
+@pytest.mark.anyio
+async def test_browser_unknown_action_returns_informative_message(monkeypatch):
+    """Unknown action keyword yields an explicit "unknown action" error naming it."""
+
+    class _NeverCalledRuntime:
+        async def call(self, method, *args, **kwargs):
+            raise AssertionError("runtime.call should not be reached for unknown action")
+
+    async def _ok_get_runtime(context_id, create=True, agent=None):
+        return _NeverCalledRuntime()
+
+    monkeypatch.setattr(browser_tool_module, "get_runtime", _ok_get_runtime)
+    tool = browser_tool_module.Browser(
+        agent=SimpleNamespace(context=SimpleNamespace(id="ctx")),
+        name="browser",
+        method=None,
+        args={},
+        message="",
+        loop_data=None,
+    )
+    response = await tool.execute(action="nonexistent_action_xyz")
+
+    assert response.break_loop is False
+    assert "nonexistent_action_xyz" in response.message
+    assert "unknown" in response.message.lower()  # not a generic "<action> failed" reply
+    assert "step limit" not in response.message.lower()