Validate crawl tool page object types

cursoragent · shrisukhani · cursoragent · commit b5cf933bef00 · 2026-02-13T22:23:54.000Z
Co-authored-by: Shri Sukhani <shrisukhani@users.noreply.github.com>
diff --git a/hyperbrowser/tools/__init__.py b/hyperbrowser/tools/__init__.py
@@ -26,6 +26,15 @@
 
 _MAX_KEY_DISPLAY_LENGTH = 120
 _TRUNCATED_KEY_DISPLAY_SUFFIX = "... (truncated)"
+_NON_OBJECT_CRAWL_PAGE_TYPES = (  # isinstance() targets: crawl page items of these types are rejected
+    str,
+    bytes,
+    bytearray,
+    memoryview,
+    int,
+    float,
+    bool,  # already matched by int (bool subclasses int)
+)
 
 
 def _format_tool_param_key_for_error(key: str) -> str:
@@ -232,6 +241,10 @@ def _render_crawl_markdown_output(response_data: Any) -> str:
         ) from exc
     markdown_sections: list[str] = []
     for index, page in enumerate(crawl_pages):
+        if page is None or isinstance(page, _NON_OBJECT_CRAWL_PAGE_TYPES):
+            raise HyperbrowserError(
+                f"crawl tool page must be an object at index {index}"
+            )
         page_markdown = _read_crawl_page_field(
             page, field_name="markdown", page_index=index
         )
diff --git a/tests/test_tools_response_handling.py b/tests/test_tools_response_handling.py
@@ -349,6 +349,15 @@ def markdown(self) -> str:
     assert exc_info.value.original_error is not None
 
 
+def test_crawl_tool_rejects_non_object_page_items():
+    client = _SyncCrawlClient(_Response(data=[123]))  # response data holds a single int item
+
+    with pytest.raises(
+        HyperbrowserError, match="crawl tool page must be an object at index 0"
+    ):
+        WebsiteCrawlTool.runnable(client, {"url": "https://example.com"})
+
+
 def test_crawl_tool_supports_mapping_page_items():
     client = _SyncCrawlClient(
         _Response(data=[{"url": "https://example.com", "markdown": "mapping body"}])
@@ -491,6 +500,17 @@ async def run() -> None:
     asyncio.run(run())
 
 
+def test_async_crawl_tool_rejects_non_object_page_items():
+    async def run() -> None:
+        client = _AsyncCrawlClient(_Response(data=[123]))  # response data holds a single int item
+        with pytest.raises(
+            HyperbrowserError, match="crawl tool page must be an object at index 0"
+        ):
+            await WebsiteCrawlTool.async_runnable(client, {"url": "https://example.com"})
+
+    asyncio.run(run())  # run the coroutine to completion so pytest sees any failure synchronously
+
+
 def test_async_browser_use_tool_rejects_non_string_final_result():
     async def run() -> None:
         client = _AsyncBrowserUseClient(