OpenHands
diff --git a/‎docs.json‎
Lines changed: 33 additions & 5 deletions b/‎docs.json‎
Lines changed: 33 additions & 5 deletions
diff --git a/‎sdk/guides/agent-browser-use.mdx‎
Lines changed: 119 additions & 0 deletions b/‎sdk/guides/agent-browser-use.mdx‎
Lines changed: 119 additions & 0 deletions
@@ -174,7 +174,7 @@
         ]
       },
       {
-        "tab": "Agent SDK (v1)",
+        "tab": "SDK",
         "pages": [
           "sdk/index",
           "sdk/getting-started",
@@ -184,6 +184,38 @@
               "sdk/guides/hello-world",
               "sdk/guides/custom-tools",
               "sdk/guides/mcp",
+              "sdk/guides/skill",
+              "sdk/guides/context-condenser",
+              "sdk/guides/security",
+              "sdk/guides/metrics",
+              "sdk/guides/secrets",
+              {
+                "group": "LLM Features",
+                "pages": [
+                  "sdk/guides/llm-registry",
+                  "sdk/guides/llm-routing",
+                  "sdk/guides/llm-reasoning",
+                  "sdk/guides/llm-image-input"
+                ]
+              },
+              {
+                "group": "Agent Features",
+                "pages": [
+                  "sdk/guides/agent-interactive-terminal",
+                  "sdk/guides/agent-browser-use",
+                  "sdk/guides/agent-custom",
+                  "sdk/guides/agent-stuck-detector"
+                ]
+              },
+              {
+                "group": "Conversation Features",
+                "pages": [
+                  "sdk/guides/convo-persistence",
+                  "sdk/guides/convo-pause-and-resume",
+                  "sdk/guides/convo-send-message-while-running",
+                  "sdk/guides/convo-async"
+                ]
+              },
               {
                 "group": "Remote Agent Server",
                 "pages": [
@@ -226,10 +258,6 @@
       {
           "tab": "OpenHands (Core) API",
           "openapi": "openapi/openapi.json"
-      },
-      {
-          "tab": "Agent SDK (API)",
-          "openapi": "openapi/agent-sdk.json"
       }
     ],
     "global": {
 
@@ -0,0 +1,119 @@
+---
+title: Browser Use
+description: Enable web browsing and interaction capabilities for your agent.
+---
+
+<Note>
+This example is available on GitHub: [examples/01_standalone_sdk/15_browser_use.py](https://github.com/All-Hands-AI/agent-sdk/blob/main/examples/01_standalone_sdk/15_browser_use.py)
+</Note>
+
+The `BrowserToolSet` integration enables your agent to interact with web pages through automated browser control. Built on top of [browser-use](https://github.com/browser-use/browser-use), it provides capabilities for navigating websites, clicking elements, filling forms, and extracting content — all through natural-language instructions.
+
+```python icon="python" expandable examples/01_standalone_sdk/15_browser_use.py
+import os
+
+from pydantic import SecretStr
+
+from openhands.sdk import (
+    LLM,
+    Agent,
+    Conversation,
+    Event,
+    LLMConvertibleEvent,
+    get_logger,
+)
+from openhands.sdk.tool import Tool, register_tool
+from openhands.tools.browser_use import BrowserToolSet
+from openhands.tools.execute_bash import BashTool
+from openhands.tools.file_editor import FileEditorTool
+
+
+logger = get_logger(__name__)  # NOTE(review): not used elsewhere in this example
+
+# Configure LLM from env: LLM_API_KEY (required), LLM_MODEL, LLM_BASE_URL (optional)
+api_key = os.getenv("LLM_API_KEY")
+assert api_key is not None, "LLM_API_KEY environment variable is not set."
+model = os.getenv("LLM_MODEL", "openhands/claude-sonnet-4-5-20250929")
+base_url = os.getenv("LLM_BASE_URL")
+llm = LLM(
+    usage_id="agent",
+    model=model,
+    base_url=base_url,
+    api_key=SecretStr(api_key),
+)
+
+# Tools: register each tool class under a name, then reference it by that name
+cwd = os.getcwd()
+register_tool("BashTool", BashTool)
+register_tool("FileEditorTool", FileEditorTool)
+register_tool("BrowserToolSet", BrowserToolSet)
+tools = [
+    Tool(
+        name="BashTool",
+    ),
+    Tool(name="FileEditorTool"),
+    Tool(name="BrowserToolSet"),
+]
+
+# If you need fine-grained browser control, you can manually register individual browser
+# tools by creating a BrowserToolExecutor and providing factories that return customized
+# Tool instances before constructing the Agent.
+
+# Agent: built from the LLM and the tool specs defined above
+agent = Agent(llm=llm, tools=tools)
+
+llm_messages = []  # raw LLM messages, appended by conversation_callback
+
+
+def conversation_callback(event: Event):  # passed to Conversation(callbacks=[...])
+    if isinstance(event, LLMConvertibleEvent):  # ignore all other event types
+        llm_messages.append(event.to_llm_message())
+
+
+conversation = Conversation(
+    agent=agent, callbacks=[conversation_callback], workspace=cwd
+)
+
+conversation.send_message(
+    "Could you go to https://openhands.dev/ blog page and summarize main "
+    "points of the latest blog?"
+)
+conversation.run()
+
+
+print("=" * 100)
+print("Conversation finished. Got the following LLM messages:")
+for i, message in enumerate(llm_messages):
+    print(f"Message {i}: {str(message)[:200]}")  # first 200 chars of each message
+```
+
+```bash Running the Example
+export LLM_API_KEY="your-api-key"
+cd agent-sdk
+uv run python examples/01_standalone_sdk/15_browser_use.py
+```
+
+## How It Works
+
+The example demonstrates combining multiple tools to create a capable web research agent:
+
+1. **BrowserToolSet**: Provides automated browser control for web interaction
+2. **FileEditorTool**: Allows the agent to read and write files if needed
+3. **BashTool**: Enables command-line operations for additional functionality
+
+The agent uses these tools to:
+- Navigate to specified URLs
+- Interact with web page elements (clicking, scrolling, etc.)
+- Extract and analyze content from web pages
+- Summarize information from multiple sources
+
+In this example, the agent visits the openhands.dev blog, finds the latest blog post, and provides a summary of its main points.
+
+## Customization
+
+For advanced use cases that require only a subset of browser tools or custom configurations, you can manually register individual browser tools. Refer to the [BrowserToolSet definition](https://github.com/All-Hands-AI/agent-sdk/blob/main/openhands-tools/openhands/tools/browser_use/definition.py) to see which individual tools are available, then create a `BrowserToolExecutor` with customized tool configurations before constructing the `Agent`. This gives you fine-grained control over which browser capabilities are exposed to the agent.
+
+## Next Steps
+
+- **[Custom Tools](/sdk/guides/custom-tools)** - Create specialized tools
+- **[MCP Integration](/sdk/guides/mcp)** - Connect external services