From 09312a2cc52829b3e04b85eb9fcdaca3353f0305 Mon Sep 17 00:00:00 2001
From: Mish Ushakov <10400064+mishushakov@users.noreply.github.com>
Date: Wed, 15 Apr 2026 16:27:24 +0200
Subject: [PATCH] Add OpenAI Agents SDK sandbox docs

---
 docs.json                          |   1 +
 docs/agents/openai-agents-sdk.mdx  | 583 +++++++++++++++++++++++++++++
 images/icons/openai-agents-sdk.svg |   8 +
 3 files changed, 592 insertions(+)
 create mode 100644 docs/agents/openai-agents-sdk.mdx
 create mode 100644 images/icons/openai-agents-sdk.svg

diff --git a/docs.json b/docs.json
index 21a5608a..a45830f5 100644
--- a/docs.json
+++ b/docs.json
@@ -56,6 +56,7 @@
               "docs/agents/amp",
               "docs/agents/claude-code",
               "docs/agents/codex",
+              "docs/agents/openai-agents-sdk",
               {
                 "group": "OpenClaw",
                 "icon": "https://mintlify.s3.us-west-1.amazonaws.com/e2b-openclaw-icon/images/icons/openclaw.svg",
diff --git a/docs/agents/openai-agents-sdk.mdx b/docs/agents/openai-agents-sdk.mdx
new file mode 100644
index 00000000..95b2c6a4
--- /dev/null
+++ b/docs/agents/openai-agents-sdk.mdx
@@ -0,0 +1,583 @@
+---
+title: "OpenAI Agents SDK"
+description: "Use E2B sandboxes with the OpenAI Agents SDK."
+icon: "/images/icons/openai-agents-sdk.svg"
+---
+
+The [OpenAI Agents SDK](https://github.com/openai/openai-agents-python) is a framework for building agentic workflows. E2B provides a native integration that lets you run `SandboxAgent` instances inside isolated E2B sandboxes — giving your agents full filesystem, terminal, and network access in a secure environment.
+
+To use E2B as the sandbox backend:
+
+1. Create a sandbox session with `E2BSandboxClient`.
+2. Build a `SandboxAgent` with your instructions and model.
+3. Run the agent and pass the sandbox session through `RunConfig`.
+
+## Install the dependencies
+
+Install the [OpenAI Agents SDK](https://pypi.org/project/openai-agents/) with the E2B extra to pull in the sandbox integration.
+
+```bash
+pip install openai-agents[e2b]
+```
+
+You will also need API keys for OpenAI and E2B.
+
+```bash
+export OPENAI_API_KEY="..."
+export E2B_API_KEY="..."
+```
+
+## Basic example
+
+Create an `E2BSandboxClient`, start a session, and run a `SandboxAgent` inside it. The agent gets full access to the sandbox environment — it can run commands, read and write files, and inspect the workspace.
+
+### Create a session
+
+Initialize the `E2BSandboxClient` and create a sandbox session. The `pause_on_exit` option keeps the sandbox available after the script finishes so you can inspect its state.
+
+```python
+from agents.extensions.sandbox import (
+    E2BSandboxClient,
+    E2BSandboxClientOptions,
+    E2BSandboxType,
+)
+
+client = E2BSandboxClient()
+session = await client.create(
+    options=E2BSandboxClientOptions(
+        sandbox_type=E2BSandboxType.E2B,
+        timeout=900,
+        pause_on_exit=True,
+    )
+)
+```
+
+### Build and run the agent
+
+Define a `SandboxAgent` with a name, model, and instructions, then run it against the sandbox session using `Runner.run`. The result contains the agent's final output.
+
+```python
+from agents import ModelSettings, Runner
+from agents.run import RunConfig
+from agents.sandbox import SandboxAgent, SandboxRunConfig
+
+agent = SandboxAgent(
+    name="Workspace Inspector",
+    model="gpt-5.4",
+    instructions=(
+        "Inspect the workspace, explain what files exist, and summarize the project."
+    ),
+    model_settings=ModelSettings(tool_choice="required"),
+)
+
+result = await Runner.run(
+    agent,
+    "Look around the workspace and summarize what you find.",
+    run_config=RunConfig(sandbox=SandboxRunConfig(session=session)),
+)
+print(result.final_output)
+```
+
+### Shut down
+
+Always shut down the session when you're done to release sandbox resources.
+
+```python
+await session.shutdown()
+```
+
+### Full example
+
+The complete script that ties the steps above together.
+
+```python expandable
+import asyncio
+
+from agents import ModelSettings, Runner
+from agents.run import RunConfig
+from agents.sandbox import SandboxAgent, SandboxRunConfig
+from agents.extensions.sandbox import (
+    E2BSandboxClient,
+    E2BSandboxClientOptions,
+    E2BSandboxType,
+)
+
+
+async def main() -> None:
+    client = E2BSandboxClient()
+    session = await client.create(
+        options=E2BSandboxClientOptions(
+            sandbox_type=E2BSandboxType.E2B,
+            timeout=900,
+            pause_on_exit=True,
+        )
+    )
+
+    try:
+        agent = SandboxAgent(
+            name="Workspace Inspector",
+            model="gpt-5.4",
+            instructions=(
+                "Inspect the workspace, explain what files exist, and summarize the project."
+            ),
+            model_settings=ModelSettings(tool_choice="required"),
+        )
+
+        result = await Runner.run(
+            agent,
+            "Look around the workspace and summarize what you find.",
+            run_config=RunConfig(sandbox=SandboxRunConfig(session=session)),
+        )
+        print(result.final_output)
+    finally:
+        await session.shutdown()
+
+
+asyncio.run(main())
+```
+
+---
+
+## Build an app with multiple versions
+
+A common pattern is to start from the same starter app and create multiple versions in separate sandboxes — useful when comparing a first pass with a polished revision, or generating live preview URLs for each version.
+
+Based on the [`homepage_vite_basic_updated.ipynb`](https://github.com/openai/openai-agents-python/blob/main/examples/sandbox/e2b_demos/homepage_vite_basic_updated.ipynb) notebook from the Agents SDK repo.
+
+### Define a manifest
+
+A `Manifest` describes the starter files your agent will work with. Each entry is a `File` with its content encoded as bytes. This lets you seed multiple sandboxes from the same baseline — useful when comparing different versions of an app.
+
+```python
+from agents.sandbox import Manifest
+from agents.sandbox.entries import File
+
+def build_manifest() -> Manifest:
+    return Manifest(
+        entries={
+            "package.json": File(content=PACKAGE_JSON.encode()),
+            "index.html": File(content=INDEX_HTML.encode()),
+            "vite.config.js": File(content=VITE_CONFIG_JS.encode()),
+            "src/main.tsx": File(content=MAIN_TSX.encode()),
+            "src/App.tsx": File(content=APP_TSX.encode()),
+        }
+    )
+```
+
+### Create a sandbox session
+
+Create a sandbox session with the manifest, exposed ports for live previews, and internet access so the agent can install npm packages.
+
+```python
+from agents.extensions.sandbox import (
+    E2BSandboxClient,
+    E2BSandboxClientOptions,
+    E2BSandboxType,
+)
+
+session = await E2BSandboxClient().create(
+    manifest=build_manifest(),
+    options=E2BSandboxClientOptions(
+        sandbox_type=E2BSandboxType.E2B,
+        timeout=1800,
+        exposed_ports=(4173,),
+        allow_internet_access=True,
+        pause_on_exit=True,
+    ),
+)
+await session.start()
+```
+
+### Run the agent
+
+Build a `SandboxAgent` with capabilities like `ApplyPatch` and `Shell`, then run it against the sandbox session.
+
+```python
+from agents import ModelSettings, Runner
+from agents.run import RunConfig
+from agents.sandbox import SandboxAgent, SandboxRunConfig
+from agents.sandbox.capabilities import ApplyPatch, Shell
+
+agent = SandboxAgent(
+    name="E2B Vite Builder",
+    model="gpt-5.4-mini",
+    instructions="Update the Vite app in the sandbox workspace and return a concise summary.",
+    default_manifest=build_manifest(),
+    capabilities=[ApplyPatch(), Shell()],
+    model_settings=ModelSettings(tool_choice="required"),
+)
+
+result = await Runner.run(
+    agent,
+    "Make the basic version now.",
+    run_config=RunConfig(sandbox=SandboxRunConfig(session=session)),
+)
+```
+
+### Start a preview server
+
+After the agent finishes, install dependencies, start the Vite dev server, and resolve the exposed port to get a live preview URL.
+
+```python
+await session.exec(
+    "sh", "-lc",
+    (
+        "npm install >/tmp/e2b-demo-npm-install.log 2>&1 && "
+        "nohup npm run dev -- --host 0.0.0.0 --port 4173 "
+        ">/tmp/e2b-demo-vite.log 2>&1 &"
+    ),
+    shell=False,
+    timeout=120,
+)
+preview_url = (await session.resolve_exposed_port(4173)).url_for("http")
+```
+
+### Full example
+
+The complete `run_version()` helper ties all the steps above together. Call it once per version to get isolated sandboxes with their own preview URLs. Based on the [`homepage_vite_basic_updated.ipynb`](https://github.com/openai/openai-agents-python/blob/main/examples/sandbox/e2b_demos/homepage_vite_basic_updated.ipynb) notebook from the Agents SDK repo.
+
+```python expandable
+from agents import ModelSettings, Runner
+from agents.run import RunConfig
+from agents.sandbox import Manifest, SandboxAgent, SandboxRunConfig
+from agents.sandbox.capabilities import ApplyPatch, Shell
+from agents.sandbox.entries import File
+from agents.extensions.sandbox import (
+    E2BSandboxClient,
+    E2BSandboxClientOptions,
+    E2BSandboxType,
+)
+
+
+def build_manifest() -> Manifest:
+    return Manifest(
+        entries={
+            "package.json": File(content=PACKAGE_JSON.encode()),
+            "index.html": File(content=INDEX_HTML.encode()),
+            "vite.config.js": File(content=VITE_CONFIG_JS.encode()),
+            "src/main.tsx": File(content=MAIN_TSX.encode()),
+            "src/App.tsx": File(content=APP_TSX.encode()),
+        }
+    )
+
+
+async def run_version(version_name: str, version_prompt: str) -> dict[str, str]:
+    session = await E2BSandboxClient().create(
+        manifest=build_manifest(),
+        options=E2BSandboxClientOptions(
+            sandbox_type=E2BSandboxType.E2B,
+            timeout=1800,
+            exposed_ports=(4173,),
+            allow_internet_access=True,
+            pause_on_exit=True,
+        ),
+    )
+    await session.start()
+
+    agent = SandboxAgent(
+        name=f"E2B Vite {version_name.title()} Builder",
+        model="gpt-5.4-mini",
+        instructions=(
+            "Update the Vite app in the sandbox workspace and return a concise summary."
+        ),
+        developer_instructions=(
+            f"Version goal: {version_prompt}\n"
+            "Start from the tiny Vite starter. You may create src/styles.css if you want."
+        ),
+        default_manifest=build_manifest(),
+        capabilities=[ApplyPatch(), Shell()],
+        model_settings=ModelSettings(tool_choice="required"),
+    )
+
+    result = await Runner.run(
+        agent,
+        f"Make the {version_name} version now.",
+        run_config=RunConfig(sandbox=SandboxRunConfig(session=session)),
+    )
+
+    await session.exec(
+        "sh", "-lc",
+        (
+            "npm install >/tmp/e2b-demo-npm-install.log 2>&1 && "
+            "nohup npm run dev -- --host 0.0.0.0 --port 4173 "
+            ">/tmp/e2b-demo-vite.log 2>&1 &"
+        ),
+        shell=False,
+        timeout=120,
+    )
+    preview_url = (await session.resolve_exposed_port(4173)).url_for("http")
+
+    return {
+        "summary": str(result.final_output),
+        "preview_url": preview_url,
+    }
+```
+
+---
+
+## MCP-powered research agents
+
+You can create sandboxes with [MCP](https://modelcontextprotocol.io/) servers enabled, then connect the Agents SDK to the sandbox's MCP gateway. This gives you an agent that can discover sources with search-oriented MCP servers, verify pages in a browser, and keep all of that execution inside the sandbox.
+
+The Agents SDK repo includes a concrete example in [`deep_research_mcp.py`](https://github.com/openai/openai-agents-python/blob/main/examples/sandbox/e2b_demos/deep_research_mcp.py).
+
+### Configure MCP servers
+
+Pass MCP server configurations when creating the sandbox session. This example enables [Browserbase](https://www.browserbase.com/) for browser automation and [Exa](https://exa.ai/) for search.
+
+```python
+session = await client.create(
+    options=E2BSandboxClientOptions(
+        sandbox_type=E2BSandboxType.E2B,
+        timeout=900,
+        pause_on_exit=True,
+        mcp={
+            "browserbase": {
+                "apiKey": os.environ["BROWSERBASE_API_KEY"],
+                "geminiApiKey": os.environ["GEMINI_API_KEY"],
+                "projectId": os.environ["BROWSERBASE_PROJECT_ID"],
+            },
+            "exa": {
+                "apiKey": os.environ["EXA_API_KEY"],
+            },
+        },
+    ),
+)
+```
+
+### Connect to the MCP gateway
+
+Use `MCPServerStreamableHttp` to connect to the sandbox's MCP gateway. This gives the agent access to all the MCP servers you configured above.
+
+```python
+from agents.mcp import MCPServerStreamableHttp
+
+async with MCPServerStreamableHttp(
+    name="E2B MCP Gateway",
+    params={
+        "url": mcp_url,
+        "headers": {"Authorization": f"Bearer {mcp_token}"},
+        "timeout": 30,
+        "sse_read_timeout": 300,
+    },
+) as server:
+    ...
+```
+
+### Run the agent
+
+Pass the MCP server to the `SandboxAgent` via `mcp_servers`. The agent can now discover and call tools from all configured MCP servers.
+
+```python
+from agents import ModelSettings, Runner
+from agents.run import RunConfig
+from agents.sandbox import SandboxAgent, SandboxRunConfig
+
+agent = SandboxAgent(
+    name="Deep Research Assistant",
+    model="gpt-5.4",
+    instructions=(
+        "Use Exa to discover strong sources and Browserbase to verify important claims."
+    ),
+    mcp_servers=[server],
+    model_settings=ModelSettings(tool_choice="required"),
+)
+
+result = await Runner.run(
+    agent,
+    "Research browser automation infrastructure for AI agents.",
+    run_config=RunConfig(sandbox=SandboxRunConfig(session=session)),
+)
+```
+
+### Full example
+
+The complete script combining session creation, MCP gateway connection, and agent execution.
+
+```python expandable
+from agents import ModelSettings, Runner
+from agents.mcp import MCPServerStreamableHttp
+from agents.run import RunConfig
+from agents.sandbox import SandboxAgent, SandboxRunConfig
+
+session = await client.create(
+    options=E2BSandboxClientOptions(
+        sandbox_type=E2BSandboxType.E2B,
+        timeout=900,
+        pause_on_exit=True,
+        mcp={
+            "browserbase": {
+                "apiKey": os.environ["BROWSERBASE_API_KEY"],
+                "geminiApiKey": os.environ["GEMINI_API_KEY"],
+                "projectId": os.environ["BROWSERBASE_PROJECT_ID"],
+            },
+            "exa": {
+                "apiKey": os.environ["EXA_API_KEY"],
+            },
+        },
+    ),
+)
+
+async with MCPServerStreamableHttp(
+    name="E2B MCP Gateway",
+    params={
+        "url": mcp_url,
+        "headers": {"Authorization": f"Bearer {mcp_token}"},
+        "timeout": 30,
+        "sse_read_timeout": 300,
+    },
+) as server:
+    agent = SandboxAgent(
+        name="Deep Research Assistant",
+        model="gpt-5.4",
+        instructions=(
+            "Use Exa to discover strong sources and Browserbase to verify important claims."
+        ),
+        mcp_servers=[server],
+        model_settings=ModelSettings(tool_choice="required"),
+    )
+
+    result = await Runner.run(
+        agent,
+        "Research browser automation infrastructure for AI agents.",
+        run_config=RunConfig(sandbox=SandboxRunConfig(session=session)),
+    )
+```
+
+---
+
+## Parallel sandbox workers
+
+Use one coordinator agent to launch multiple specialized review or analysis lanes across separate sandboxes. Each lane runs in its own isolated environment, and the coordinator synthesizes the results into a single summary.
+
+The Agents SDK repo includes a concrete example in [`fullstack_code_review_parallel.py`](https://github.com/openai/openai-agents-python/blob/main/examples/sandbox/e2b_demos/fullstack_code_review_parallel.py). That example uses separate E2B-backed lanes for frontend review, backend review, and git tree review.
+
+### Define the agents
+
+Create specialized `SandboxAgent` instances for each review lane, plus a regular `Agent` as the coordinator that will synthesize the results.
+
+```python
+from agents import Agent
+from agents.sandbox import SandboxAgent
+
+frontend_agent = SandboxAgent(
+    name="Frontend Reviewer",
+    model="gpt-5.4",
+    instructions="Review the rendered frontend and identify UX and code risks.",
+)
+
+backend_agent = SandboxAgent(
+    name="Backend Reviewer",
+    model="gpt-5.4",
+    instructions="Review the API implementation and identify validation and auth risks.",
+)
+
+coordinator = Agent(
+    name="Review Coordinator",
+    model="gpt-5.4",
+    instructions=(
+        "Run the available review lanes, compare their evidence, and produce a single summary."
+    ),
+)
+```
+
+### Run the lanes
+
+Run each review agent against its own sandbox session. The lanes are independent and can run concurrently.
+
+```python
+from agents import Runner
+from agents.run import RunConfig
+from agents.sandbox import SandboxRunConfig
+
+frontend_result = await Runner.run(
+    frontend_agent,
+    "Review the frontend workspace.",
+    run_config=RunConfig(sandbox=SandboxRunConfig(session=frontend_session)),
+)
+
+backend_result = await Runner.run(
+    backend_agent,
+    "Review the backend workspace.",
+    run_config=RunConfig(sandbox=SandboxRunConfig(session=backend_session)),
+)
+```
+
+### Synthesize the results
+
+Feed the findings from each lane into the coordinator agent to produce a single summary.
+
+```python
+final_result = await Runner.run(
+    coordinator,
+    f"Frontend findings: {frontend_result.final_output}\n\n"
+    f"Backend findings: {backend_result.final_output}",
+)
+```
+
+### Full example
+
+The complete script defining agents, running parallel review lanes, and synthesizing results.
+
+```python expandable
+from agents import Agent, Runner
+from agents.run import RunConfig
+from agents.sandbox import SandboxAgent, SandboxRunConfig
+
+frontend_agent = SandboxAgent(
+    name="Frontend Reviewer",
+    model="gpt-5.4",
+    instructions="Review the rendered frontend and identify UX and code risks.",
+)
+
+backend_agent = SandboxAgent(
+    name="Backend Reviewer",
+    model="gpt-5.4",
+    instructions="Review the API implementation and identify validation and auth risks.",
+)
+
+coordinator = Agent(
+    name="Review Coordinator",
+    model="gpt-5.4",
+    instructions=(
+        "Run the available review lanes, compare their evidence, and produce a single summary."
+    ),
+)
+
+frontend_result = await Runner.run(
+    frontend_agent,
+    "Review the frontend workspace.",
+    run_config=RunConfig(sandbox=SandboxRunConfig(session=frontend_session)),
+)
+
+backend_result = await Runner.run(
+    backend_agent,
+    "Review the backend workspace.",
+    run_config=RunConfig(sandbox=SandboxRunConfig(session=backend_session)),
+)
+
+final_result = await Runner.run(
+    coordinator,
+    f"Frontend findings: {frontend_result.final_output}\n\n"
+    f"Backend findings: {backend_result.final_output}",
+)
+```
+
+## Reference examples
+
+The OpenAI Agents SDK repository includes several complete examples demonstrating E2B sandbox integration.
+
+<CardGroup cols={2}>
+  <Card title="Basic and updated app" icon="code" href="https://github.com/openai/openai-agents-python/blob/main/examples/sandbox/e2b_demos/homepage_vite_basic_updated.ipynb">
+    Build and iterate on a Vite app across isolated sandboxes
+  </Card>
+  <Card title="MCP deep research" icon="magnifying-glass" href="https://github.com/openai/openai-agents-python/blob/main/examples/sandbox/e2b_demos/deep_research_mcp.py">
+    Research agent with Browserbase and Exa via MCP
+  </Card>
+  <Card title="Parallel code review" icon="code-branch" href="https://github.com/openai/openai-agents-python/blob/main/examples/sandbox/e2b_demos/fullstack_code_review_parallel.py">
+    Multi-lane code review with a coordinator agent
+  </Card>
+  <Card title="E2B agents setup" icon="gear" href="https://github.com/openai/openai-agents-python/blob/main/examples/sandbox/e2b_demos/e2b_agents_setup.ipynb">
+    Getting started notebook for E2B sandbox integration
+  </Card>
+</CardGroup>
diff --git a/images/icons/openai-agents-sdk.svg b/images/icons/openai-agents-sdk.svg
new file mode 100644
index 00000000..bb4a9c44
--- /dev/null
+++ b/images/icons/openai-agents-sdk.svg
@@ -0,0 +1,8 @@
+<svg viewBox="0 0 512 512" xmlns="http://www.w3.org/2000/svg" fill-rule="evenodd" clip-rule="evenodd" stroke-linejoin="round" stroke-miterlimit="2">
+<style>
+  .openai-agents-sdk-path { fill: #000000; }
+  @media (prefers-color-scheme: dark) {
+    .openai-agents-sdk-path { fill: #FFFFFF; }
+  }
+</style>
+<path class="openai-agents-sdk-path" d="M474.123 209.81c11.525-34.577 7.569-72.423-10.838-103.904-27.696-48.168-83.433-72.94-137.794-61.414a127.14 127.14 0 00-95.475-42.49c-55.564 0-104.936 35.781-122.139 88.593-35.781 7.397-66.574 29.76-84.637 61.414-27.868 48.167-21.503 108.72 15.826 150.007-11.525 34.578-7.569 72.424 10.838 103.733 27.696 48.34 83.433 73.111 137.966 61.585 24.084 27.18 58.833 42.835 95.303 42.663 55.564 0 104.936-35.782 122.139-88.594 35.782-7.397 66.574-29.76 84.465-61.413 28.04-48.168 21.676-108.722-15.654-150.008v-.172zm-39.567-87.218c11.01 19.267 15.139 41.803 11.354 63.65-.688-.516-2.064-1.204-2.924-1.72l-101.152-58.49a16.965 16.965 0 00-16.687 0L206.621 194.5v-50.232l97.883-56.597c45.587-26.32 103.732-10.666 130.052 34.921zm-227.935 104.42l49.888-28.9 49.887 28.9v57.63l-49.887 28.9-49.888-28.9v-57.63zm23.223-191.81c22.364 0 43.867 7.742 61.07 22.02-.688.344-2.064 1.204-3.097 1.72L186.666 117.26c-5.161 2.925-8.258 8.43-8.258 14.45v136.934l-43.523-25.116V130.333c0-52.64 42.491-95.13 95.131-95.302l-.172.172zM52.14 168.697c11.182-19.268 28.557-34.062 49.544-41.803V247.14c0 6.02 3.097 11.354 8.258 14.45l118.354 68.295-43.695 25.288-97.711-56.425c-45.415-26.32-61.07-84.465-34.75-130.052zm26.665 220.71c-11.182-19.095-15.139-41.802-11.354-63.65.688.516 2.064 1.204 2.924 1.72l101.152 58.49a16.965 16.965 0 0016.687 0l118.354-68.467v50.232l-97.883 56.425c-45.587 26.148-103.732 10.665-130.052-34.75h.172zm204.54 87.39c-22.192 0-43.867-7.741-60.898-22.02a62.439 62.439 0 003.097-1.72l101.152-58.317c5.16-2.924 8.429-8.43 8.257-14.45V243.527l43.523 25.116v113.022c0 52.64-42.663 95.303-95.131 95.303v-.172zM461.22 343.303c-11.182 19.267-28.729 34.061-49.544 41.63V264.687c0-6.021-3.097-11.526-8.257-14.45L284.893 181.77l43.523-25.116l97.883 56.424c45.587 26.32 61.07 84.466 34.75 130.053l.172.172z" fill-rule="nonzero"/></svg>