2026-04-18 23:02:18 +00:00
131 changed files with 2228 additions and 1663 deletions
--- a/.claude/commands/post-release-testing.md
+++ b/.claude/commands/post-release-testing.md
@ -43,7 +43,7 @@ Manually verify the install script works in a fresh environment:
 ```bash
 docker run --rm alpine:latest sh -c "
  apk add --no-cache curl ca-certificates libstdc++ libgcc bash &&
-  curl -fsSL https://releases.rivet.dev/sandbox-agent/0.4.x/install.sh | sh &&
+  curl -fsSL https://releases.rivet.dev/sandbox-agent/0.3.x/install.sh | sh &&
  sandbox-agent --version
 "
 ```
--- a/CLAUDE.md
+++ b/CLAUDE.md
@ -20,7 +20,7 @@
 - For HTTP/CLI docs/examples, source of truth is:
  - `server/packages/sandbox-agent/src/router.rs`
  - `server/packages/sandbox-agent/src/cli.rs`
-- Keep docs aligned to implemented endpoints/commands only (for example ACP under `/v1/acp`, not legacy session REST APIs).
+- Keep docs aligned to implemented endpoints/commands only (for example ACP under `/v1/acp`, not legacy `/v1/sessions` APIs).

 ## Change Tracking

@ -78,3 +78,4 @@
  - `scripts/release/main.ts`
  - `scripts/release/promote-artifacts.ts`
  - `scripts/release/sdk.ts`
+  - `scripts/sandbox-testing/test-sandbox.ts`
--- a/Cargo.toml
+++ b/Cargo.toml
@ -4,7 +4,7 @@ members = ["server/packages/*", "gigacode"]
 exclude = ["factory/packages/desktop/src-tauri", "foundry/packages/desktop/src-tauri"]

 [workspace.package]
-version = "0.4.2"
+version = "0.5.0-rc.1"
 edition = "2021"
 authors = [ "Rivet Gaming, LLC <developer@rivet.gg>" ]
 license = "Apache-2.0"
@ -13,13 +13,13 @@ description = "Universal API for automatic coding agents in sandboxes. Supports

 [workspace.dependencies]
 # Internal crates
-sandbox-agent = { version = "0.4.2", path = "server/packages/sandbox-agent" }
-sandbox-agent-error = { version = "0.4.2", path = "server/packages/error" }
-sandbox-agent-agent-management = { version = "0.4.2", path = "server/packages/agent-management" }
-sandbox-agent-agent-credentials = { version = "0.4.2", path = "server/packages/agent-credentials" }
-sandbox-agent-opencode-adapter = { version = "0.4.2", path = "server/packages/opencode-adapter" }
-sandbox-agent-opencode-server-manager = { version = "0.4.2", path = "server/packages/opencode-server-manager" }
-acp-http-adapter = { version = "0.4.2", path = "server/packages/acp-http-adapter" }
+sandbox-agent = { version = "0.5.0-rc.1", path = "server/packages/sandbox-agent" }
+sandbox-agent-error = { version = "0.5.0-rc.1", path = "server/packages/error" }
+sandbox-agent-agent-management = { version = "0.5.0-rc.1", path = "server/packages/agent-management" }
+sandbox-agent-agent-credentials = { version = "0.5.0-rc.1", path = "server/packages/agent-credentials" }
+sandbox-agent-opencode-adapter = { version = "0.5.0-rc.1", path = "server/packages/opencode-adapter" }
+sandbox-agent-opencode-server-manager = { version = "0.5.0-rc.1", path = "server/packages/opencode-server-manager" }
+acp-http-adapter = { version = "0.5.0-rc.1", path = "server/packages/acp-http-adapter" }

 # Serialization
 serde = { version = "1.0", features = ["derive"] }
--- a/README.md
+++ b/README.md
@ -80,11 +80,11 @@ Import the SDK directly into your Node or browser application. Full type safety
 **Install**

 ```bash
-npm install sandbox-agent@0.4.x
+npm install sandbox-agent@0.3.x
 ```

 ```bash
-bun add sandbox-agent@0.4.x
+bun add sandbox-agent@0.3.x
 # Optional: allow Bun to run postinstall scripts for native binaries (required for SandboxAgent.start()).
 bun pm trust @sandbox-agent/cli-linux-x64 @sandbox-agent/cli-linux-arm64 @sandbox-agent/cli-darwin-arm64 @sandbox-agent/cli-darwin-x64 @sandbox-agent/cli-win32-x64
 ```
@ -135,7 +135,7 @@ Run as an HTTP server and connect from any language. Deploy to E2B, Daytona, Ver

 ```bash
 # Install it
-curl -fsSL https://releases.rivet.dev/sandbox-agent/0.4.x/install.sh | sh
+curl -fsSL https://releases.rivet.dev/sandbox-agent/0.3.x/install.sh | sh
 # Run it
 sandbox-agent server --token "$SANDBOX_TOKEN" --host 127.0.0.1 --port 2468
 ```
@ -159,12 +159,12 @@ sandbox-agent server --no-token --host 127.0.0.1 --port 2468
 Install the CLI wrapper (optional but convenient):

 ```bash
-npm install -g @sandbox-agent/cli@0.4.x
+npm install -g @sandbox-agent/cli@0.3.x
 ```

 ```bash
 # Allow Bun to run postinstall scripts for native binaries.
-bun add -g @sandbox-agent/cli@0.4.x
+bun add -g @sandbox-agent/cli@0.3.x
 bun pm -g trust @sandbox-agent/cli-linux-x64 @sandbox-agent/cli-linux-arm64 @sandbox-agent/cli-darwin-arm64 @sandbox-agent/cli-darwin-x64 @sandbox-agent/cli-win32-x64
 ```

@ -179,11 +179,11 @@ sandbox-agent api sessions send-message-stream my-session --message "Hello" --en
 You can also use npx like:

 ```bash
-npx @sandbox-agent/cli@0.4.x --help
+npx @sandbox-agent/cli@0.3.x --help
 ```

 ```bash
-bunx @sandbox-agent/cli@0.4.x --help
+bunx @sandbox-agent/cli@0.3.x --help
 ```

 [CLI documentation](https://sandboxagent.dev/docs/cli)
--- a/docs/agent-sessions.mdx
+++ b/docs/agent-sessions.mdx
@ -51,108 +51,6 @@ await session.prompt([
 unsubscribe();
 ```

-### Event types
-
-Each event's `payload` contains a session update. The `sessionUpdate` field identifies the type.
-
-<AccordionGroup>
-<Accordion title="agent_message_chunk">
-Streamed text or content from the agent's response.
-
-```json
-{
-  "sessionUpdate": "agent_message_chunk",
-  "content": { "type": "text", "text": "Here's how the repository is structured..." }
-}
-```
-</Accordion>
-
-<Accordion title="agent_thought_chunk">
-Internal reasoning from the agent (chain-of-thought / extended thinking).
-
-```json
-{
-  "sessionUpdate": "agent_thought_chunk",
-  "content": { "type": "text", "text": "I should start by looking at the project structure..." }
-}
-```
-</Accordion>
-
-<Accordion title="user_message_chunk">
-Echo of the user's prompt being processed.
-
-```json
-{
-  "sessionUpdate": "user_message_chunk",
-  "content": { "type": "text", "text": "Summarize the repository structure." }
-}
-```
-</Accordion>
-
-<Accordion title="tool_call">
-The agent invoked a tool (file edit, terminal command, etc.).
-
-```json
-{
-  "sessionUpdate": "tool_call",
-  "toolCallId": "tc_abc123",
-  "title": "Read file",
-  "status": "in_progress",
-  "rawInput": { "path": "/src/index.ts" }
-}
-```
-</Accordion>
-
-<Accordion title="tool_call_update">
-Progress or result update for an in-progress tool call.
-
-```json
-{
-  "sessionUpdate": "tool_call_update",
-  "toolCallId": "tc_abc123",
-  "status": "completed",
-  "content": [{ "type": "text", "text": "import express from 'express';\n..." }]
-}
-```
-</Accordion>
-
-<Accordion title="plan">
-The agent's execution plan for the current task.
-
-```json
-{
-  "sessionUpdate": "plan",
-  "entries": [
-    { "content": "Read the project structure", "status": "completed" },
-    { "content": "Identify main entrypoints", "status": "in_progress" },
-    { "content": "Write summary", "status": "pending" }
-  ]
-}
-```
-</Accordion>
-
-<Accordion title="usage_update">
-Token usage metrics for the current turn.
-
-```json
-{
-  "sessionUpdate": "usage_update"
-}
-```
-</Accordion>
-
-<Accordion title="session_info_update">
-Session metadata changed (e.g. agent-generated title).
-
-```json
-{
-  "sessionUpdate": "session_info_update",
-  "title": "Repository structure analysis"
-}
-```
-</Accordion>
-</AccordionGroup>
-
 ## Fetch persisted event history

 ```ts
--- a/docs/architecture.mdx
+++ b/docs/architecture.mdx
@ -56,7 +56,7 @@ Agents are installed lazily on first use. To avoid the cold-start delay, pre-ins
 sandbox-agent install-agent --all
 ```

-The `rivetdev/sandbox-agent:0.4.2-full` Docker image ships with all agents pre-installed.
+The `rivetdev/sandbox-agent:0.5.0-rc.1-full` Docker image ships with all agents pre-installed.

 ## Production-ready agent orchestration

--- a/docs/deploy/boxlite.mdx
+++ b/docs/deploy/boxlite.mdx
@ -20,7 +20,7 @@ that BoxLite can load directly (BoxLite has its own image store separate from Do
 ```dockerfile
 FROM node:22-bookworm-slim
 RUN apt-get update && apt-get install -y curl ca-certificates && rm -rf /var/lib/apt/lists/*
-RUN curl -fsSL https://releases.rivet.dev/sandbox-agent/0.4.x/install.sh | sh
+RUN curl -fsSL https://releases.rivet.dev/sandbox-agent/0.3.x/install.sh | sh
 RUN sandbox-agent install-agent claude
 RUN sandbox-agent install-agent codex
 ```
--- a/docs/deploy/cloudflare.mdx
+++ b/docs/deploy/cloudflare.mdx
@ -25,7 +25,7 @@ cd my-sandbox
 ```dockerfile
 FROM cloudflare/sandbox:0.7.0

-RUN curl -fsSL https://releases.rivet.dev/sandbox-agent/0.4.x/install.sh | sh
+RUN curl -fsSL https://releases.rivet.dev/sandbox-agent/0.3.x/install.sh | sh
 RUN sandbox-agent install-agent claude && sandbox-agent install-agent codex

 EXPOSE 8000
@ -36,7 +36,7 @@ EXPOSE 8000
 For standalone scripts, use the `cloudflare` provider:

 ```bash
-npm install sandbox-agent@0.4.x @cloudflare/sandbox
+npm install sandbox-agent@0.3.x @cloudflare/sandbox
 ```

 ```typescript
--- a/docs/deploy/computesdk.mdx
+++ b/docs/deploy/computesdk.mdx
@ -14,7 +14,7 @@ description: "Deploy Sandbox Agent using ComputeSDK's provider-agnostic sandbox
 ## TypeScript example

 ```bash
-npm install sandbox-agent@0.4.x computesdk
+npm install sandbox-agent@0.3.x computesdk
 ```

 ```typescript
@ -27,11 +27,7 @@ if (process.env.OPENAI_API_KEY) envs.OPENAI_API_KEY = process.env.OPENAI_API_KEY

 const sdk = await SandboxAgent.start({
  sandbox: computesdk({
-    create: {
-      envs,
-      image: process.env.COMPUTESDK_IMAGE,
-      templateId: process.env.COMPUTESDK_TEMPLATE_ID,
-    },
+    create: { envs },
  }),
 });

@ -47,7 +43,6 @@ try {
 ```

 The `computesdk` provider handles sandbox creation, Sandbox Agent installation, agent setup, and server startup automatically. ComputeSDK routes to your configured provider behind the scenes.
-The `create` option now forwards the full ComputeSDK sandbox-create payload, including provider-specific fields such as `image` and `templateId` when the selected provider supports them.

 Before calling `SandboxAgent.start()`, configure ComputeSDK with your provider:

--- a/docs/deploy/daytona.mdx
+++ b/docs/deploy/daytona.mdx
@ -16,7 +16,7 @@ See [Daytona network limits](https://www.daytona.io/docs/en/network-limits/).
 ## TypeScript example

 ```bash
-npm install sandbox-agent@0.4.x @daytonaio/sdk
+npm install sandbox-agent@0.3.x @daytonaio/sdk
 ```

 ```typescript
@ -44,7 +44,7 @@ try {
 }
 ```

-The `daytona` provider uses the `rivetdev/sandbox-agent:0.4.2-full` image by default and starts the server automatically.
+The `daytona` provider uses the `rivetdev/sandbox-agent:0.5.0-rc.1-full` image by default and starts the server automatically.

 ## Using snapshots for faster startup

@ -61,7 +61,7 @@ if (!hasSnapshot) {
    name: SNAPSHOT,
    image: Image.base("ubuntu:22.04").runCommands(
      "apt-get update && apt-get install -y curl ca-certificates",
-      "curl -fsSL https://releases.rivet.dev/sandbox-agent/0.4.x/install.sh | sh",
+      "curl -fsSL https://releases.rivet.dev/sandbox-agent/0.3.x/install.sh | sh",
      "sandbox-agent install-agent claude",
      "sandbox-agent install-agent codex",
    ),
--- a/docs/deploy/docker.mdx
+++ b/docs/deploy/docker.mdx
@ -15,11 +15,11 @@ Run the published full image with all supported agents pre-installed:
 docker run --rm -p 3000:3000 \
  -e ANTHROPIC_API_KEY="$ANTHROPIC_API_KEY" \
  -e OPENAI_API_KEY="$OPENAI_API_KEY" \
-  rivetdev/sandbox-agent:0.4.2-full \
+  rivetdev/sandbox-agent:0.5.0-rc.1-full \
  server --no-token --host 0.0.0.0 --port 3000
 ```

-The `0.4.2-full` tag pins the exact version. The moving `full` tag is also published for contributors who want the latest full image.
+The `0.5.0-rc.1-full` tag pins the exact version. The moving `full` tag is also published for contributors who want the latest full image.

 If you also want the desktop API inside the container, install desktop dependencies before starting the server:

@ -31,7 +31,7 @@ docker run --rm -p 3000:3000 \
    apt-get update && \
    DEBIAN_FRONTEND=noninteractive apt-get install -y curl ca-certificates bash libstdc++6 && \
    rm -rf /var/lib/apt/lists/* && \
-    curl -fsSL https://releases.rivet.dev/sandbox-agent/0.4.x/install.sh | sh && \
+    curl -fsSL https://releases.rivet.dev/sandbox-agent/0.3.x/install.sh | sh && \
    sandbox-agent install desktop --yes && \
    sandbox-agent server --no-token --host 0.0.0.0 --port 3000"
 ```
@ -52,7 +52,7 @@ const docker = new Docker();
 const PORT = 3000;

 const container = await docker.createContainer({
-  Image: "rivetdev/sandbox-agent:0.4.2-full",
+  Image: "rivetdev/sandbox-agent:0.5.0-rc.1-full",
  Cmd: ["server", "--no-token", "--host", "0.0.0.0", "--port", `${PORT}`],
  Env: [
    `ANTHROPIC_API_KEY=${process.env.ANTHROPIC_API_KEY}`,
@ -86,7 +86,7 @@ RUN apt-get update && apt-get install -y --no-install-recommends \
    bash ca-certificates curl git && \
    rm -rf /var/lib/apt/lists/*

-RUN curl -fsSL https://releases.rivet.dev/sandbox-agent/0.4.x/install.sh | sh && \
+RUN curl -fsSL https://releases.rivet.dev/sandbox-agent/0.3.x/install.sh | sh && \
    sandbox-agent install-agent --all

 RUN useradd -m -s /bin/bash sandbox
--- a/docs/deploy/e2b.mdx
+++ b/docs/deploy/e2b.mdx
@ -11,7 +11,7 @@ description: "Deploy Sandbox Agent inside an E2B sandbox."
 ## TypeScript example

 ```bash
-npm install sandbox-agent@0.4.x @e2b/code-interpreter
+npm install sandbox-agent@0.3.x @e2b/code-interpreter
 ```

 ```typescript
@ -21,11 +21,9 @@ import { e2b } from "sandbox-agent/e2b";
 const envs: Record<string, string> = {};
 if (process.env.ANTHROPIC_API_KEY) envs.ANTHROPIC_API_KEY = process.env.ANTHROPIC_API_KEY;
 if (process.env.OPENAI_API_KEY) envs.OPENAI_API_KEY = process.env.OPENAI_API_KEY;
-const template = process.env.E2B_TEMPLATE;

 const sdk = await SandboxAgent.start({
  sandbox: e2b({
-    template,
    create: { envs },
  }),
 });
@ -43,10 +41,7 @@ try {

 The `e2b` provider handles sandbox creation, Sandbox Agent installation, agent setup, and server startup automatically. Sandboxes pause by default instead of being deleted, and reconnecting with the same `sandboxId` resumes them automatically.

-Pass `template` when you want to start from a custom E2B template alias or template ID. E2B base-image selection happens when you build the template, then `sandbox-agent/e2b` uses that template at sandbox creation time.
-
 ## Faster cold starts

 For faster startup, create a custom E2B template with Sandbox Agent and target agents pre-installed.
-Build System 2.0 also lets you choose the template's base image in code.
-See [E2B Custom Templates](https://e2b.dev/docs/sandbox-template) and [E2B Base Images](https://e2b.dev/docs/template/base-image).
+See [E2B Custom Templates](https://e2b.dev/docs/sandbox-template).
--- a/docs/deploy/foundry-self-hosting.mdx
+++ b/docs/deploy/foundry-self-hosting.mdx
@ -0,0 +1,155 @@
+---
+title: "Foundry Self-Hosting"
+description: "Environment, credentials, and deployment setup for Sandbox Agent Foundry auth, GitHub, and billing."
+---
+
+This guide documents the deployment contract for the Foundry product surface: app auth, GitHub onboarding, repository import, and billing.
+
+It also covers the local-development bootstrap, which loads dotenv files (`.env.development.local` and `.env.development`) only when `NODE_ENV=development`.
+
+## Local Development
+
+For local development, the Foundry backend supports a development-only dotenv bootstrap:
+
+- It loads `.env.development.local` and `.env.development`
+- It does this **only** when `NODE_ENV=development`
+- It does **not** load dotenv files in production
+
+The example file lives at [`/.env.development.example`](https://github.com/rivet-dev/sandbox-agent/blob/main/.env.development.example).
+
+To use it locally:
+
+```bash
+cp .env.development.example .env.development
+```
+
+Run the backend with:
+
+```bash
+just foundry-backend-start
+```
+
+That recipe sets `NODE_ENV=development`, which enables the dotenv loader.
+
+### Local Defaults
+
+These values can be safely defaulted for local development:
+
+- `APP_URL=http://localhost:4173`
+- `BETTER_AUTH_URL=http://localhost:7741`
+- `BETTER_AUTH_SECRET=sandbox-agent-foundry-development-only-change-me`
+- `GITHUB_REDIRECT_URI=http://localhost:7741/v1/auth/callback/github`
+
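+These are development-only values. Do not reuse them in production; in particular, generate a strong random `BETTER_AUTH_SECRET` for any real deployment.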
+
+## Production Environment
+
+For production or self-hosting, set these as real environment variables in your deployment platform. Do not rely on dotenv file loading.
+
+### App/Auth
+
+| Variable | Required | Notes |
+|---|---:|---|
+| `APP_URL` | Yes | Public frontend origin |
+| `BETTER_AUTH_URL` | Yes | Public auth base URL |
+| `BETTER_AUTH_SECRET` | Yes | Strong random secret for auth/session signing |
+
+### GitHub OAuth
+
+| Variable | Required | Notes |
+|---|---:|---|
+| `GITHUB_CLIENT_ID` | Yes | GitHub OAuth app client id |
+| `GITHUB_CLIENT_SECRET` | Yes | GitHub OAuth app client secret |
+| `GITHUB_REDIRECT_URI` | Yes | GitHub OAuth callback URL |
+
+Use GitHub OAuth for:
+
+- user sign-in
+- user identity
+- org selection
+- access to the signed-in user’s GitHub context
+
+## GitHub App
+
+If your Foundry deployment uses GitHub App-backed organization install and repo import, also configure:
+
+| Variable | Required | Notes |
+|---|---:|---|
+| `GITHUB_APP_ID` | Yes | GitHub App id |
+| `GITHUB_APP_CLIENT_ID` | Yes | GitHub App client id |
+| `GITHUB_APP_CLIENT_SECRET` | Yes | GitHub App client secret |
+| `GITHUB_APP_PRIVATE_KEY` | Yes | PEM private key for installation auth |
+
+For `.env.development` and `.env.development.local`, store `GITHUB_APP_PRIVATE_KEY` as a quoted single-line value with `\n` escapes instead of raw multi-line PEM text.
+
+Recommended GitHub App permissions:
+
+- Repository `Metadata: Read`
+- Repository `Contents: Read & Write`
+- Repository `Pull requests: Read & Write`
+- Repository `Checks: Read`
+- Repository `Commit statuses: Read`
+
+Set the webhook URL to `https://<your-backend-host>/v1/webhooks/github` and generate a webhook secret. Store the secret as `GITHUB_WEBHOOK_SECRET`.
+
+Webhook delivery is required, not optional. Foundry depends on GitHub App webhook delivery for installation lifecycle changes, repo access changes, and ongoing repo / pull request sync. If the GitHub App is not installed for the workspace, or webhook delivery is misconfigured, Foundry will remain in an install / reconnect state and core GitHub-backed functionality will not work correctly.
+
+Recommended webhook subscriptions:
+
+- `installation`
+- `installation_repositories`
+- `pull_request`
+- `pull_request_review`
+- `pull_request_review_comment`
+- `push`
+- `create`
+- `delete`
+- `check_suite`
+- `check_run`
+- `status`
+
+Use the GitHub App for:
+
+- installation/reconnect state
+- org repo import
+- repository sync
+- PR creation and updates
+
+Use GitHub OAuth for:
+
+- who the user is
+- which orgs they can choose
+
+## Stripe
+
+For live billing, configure:
+
+| Variable | Required | Notes |
+|---|---:|---|
+| `STRIPE_SECRET_KEY` | Yes | Server-side Stripe secret key |
+| `STRIPE_PUBLISHABLE_KEY` | Yes | Client-side Stripe publishable key |
+| `STRIPE_WEBHOOK_SECRET` | Yes | Signing secret for billing webhooks |
+| `STRIPE_PRICE_TEAM` | Yes | Stripe price id for the Team plan checkout session |
+
+Stripe should own:
+
+- hosted checkout
+- billing portal
+- subscription status
+- invoice history
+- webhook-driven state sync
+
+## Mock Invariant
+
+Foundry’s mock client path should continue to work end to end even when the real auth/GitHub/Stripe path exists.
+
+That includes:
+
+- sign-in
+- org selection/import
+- settings
+- billing UI
+- workspace/task/session flow
+- seat accrual
+
+Use mock mode for deterministic UI review and local product development. Use the real env-backed path for integration and self-hosting.
--- a/docs/deploy/local.mdx
+++ b/docs/deploy/local.mdx
@ -9,7 +9,7 @@ For local development, run Sandbox Agent directly on your machine.

 ```bash
 # Install
-curl -fsSL https://releases.rivet.dev/sandbox-agent/0.4.x/install.sh | sh
+curl -fsSL https://releases.rivet.dev/sandbox-agent/0.3.x/install.sh | sh

 # Run
 sandbox-agent server --no-token --host 127.0.0.1 --port 2468
@ -20,12 +20,12 @@ Or with npm/Bun:
 <Tabs>
  <Tab title="npx">
    ```bash
-    npx @sandbox-agent/cli@0.4.x server --no-token --host 127.0.0.1 --port 2468
+    npx @sandbox-agent/cli@0.3.x server --no-token --host 127.0.0.1 --port 2468
    ```
  </Tab>
  <Tab title="bunx">
    ```bash
-    bunx @sandbox-agent/cli@0.4.x server --no-token --host 127.0.0.1 --port 2468
+    bunx @sandbox-agent/cli@0.3.x server --no-token --host 127.0.0.1 --port 2468
    ```
  </Tab>
 </Tabs>
--- a/docs/deploy/modal.mdx
+++ b/docs/deploy/modal.mdx
@ -11,7 +11,7 @@ description: "Deploy Sandbox Agent inside a Modal sandbox."
 ## TypeScript example

 ```bash
-npm install sandbox-agent@0.4.x modal
+npm install sandbox-agent@0.3.x modal
 ```

 ```typescript
@ -21,11 +21,9 @@ import { modal } from "sandbox-agent/modal";
 const secrets: Record<string, string> = {};
 if (process.env.ANTHROPIC_API_KEY) secrets.ANTHROPIC_API_KEY = process.env.ANTHROPIC_API_KEY;
 if (process.env.OPENAI_API_KEY) secrets.OPENAI_API_KEY = process.env.OPENAI_API_KEY;
-const baseImage = process.env.MODAL_BASE_IMAGE ?? "node:22-slim";

 const sdk = await SandboxAgent.start({
  sandbox: modal({
-    image: baseImage,
    create: { secrets },
  }),
 });
@ -42,7 +40,6 @@ try {
 ```

 The `modal` provider handles app creation, image building, sandbox provisioning, agent installation, server startup, and tunnel networking automatically.
-Set `image` to change the base Docker image before Sandbox Agent and its agent binaries are layered on top. You can also pass a prebuilt Modal `Image` object.

 ## Faster cold starts

--- a/docs/deploy/vercel.mdx
+++ b/docs/deploy/vercel.mdx
@ -11,7 +11,7 @@ description: "Deploy Sandbox Agent inside a Vercel Sandbox."
 ## TypeScript example

 ```bash
-npm install sandbox-agent@0.4.x @vercel/sandbox
+npm install sandbox-agent@0.3.x @vercel/sandbox
 ```

 ```typescript
--- a/docs/docs.json
+++ b/docs/docs.json
@ -1,6 +1,6 @@
 {
  "$schema": "https://mintlify.com/docs.json",
-  "theme": "mint",
+  "theme": "willow",
  "name": "Sandbox Agent SDK",
  "appearance": {
    "default": "dark",
@ -8,8 +8,8 @@
  },
  "colors": {
    "primary": "#ff4f00",
-    "light": "#ff6a2a",
-    "dark": "#cc3f00"
+    "light": "#ff4f00",
+    "dark": "#ff4f00"
  },
  "favicon": "/favicon.svg",
  "logo": {
@ -25,13 +25,17 @@
  },
  "navbar": {
    "links": [
+      {
+        "label": "Gigacode",
+        "icon": "terminal",
+        "href": "https://github.com/rivet-dev/sandbox-agent/tree/main/gigacode"
+      },
      {
        "label": "Discord",
        "icon": "discord",
        "href": "https://discord.gg/auCecybynK"
      },
      {
-        "label": "GitHub",
        "type": "github",
        "href": "https://github.com/rivet-dev/sandbox-agent"
      }
@ -85,10 +89,13 @@
            "group": "System",
            "pages": ["file-system", "processes", "computer-use", "common-software"]
          },
+          {
+            "group": "Orchestration",
+            "pages": ["orchestration-architecture", "session-persistence", "observability", "multiplayer", "security"]
+          },
          {
            "group": "Reference",
            "pages": [
-              "troubleshooting",
              "architecture",
              "cli",
              "inspector",
@ -120,11 +127,5 @@
        ]
      }
    ]
-  },
-  "__removed": [
-	  {
-		"group": "Orchestration",
-		"pages": ["orchestration-architecture", "session-persistence", "observability", "multiplayer", "security"]
-	  }
-  ]
+  }
 }
--- a/docs/gigacode.mdx
+++ b/docs/gigacode.mdx
@ -0,0 +1,6 @@
+---
+title: Gigacode
+url: "https://github.com/rivet-dev/sandbox-agent/tree/main/gigacode"
+---
+
+
--- a/docs/openapi.json
+++ b/docs/openapi.json
@ -10,7 +10,7 @@
    "license": {
      "name": "Apache-2.0"
    },
-    "version": "0.4.2"
+    "version": "0.5.0-rc.1"
  },
  "servers": [
    {
--- a/docs/pi-support-plan.md
+++ b/docs/pi-support-plan.md
@ -0,0 +1,210 @@
+# Pi Agent Support Plan (pi-mono)
+
+## Implementation Status Update
+
+- Runtime selection now supports two internal modes:
+  - `PerSession` (default for unknown/non-allowlisted Pi capabilities)
+  - `Shared` (allowlist-only compatibility path)
+- Pi sessions now use per-session process isolation by default, enabling true concurrent Pi sessions in Inspector and API clients.
+- Shared Pi server code remains available and is used only when capability checks allow multiplexing.
+- Session termination for per-session Pi mode hard-kills the underlying Pi process and clears queued prompts/pending waiters.
+- In-session concurrent sends are serialized with an unbounded daemon-side FIFO queue per session.
+
+## Investigation Summary
+
+### Pi CLI modes and RPC protocol
+- Pi supports multiple modes including interactive, print/JSON output, RPC, and SDK usage. JSON mode outputs a stream of JSON events suitable for parsing, and RPC mode is intended for programmatic control over stdin/stdout.
+- RPC mode is started with `pi --mode rpc` and supports options like `--provider`, `--model`, `--no-session`, and `--session-dir`.
+- The RPC protocol is newline-delimited JSON over stdin/stdout:
+  - Commands are JSON objects written to stdin.
+  - Responses are JSON objects with `type: "response"` and optional `id`.
+  - Events are JSON objects without `id`.
+- `prompt` can include images using `ImageContent` (base64 or URL) alongside text.
+- JSON/print mode (`pi -p` or `pi --print --mode json`) produces JSONL for non-interactive parsing and can resume sessions with a token.
+
+### RPC commands
+RPC commands listed in `rpc.md` include:
+- `new_session`, `get_state`, `list_sessions`, `delete_session`, `rename_session`, `clear_session`
+- `prompt`, `queue_message`, `abort`, `get_queued_messages`
+
+### RPC event types
+RPC events listed in `rpc.md` include:
+- `agent_start`, `agent_end`
+- `turn_start`, `turn_end`
+- `message_start`, `message_update`, `message_end`
+- `tool_execution_start`, `tool_execution_update`, `tool_execution_end`
+- `auto_compaction`, `auto_retry`, `hook_error`
+
+`message_update` uses `assistantMessageEvent` deltas such as:
+- `start`, `text_start`, `text_delta`, `text_end`
+- `thinking_start`, `thinking_delta`, `thinking_end`
+- `toolcall_start`, `toolcall_delta`, `toolcall_end`
+- `toolcall_args_start`, `toolcall_args_delta`, `toolcall_args_end`
+- `done`, `error`
+
+`tool_execution_update` includes `partialResult`, which is described as accumulated output so far.
+
+### Schema source locations (pi-mono)
+RPC types are documented as living in:
+- `packages/ai/src/types.ts` (Model types)
+- `packages/agent/src/types.ts` (AgentResponse types)
+- `packages/coding-agent/src/core/messages.ts` (message types)
+- `packages/coding-agent/src/modes/rpc/rpc-types.ts` (RPC protocol types)
+
+### Distribution assets
+Pi releases provide platform-specific binaries such as:
+- `pi-darwin-arm64`, `pi-darwin-x64`
+- `pi-linux-arm64`, `pi-linux-x64`
+- `pi-win-x64.zip`
+
+## Integration Decisions
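+- Original plan: follow the OpenCode pattern, i.e. a shared long-running process (stdio RPC) with session multiplexing. Per the Implementation Status Update above, per-session processes are now the default and the shared process is used only when capability checks allow multiplexing.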
+- Primary integration path is RPC streaming (`pi --mode rpc`).
+- JSON/print mode is a fallback only (diagnostics or non-interactive runs).
+- Create sessions via `new_session`; store the returned `sessionId` as `native_session_id`.
+- Use `get_state` as a re-sync path after server restarts.
+- Use `prompt` for send-message, with optional image content.
+- Convert Pi events into universal events; emit a daemon-synthesized `session.started` event on session creation, and `session.ended` only on errors/termination.
+
+## Implementation Plan
+
+### 1) Agent Identity + Capabilities
+Files:
+- `server/packages/agent-management/src/agents.rs`
+- `server/packages/sandbox-agent/src/router.rs`
+- `docs/cli.mdx`, `docs/conversion.mdx`, `docs/session-transcript-schema.mdx`
+- `README.md`, `frontend/packages/website/src/components/FAQ.tsx`
+
+Tasks:
+- Add `AgentId::Pi` with string/binary name `"pi"` and parsing rules.
+- Add Pi to `all_agents()` and agent lists.
+- Define `AgentCapabilities` for Pi:
+  - `tool_calls=true`, `tool_results=true`
+  - `text_messages=true`, `streaming_deltas=true`, `item_started=true`
+  - `reasoning=true` (from `thinking_*` deltas)
+  - `images=true` (ImageContent in `prompt`)
+  - `permissions=false`, `questions=false`, `mcp_tools=false`
+  - `shared_process=true`, `session_lifecycle=false` (no native session events)
+  - `error_events=true` (hook_error)
+  - `command_execution=false`, `file_changes=false`, `file_attachments=false`
+
+### 2) Installer and Binary Resolution
+Files:
+- `server/packages/agent-management/src/agents.rs`
+
+Tasks:
+- Add `install_pi()` that:
+  - Downloads the correct release asset per platform (`pi-<platform>`).
+  - Handles `.zip` on Windows and raw binaries elsewhere.
+  - Marks binary executable.
+- Add Pi to `AgentManager::install`, `is_installed`, `version`.
+- Version detection: try `--version`, `version`, `-V`.
+
+### 3) Schema Extraction for Pi
+Files:
+- `resources/agent-schemas/src/pi.ts` (new)
+- `resources/agent-schemas/src/index.ts`
+- `resources/agent-schemas/artifacts/json-schema/pi.json`
+- `server/packages/extracted-agent-schemas/build.rs`
+- `server/packages/extracted-agent-schemas/src/lib.rs`
+
+Tasks:
+- Implement `extractPiSchema()`:
+  - Download pi-mono sources (zip/tarball) into a temp dir.
+  - Use `ts-json-schema-generator` against `packages/coding-agent/src/modes/rpc/rpc-types.ts`.
+  - Include dependent files per `rpc.md` (ai/types, agent/types, core/messages).
+  - Extract `RpcEvent`, `RpcResponse`, `RpcCommand` unions (exact type names from source).
+- Add a fallback schema if the remote fetch fails (minimal union with event/response fields).
+- Wire pi into extractor index and artifact generation.
+
+### 4) Universal Schema Conversion (Pi -> Universal)
+Files:
+- `server/packages/universal-agent-schema/src/agents/pi.rs` (new)
+- `server/packages/universal-agent-schema/src/agents/mod.rs`
+- `server/packages/universal-agent-schema/src/lib.rs`
+- `server/packages/sandbox-agent/src/router.rs`
+
+Mapping rules:
+- `message_start` -> `item.started` (kind=message, role=assistant, native_item_id=messageId)
+- `message_update`:
+  - `text_*` -> `item.delta` (assistant text delta)
+  - `thinking_*` -> `item.delta` with `ContentPart::Reasoning` (visibility=Private)
+  - `toolcall_*` and `toolcall_args_*` -> ignore for now (tool_execution_* is authoritative)
+  - `error` -> `item.completed` with `ItemStatus::Failed` (if no later message_end)
+- `message_end` -> `item.completed` (finalize assistant message)
+- `tool_execution_start` -> `item.started` (kind=tool_call, ContentPart::ToolCall)
+- `tool_execution_update` -> `item.delta` for a synthetic tool_result item:
+  - Maintain a per-toolCallId buffer to compute delta from accumulated `partialResult`.
+- `tool_execution_end` -> `item.completed` (kind=tool_result, output from `result.content`)
+  - If `isError=true`, set item status to failed.
+- `agent_start`, `turn_start`, `turn_end`, `agent_end`, `auto_compaction`, `auto_retry`, `hook_error`:
+  - Map to `ItemKind::Status` with a label like `pi.agent_start`, `pi.auto_retry`, etc.
+  - Do not emit `session.ended` for these events.
+- If event parsing fails, emit `agent.unparsed` (source=daemon, synthetic=true) and fail tests.
+
+### 5) Shared RPC Server Integration
+Files:
+- `server/packages/sandbox-agent/src/router.rs`
+
+Tasks:
+- Add a new managed stdio server type for Pi, similar to Codex:
+  - Create `PiServer` struct with:
+    - stdin sender
+    - pending request map keyed by request id
+    - per-session native session id mapping
+  - Extend `ManagedServerKind` to include Pi.
+  - Add `ensure_pi_server()` and `spawn_pi_server()` using `pi --mode rpc`.
+  - Add a `handle_pi_server_output()` loop to parse stdout lines into events/responses.
+- Session creation:
+  - On `create_session`, ensure Pi server is running, send `new_session`, store sessionId.
+  - Register session with `server_manager.register_session` for native mapping.
+- Sending messages:
+  - Use `prompt` command; include sessionId and optional images.
+  - Emit synthetic `item.started` only if Pi does not emit `message_start`.
+
+### 6) Router + Streaming Path Changes
+Files:
+- `server/packages/sandbox-agent/src/router.rs`
+
+Tasks:
+- Add Pi handling to:
+  - `create_session` (new_session)
+  - `send_message` (prompt)
+  - `parse_agent_line` (Pi event conversion)
+  - `agent_modes` (default to `default` unless Pi exposes a mode list)
+  - `agent_supports_resume` (true if Pi supports session resume)
+
+### 7) Tests
+Files:
+- `server/packages/sandbox-agent/tests/...`
+- `server/packages/universal-agent-schema/tests/...` (if present)
+
+Tasks:
+- Unit tests for conversion:
+  - `message_start/update/end` -> item.started/delta/completed
+  - `tool_execution_*` -> tool call/result mapping with partialResult delta
+  - event parse failure -> `agent.unparsed`
+- Integration tests:
+  - Start Pi RPC server, create session, send prompt, stream events.
+  - Validate `native_session_id` mapping and event ordering.
+- Update HTTP/SSE test coverage to include Pi agent if relevant.
+
+## Risk Areas / Edge Cases
+- `tool_execution_update.partialResult` is cumulative; must compute deltas.
+- `message_update` may emit `done`/`error` without `message_end`; handle both paths.
+- No native session lifecycle events; rely on daemon synthetic events.
+- Session recovery after an RPC server restart requires calling `get_state` and re-registering sessions.
+
+## Acceptance Criteria
+- Pi appears in `/v1/agents`, CLI list, and docs.
+- `create_session` returns `native_session_id` from Pi `new_session`.
+- Streaming prompt yields universal events with proper ordering:
+  - message -> item.started/delta/completed
+  - tool execution -> tool call + tool result
+- Tests pass and no synthetic data is used in test fixtures.
+
+## Sources
+- https://upd.dev/badlogic/pi-mono/src/commit/d36e0ea07303d8a76d51b4a7bd5f0d6d3c490860/packages/coding-agent/docs/rpc.md
+- https://buildwithpi.ai/pi-cli
+- https://takopi.dev/docs/pi-cli/
+- https://upd.dev/badlogic/pi-mono/releases
--- a/docs/quickstart.mdx
+++ b/docs/quickstart.mdx
@ -64,7 +64,7 @@ icon: "rocket"
        docker run -p 2468:2468 \
          -e ANTHROPIC_API_KEY="sk-ant-..." \
          -e OPENAI_API_KEY="sk-..." \
-          rivetdev/sandbox-agent:0.4.2-full \
+          rivetdev/sandbox-agent:0.5.0-rc.1-full \
          server --no-token --host 0.0.0.0 --port 2468
        ```
      </Tab>
@ -89,7 +89,7 @@ icon: "rocket"
        Install and run the binary directly.

        ```bash
-        curl -fsSL https://releases.rivet.dev/sandbox-agent/0.4.x/install.sh | sh
+        curl -fsSL https://releases.rivet.dev/sandbox-agent/0.3.x/install.sh | sh
        sandbox-agent server --no-token --host 0.0.0.0 --port 2468
        ```
      </Tab>
@ -98,7 +98,7 @@ icon: "rocket"
        Run without installing globally.

        ```bash
-        npx @sandbox-agent/cli@0.4.x server --no-token --host 0.0.0.0 --port 2468
+        npx @sandbox-agent/cli@0.3.x server --no-token --host 0.0.0.0 --port 2468
        ```
      </Tab>

@ -106,7 +106,7 @@ icon: "rocket"
        Run without installing globally.

        ```bash
-        bunx @sandbox-agent/cli@0.4.x server --no-token --host 0.0.0.0 --port 2468
+        bunx @sandbox-agent/cli@0.3.x server --no-token --host 0.0.0.0 --port 2468
        ```
      </Tab>

@ -114,7 +114,7 @@ icon: "rocket"
        Install globally, then run.

        ```bash
-        npm install -g @sandbox-agent/cli@0.4.x
+        npm install -g @sandbox-agent/cli@0.3.x
        sandbox-agent server --no-token --host 0.0.0.0 --port 2468
        ```
      </Tab>
@ -123,7 +123,7 @@ icon: "rocket"
        Install globally, then run.

        ```bash
-        bun add -g @sandbox-agent/cli@0.4.x
+        bun add -g @sandbox-agent/cli@0.3.x
        # Allow Bun to run postinstall scripts for native binaries (required for SandboxAgent.start()).
        bun pm -g trust @sandbox-agent/cli-linux-x64 @sandbox-agent/cli-linux-arm64 @sandbox-agent/cli-darwin-arm64 @sandbox-agent/cli-darwin-x64 @sandbox-agent/cli-win32-x64
        sandbox-agent server --no-token --host 0.0.0.0 --port 2468
@ -134,7 +134,7 @@ icon: "rocket"
        For local development, use `SandboxAgent.start()` to spawn and manage the server as a subprocess.

        ```bash
-        npm install sandbox-agent@0.4.x
+        npm install sandbox-agent@0.3.x
        ```

        ```typescript
@ -148,7 +148,7 @@ icon: "rocket"
        For local development, use `SandboxAgent.start()` to spawn and manage the server as a subprocess.

        ```bash
-        bun add sandbox-agent@0.4.x
+        bun add sandbox-agent@0.3.x
        # Allow Bun to run postinstall scripts for native binaries (required for SandboxAgent.start()).
        bun pm trust @sandbox-agent/cli-linux-x64 @sandbox-agent/cli-linux-arm64 @sandbox-agent/cli-darwin-arm64 @sandbox-agent/cli-darwin-x64 @sandbox-agent/cli-win32-x64
        ```
--- a/docs/react-components.mdx
+++ b/docs/react-components.mdx
@ -17,7 +17,7 @@ Current exports:
 ## Install

 ```bash
-npm install @sandbox-agent/react@0.4.x
+npm install @sandbox-agent/react@0.3.x
 ```

 ## Full example
--- a/docs/sdk-overview.mdx
+++ b/docs/sdk-overview.mdx
@ -11,12 +11,12 @@ The TypeScript SDK is centered on `sandbox-agent` and its `SandboxAgent` class.
 <Tabs>
  <Tab title="npm">
    ```bash
-    npm install sandbox-agent@0.4.x
+    npm install sandbox-agent@0.3.x
    ```
  </Tab>
  <Tab title="bun">
    ```bash
-    bun add sandbox-agent@0.4.x
+    bun add sandbox-agent@0.3.x
    # Allow Bun to run postinstall scripts for native binaries (required for SandboxAgent.start()).
    bun pm trust @sandbox-agent/cli-linux-x64 @sandbox-agent/cli-linux-arm64 @sandbox-agent/cli-darwin-arm64 @sandbox-agent/cli-darwin-x64 @sandbox-agent/cli-win32-x64
    ```
@ -26,7 +26,7 @@ The TypeScript SDK is centered on `sandbox-agent` and its `SandboxAgent` class.
 ## Optional React components

 ```bash
-npm install @sandbox-agent/react@0.4.x
+npm install @sandbox-agent/react@0.3.x
 ```

 ## Create a client
--- a/docs/session-transcript-schema.mdx
+++ b/docs/session-transcript-schema.mdx
@ -0,0 +1,388 @@
+---
+title: "Session Transcript Schema"
+description: "Universal event schema for session transcripts across all agents."
+---
+
+Each coding agent outputs events in its own native format. The sandbox-agent converts these into a universal event schema, giving you a consistent session transcript regardless of which agent you use.
+
+The schema is defined in [OpenAPI format](https://github.com/rivet-dev/sandbox-agent/blob/main/docs/openapi.json). See the [HTTP API Reference](/api-reference) for endpoint documentation.
+
+## Coverage Matrix
+
+This table shows which features of each agent appear in the universal event stream. All agents retain their full native feature coverage—the table only reflects what is normalized into the schema.
+
+| Feature            | Claude | Codex | OpenCode     | Amp          | Pi (RPC)     |
+|--------------------|:------:|:-----:|:------------:|:------------:|:------------:|
+| Stability          | Stable | Stable| Experimental | Experimental | Experimental |
+| Text Messages      |   ✓    |   ✓   |      ✓       |      ✓       |      ✓       |
+| Tool Calls         |   ✓    |   ✓   |      ✓       |      ✓       |      ✓       |
+| Tool Results       |   ✓    |   ✓   |      ✓       |      ✓       |      ✓       |
+| Questions (HITL)   |   ✓    |       |      ✓       |              |              |
+| Permissions (HITL) |   ✓    |   ✓   |      ✓       |      -       |              |
+| Images             |   -    |   ✓   |      ✓       |      -       |      ✓       |
+| File Attachments   |   -    |   ✓   |      ✓       |      -       |              |
+| Session Lifecycle  |   -    |   ✓   |      ✓       |      -       |              |
+| Error Events       |   -    |   ✓   |      ✓       |      ✓       |      ✓       |
+| Reasoning/Thinking |   -    |   ✓   |      -       |      -       |      ✓       |
+| Command Execution  |   -    |   ✓   |      -       |      -       |              |
+| File Changes       |   -    |   ✓   |      -       |      -       |              |
+| MCP Tools          |   ✓    |   ✓   |      ✓       |      ✓       |              |
+| Streaming Deltas   |   ✓    |   ✓   |      ✓       |      -       |      ✓       |
+| Variants           |        |   ✓   |      ✓       |      ✓       |      ✓       |
+
+Agents: [Claude Code](https://docs.anthropic.com/en/docs/agents-and-tools/claude-code/overview) · [Codex](https://github.com/openai/codex) · [OpenCode](https://github.com/opencode-ai/opencode) · [Amp](https://ampcode.com) · [Pi](https://buildwithpi.ai/pi-cli)
+
+- ✓ = Appears in session events
+- \- = Agent supports natively, schema conversion coming soon
+- (blank) = Not supported by agent
+- Pi's runtime model is a router-managed, per-session RPC (`pi --mode rpc`); it does not use generic subprocess streaming.
+
+<AccordionGroup>
+  <Accordion title="Text Messages">
+    Basic message exchange between user and assistant.
+  </Accordion>
+  <Accordion title="Tool Calls & Results">
+    Visibility into tool invocations (file reads, command execution, etc.) and their results. When not natively supported, tool activity is embedded in message content.
+  </Accordion>
+  <Accordion title="Questions (HITL)">
+    Interactive questions the agent asks the user. Emits `question.requested` and `question.resolved` events.
+  </Accordion>
+  <Accordion title="Permissions (HITL)">
+    Permission requests for sensitive operations. Emits `permission.requested` and `permission.resolved` events.
+  </Accordion>
+  <Accordion title="Images">
+    Support for image attachments in messages.
+  </Accordion>
+  <Accordion title="File Attachments">
+    Support for file attachments in messages.
+  </Accordion>
+  <Accordion title="Session Lifecycle">
+    Native `session.started` and `session.ended` events. When not supported, the daemon emits synthetic lifecycle events.
+  </Accordion>
+  <Accordion title="Error Events">
+    Structured error events for runtime failures.
+  </Accordion>
+  <Accordion title="Reasoning/Thinking">
+    Extended thinking or reasoning content with visibility controls.
+  </Accordion>
+  <Accordion title="Command Execution">
+    Detailed command execution events with stdout/stderr.
+  </Accordion>
+  <Accordion title="File Changes">
+    Structured file modification events with diffs.
+  </Accordion>
+  <Accordion title="MCP Tools">
+    Model Context Protocol tool support.
+  </Accordion>
+  <Accordion title="Streaming Deltas">
+    Native streaming of content deltas. When not supported, the daemon emits a single synthetic delta before `item.completed`.
+  </Accordion>
+  <Accordion title="Variants">
+    Model variants such as reasoning effort or depth. Agents may expose different variant sets per model.
+  </Accordion>
+</AccordionGroup>
+
+Want support for another agent? [Open an issue](https://github.com/rivet-dev/sandbox-agent/issues/new) to request it.
+
+## UniversalEvent
+
+Every event from the API is wrapped in a `UniversalEvent` envelope.
+
+| Field | Type | Description |
+|-------|------|-------------|
+| `event_id` | string | Unique identifier for this event |
+| `sequence` | integer | Monotonic sequence number within the session (starts at 1) |
+| `time` | string | RFC3339 timestamp |
+| `session_id` | string | Daemon-generated session identifier |
+| `native_session_id` | string? | Provider-native session/thread identifier (e.g., Codex `threadId`, OpenCode `sessionID`) |
+| `source` | string | Event origin: `agent` (native) or `daemon` (synthetic) |
+| `synthetic` | boolean | Whether this event was generated by the daemon to fill gaps |
+| `type` | string | Event type (see [Event Types](#event-types)) |
+| `data` | object | Event-specific payload |
+| `raw` | any? | Original provider payload (only when `include_raw=true`) |
+
+```json
+{
+  "event_id": "evt_abc123",
+  "sequence": 1,
+  "time": "2025-01-28T12:00:00Z",
+  "session_id": "my-session",
+  "native_session_id": "thread_xyz",
+  "source": "agent",
+  "synthetic": false,
+  "type": "item.completed",
+  "data": { ... }
+}
+```
+
+## Event Types
+
+### Session Lifecycle
+
+| Type | Description | Data |
+|------|-------------|------|
+| `session.started` | Session has started | `{ metadata?: any }` |
+| `session.ended` | Session has ended | `{ reason, terminated_by, message?, exit_code?, stderr? }` |
+
+### Turn Lifecycle
+
+| Type | Description | Data |
+|------|-------------|------|
+| `turn.started` | Turn has started | `{ phase: "started", turn_id?, metadata? }` |
+| `turn.ended` | Turn has ended | `{ phase: "ended", turn_id?, metadata? }` |
+
+**SessionEndedData** (payload of `session.ended`)
+
+| Field | Type | Values |
+|-------|------|--------|
+| `reason` | string | `completed`, `error`, `terminated` |
+| `terminated_by` | string | `agent`, `daemon` |
+| `message` | string? | Error message (only present when reason is `error`) |
+| `exit_code` | int? | Process exit code (only present when reason is `error`) |
+| `stderr` | StderrOutput? | Structured stderr output (only present when reason is `error`) |
+
+**StderrOutput**
+
+| Field | Type | Description |
+|-------|------|-------------|
+| `head` | string? | First 20 lines of stderr (if truncated) or full stderr (if not truncated) |
+| `tail` | string? | Last 50 lines of stderr (only present if truncated) |
+| `truncated` | boolean | Whether the output was truncated |
+| `total_lines` | int? | Total number of lines in stderr |
+
+### Item Lifecycle
+
+| Type | Description | Data |
+|------|-------------|------|
+| `item.started` | Item creation | `{ item }` |
+| `item.delta` | Streaming content delta | `{ item_id, native_item_id?, delta }` |
+| `item.completed` | Item finalized | `{ item }` |
+
+Items follow a consistent lifecycle: `item.started` → `item.delta` (0 or more) → `item.completed`.
+
+### HITL (Human-in-the-Loop)
+
+| Type | Description | Data |
+|------|-------------|------|
+| `permission.requested` | Permission request pending | `{ permission_id, action, status, metadata? }` |
+| `permission.resolved` | Permission decision recorded | `{ permission_id, action, status, metadata? }` |
+| `question.requested` | Question pending user input | `{ question_id, prompt, options, status }` |
+| `question.resolved` | Question answered or rejected | `{ question_id, prompt, options, status, response? }` |
+
+**PermissionEventData**
+
+| Field | Type | Description |
+|-------|------|-------------|
+| `permission_id` | string | Identifier for the permission request |
+| `action` | string | What the agent wants to do |
+| `status` | string | `requested`, `accept`, `accept_for_session`, `reject` |
+| `metadata` | any? | Additional context |
+
+**QuestionEventData**
+
+| Field | Type | Description |
+|-------|------|-------------|
+| `question_id` | string | Identifier for the question |
+| `prompt` | string | Question text |
+| `options` | string[] | Available answer options |
+| `status` | string | `requested`, `answered`, `rejected` |
+| `response` | string? | Selected answer (when resolved) |
+
+### Errors
+
+| Type | Description | Data |
+|------|-------------|------|
+| `error` | Runtime error | `{ message, code?, details? }` |
+| `agent.unparsed` | Parse failure | `{ error, location, raw_hash? }` |
+
+The `agent.unparsed` event indicates the daemon failed to parse an agent payload. This should be treated as a bug.
+
+## UniversalItem
+
+Items represent discrete units of content within a session.
+
+| Field | Type | Description |
+|-------|------|-------------|
+| `item_id` | string | Daemon-generated identifier |
+| `native_item_id` | string? | Provider-native item/message identifier |
+| `parent_id` | string? | Parent item ID (e.g., tool call/result parented to a message) |
+| `kind` | string | Item category (see below) |
+| `role` | string? | Actor role for message items |
+| `status` | string | Lifecycle status |
+| `content` | ContentPart[] | Ordered list of content parts |
+
+### ItemKind
+
+| Value | Description |
+|-------|-------------|
+| `message` | User or assistant message |
+| `tool_call` | Tool invocation |
+| `tool_result` | Tool execution result |
+| `system` | System message |
+| `status` | Status update |
+| `unknown` | Unrecognized item type |
+
+### ItemRole
+
+| Value | Description |
+|-------|-------------|
+| `user` | User message |
+| `assistant` | Assistant response |
+| `system` | System prompt |
+| `tool` | Tool-related message |
+
+### ItemStatus
+
+| Value | Description |
+|-------|-------------|
+| `in_progress` | Item is streaming or pending |
+| `completed` | Item is finalized |
+| `failed` | Item execution failed |
+
+## Content Parts
+
+The `content` array contains typed parts that make up an item's payload.
+
+### text
+
+Plain text content.
+
+```json
+{ "type": "text", "text": "Hello, world!" }
+```
+
+### json
+
+Structured JSON content.
+
+```json
+{ "type": "json", "json": { "key": "value" } }
+```
+
+### tool_call
+
+Tool invocation.
+
+| Field | Type | Description |
+|-------|------|-------------|
+| `name` | string | Tool name |
+| `arguments` | string | JSON-encoded arguments |
+| `call_id` | string | Unique call identifier |
+
+```json
+{
+  "type": "tool_call",
+  "name": "read_file",
+  "arguments": "{\"path\": \"/src/main.ts\"}",
+  "call_id": "call_abc123"
+}
+```
+
+### tool_result
+
+Tool execution result.
+
+| Field | Type | Description |
+|-------|------|-------------|
+| `call_id` | string | Matching call identifier |
+| `output` | string | Tool output |
+
+```json
+{
+  "type": "tool_result",
+  "call_id": "call_abc123",
+  "output": "File contents here..."
+}
+```
+
+### file_ref
+
+File reference with optional diff.
+
+| Field | Type | Description |
+|-------|------|-------------|
+| `path` | string | File path |
+| `action` | string | `read`, `write`, `patch` |
+| `diff` | string? | Unified diff (for patches) |
+
+```json
+{
+  "type": "file_ref",
+  "path": "/src/main.ts",
+  "action": "write",
+  "diff": "@@ -1,3 +1,4 @@\n+import { foo } from 'bar';"
+}
+```
+
+### image
+
+Image reference.
+
+| Field | Type | Description |
+|-------|------|-------------|
+| `path` | string | Image file path |
+| `mime` | string? | MIME type |
+
+```json
+{ "type": "image", "path": "/tmp/screenshot.png", "mime": "image/png" }
+```
+
+### reasoning
+
+Model reasoning/thinking content.
+
+| Field | Type | Description |
+|-------|------|-------------|
+| `text` | string | Reasoning text |
+| `visibility` | string | `public` or `private` |
+
+```json
+{ "type": "reasoning", "text": "Let me think about this...", "visibility": "public" }
+```
+
+### status
+
+Status indicator.
+
+| Field | Type | Description |
+|-------|------|-------------|
+| `label` | string | Status label |
+| `detail` | string? | Additional detail |
+
+```json
+{ "type": "status", "label": "Running tests", "detail": "3 of 10 passed" }
+```
+
+## Source & Synthetics
+
+### EventSource
+
+The `source` field indicates who emitted the event:
+
+| Value | Description |
+|-------|-------------|
+| `agent` | Native event from the agent |
+| `daemon` | Synthetic event generated by the daemon |
+
+### Synthetic Events
+
+The daemon emits synthetic events (`synthetic: true`, `source: "daemon"`) to provide a consistent event stream across all agents. Common synthetics:
+
+| Synthetic | When |
+|-----------|------|
+| `session.started` | Agent doesn't emit explicit session start |
+| `session.ended` | Agent doesn't emit explicit session end |
+| `turn.started` | Agent doesn't emit explicit turn start |
+| `turn.ended` | Agent doesn't emit explicit turn end |
+| `item.started` | Agent doesn't emit item start events |
+| `item.delta` | Agent doesn't stream deltas natively |
+| `question.*` | Claude Code plan mode (from ExitPlanMode tool) |
+
+### Raw Payloads
+
+Pass `include_raw=true` to event endpoints to receive the original agent payload in the `raw` field. Useful for debugging or accessing agent-specific data not in the universal schema.
+
+```typescript
+const events = await client.getEvents("my-session", { includeRaw: true });
+// events[0].raw contains the original agent payload
+```
--- a/docs/theme.css
+++ b/docs/theme.css
@ -20,6 +20,7 @@ body {
  color: var(--sa-text);
 }

+/*
 a {
  color: var(--sa-primary);
 }
@ -40,13 +41,6 @@ select {
  color: var(--sa-text);
 }

-code,
-pre {
-  background-color: var(--sa-card);
-  border: 1px solid var(--sa-border);
-  color: var(--sa-text);
-}
-
 .card,
 .mintlify-card,
 .docs-card {
@ -70,3 +64,4 @@ pre {
 .alert-danger {
  border-color: var(--sa-danger);
 }
+*/
--- a/docs/troubleshooting.mdx
+++ b/docs/troubleshooting.mdx
@ -29,6 +29,25 @@ Verify the agent is installed:
 ls -la ~/.local/share/sandbox-agent/bin/
 ```

+### 4. Binary libc mismatch (musl vs glibc)
+
+Claude Code binaries are available in both musl and glibc variants. A mismatch between the binary and the system libc produces errors like:
+
+```
+cannot execute: required file not found
+Error loading shared library libstdc++.so.6: No such file or directory
+```
+
+This means the wrong binary variant was downloaded.
+
+**For sandbox-agent 0.2.0+**: Platform detection is automatic. The correct binary (musl or glibc) is downloaded based on the runtime environment.
+
+**For sandbox-agent 0.1.x**: Use Alpine Linux, which has native musl support:
+
+```dockerfile
+FROM alpine:latest
+RUN apk add --no-cache curl ca-certificates libstdc++ libgcc bash
+```

 ## Daytona Network Restrictions

--- a/examples/boxlite-python/Dockerfile
+++ b/examples/boxlite-python/Dockerfile
@ -1,5 +1,5 @@
 FROM node:22-bookworm-slim
 RUN apt-get update && apt-get install -y curl ca-certificates && rm -rf /var/lib/apt/lists/*
-RUN curl -fsSL https://releases.rivet.dev/sandbox-agent/0.4.x/install.sh | sh
+RUN curl -fsSL https://releases.rivet.dev/sandbox-agent/0.3.x/install.sh | sh
 RUN sandbox-agent install-agent claude
 RUN sandbox-agent install-agent codex
--- a/examples/boxlite/Dockerfile
+++ b/examples/boxlite/Dockerfile
@ -1,5 +1,5 @@
 FROM node:22-bookworm-slim
 RUN apt-get update && apt-get install -y curl ca-certificates && rm -rf /var/lib/apt/lists/*
-RUN curl -fsSL https://releases.rivet.dev/sandbox-agent/0.4.x/install.sh | sh
+RUN curl -fsSL https://releases.rivet.dev/sandbox-agent/0.3.x/install.sh | sh
 RUN sandbox-agent install-agent claude
 RUN sandbox-agent install-agent codex
--- a/examples/boxlite/tsconfig.json
+++ b/examples/boxlite/tsconfig.json
@ -9,8 +9,7 @@
    "esModuleInterop": true,
    "strict": true,
    "skipLibCheck": true,
-    "resolveJsonModule": true,
-    "types": ["node"]
+    "resolveJsonModule": true
  },
  "include": ["src/**/*"],
  "exclude": ["node_modules", "**/*.test.ts"]
--- a/examples/cloudflare/Dockerfile
+++ b/examples/cloudflare/Dockerfile
@ -1,7 +1,7 @@
 FROM cloudflare/sandbox:0.7.0

 # Install sandbox-agent
-RUN curl -fsSL https://releases.rivet.dev/sandbox-agent/0.4.x/install.sh | sh
+RUN curl -fsSL https://releases.rivet.dev/sandbox-agent/0.3.x/install.sh | sh

 # Pre-install agents
 RUN sandbox-agent install-agent claude && \
--- a/examples/computesdk/tsconfig.json
+++ b/examples/computesdk/tsconfig.json
@ -9,8 +9,7 @@
    "esModuleInterop": true,
    "strict": true,
    "skipLibCheck": true,
-    "resolveJsonModule": true,
-    "types": ["node"]
+    "resolveJsonModule": true
  },
  "include": ["src/**/*"],
  "exclude": ["node_modules", "**/*.test.ts"]
--- a/examples/daytona/src/index.ts
+++ b/examples/daytona/src/index.ts
@ -16,6 +16,7 @@ console.log(`UI: ${client.inspectorUrl}`);

 const session = await client.createSession({
  agent: detectAgent(),
+  cwd: "/home/daytona",
 });

 session.onEvent((event) => {
--- a/examples/daytona/tsconfig.json
+++ b/examples/daytona/tsconfig.json
@ -9,8 +9,7 @@
    "esModuleInterop": true,
    "strict": true,
    "skipLibCheck": true,
-    "resolveJsonModule": true,
-    "types": ["node"]
+    "resolveJsonModule": true
  },
  "include": ["src/**/*"],
  "exclude": ["node_modules", "**/*.test.ts"]
--- a/examples/docker/tsconfig.json
+++ b/examples/docker/tsconfig.json
@ -9,8 +9,7 @@
    "esModuleInterop": true,
    "strict": true,
    "skipLibCheck": true,
-    "resolveJsonModule": true,
-    "types": ["node"]
+    "resolveJsonModule": true
  },
  "include": ["src/**/*"],
  "exclude": ["node_modules", "**/*.test.ts"]
--- a/examples/e2b/src/e2b.ts
+++ b/examples/e2b/src/e2b.ts
@ -17,10 +17,8 @@ export async function setupE2BSandboxAgent(): Promise<{
  token?: string;
  cleanup: () => Promise<void>;
 }> {
-  const template = process.env.E2B_TEMPLATE;
  const client = await SandboxAgent.start({
    sandbox: e2b({
-      template,
      create: { envs: collectEnvVars() },
    }),
  });
--- a/examples/e2b/src/index.ts
+++ b/examples/e2b/src/index.ts
@ -5,15 +5,15 @@ import { detectAgent } from "@sandbox-agent/example-shared";
 const envs: Record<string, string> = {};
 if (process.env.ANTHROPIC_API_KEY) envs.ANTHROPIC_API_KEY = process.env.ANTHROPIC_API_KEY;
 if (process.env.OPENAI_API_KEY) envs.OPENAI_API_KEY = process.env.OPENAI_API_KEY;
-const template = process.env.E2B_TEMPLATE;

 const client = await SandboxAgent.start({
  // ✨ NEW ✨
-  sandbox: e2b({ template, create: { envs } }),
+  sandbox: e2b({ create: { envs } }),
 });

 const session = await client.createSession({
  agent: detectAgent(),
+  cwd: "/home/user",
 });

 session.onEvent((event) => {
--- a/examples/e2b/tsconfig.json
+++ b/examples/e2b/tsconfig.json
@ -9,8 +9,7 @@
    "esModuleInterop": true,
    "strict": true,
    "skipLibCheck": true,
-    "resolveJsonModule": true,
-    "types": ["node"]
+    "resolveJsonModule": true
  },
  "include": ["src/**/*"],
  "exclude": ["node_modules", "**/*.test.ts"]
--- a/examples/file-system/tsconfig.json
+++ b/examples/file-system/tsconfig.json
@ -9,8 +9,7 @@
    "esModuleInterop": true,
    "strict": true,
    "skipLibCheck": true,
-    "resolveJsonModule": true,
-    "types": ["node"]
+    "resolveJsonModule": true
  },
  "include": ["src/**/*"],
  "exclude": ["node_modules", "**/*.test.ts"]
--- a/examples/mcp-custom-tool/tsconfig.json
+++ b/examples/mcp-custom-tool/tsconfig.json
@ -9,8 +9,7 @@
    "esModuleInterop": true,
    "strict": true,
    "skipLibCheck": true,
-    "resolveJsonModule": true,
-    "types": ["node"]
+    "resolveJsonModule": true
  },
  "include": ["src/**/*"],
  "exclude": ["node_modules", "**/*.test.ts"]
--- a/examples/mcp/tsconfig.json
+++ b/examples/mcp/tsconfig.json
@ -9,8 +9,7 @@
    "esModuleInterop": true,
    "strict": true,
    "skipLibCheck": true,
-    "resolveJsonModule": true,
-    "types": ["node"]
+    "resolveJsonModule": true
  },
  "include": ["src/**/*"],
  "exclude": ["node_modules", "**/*.test.ts"]
--- a/examples/modal/tsconfig.json
+++ b/examples/modal/tsconfig.json
@ -9,8 +9,7 @@
    "esModuleInterop": true,
    "strict": true,
    "skipLibCheck": true,
-    "resolveJsonModule": true,
-    "types": ["node"]
+    "resolveJsonModule": true
  },
  "include": ["src/**/*"],
  "exclude": ["node_modules", "**/*.test.ts"]
--- a/examples/permissions/tsconfig.json
+++ b/examples/permissions/tsconfig.json
@ -1,8 +1,7 @@
 {
  "compilerOptions": {
    "target": "ES2022",
-    "lib": ["ES2022", "DOM"],
-    "types": ["node"],
+    "lib": ["ES2022"],
    "module": "ESNext",
    "moduleResolution": "Bundler",
    "allowImportingTsExtensions": true,
--- a/examples/persist-memory/tsconfig.json
+++ b/examples/persist-memory/tsconfig.json
@ -1,15 +1,13 @@
 {
  "compilerOptions": {
    "target": "ES2022",
-    "lib": ["ES2022", "DOM"],
    "module": "ESNext",
    "moduleResolution": "Bundler",
    "allowImportingTsExtensions": true,
    "noEmit": true,
    "esModuleInterop": true,
    "strict": true,
-    "skipLibCheck": true,
-    "types": ["node"]
+    "skipLibCheck": true
  },
  "include": ["src"]
 }
--- a/examples/persist-postgres/tsconfig.json
+++ b/examples/persist-postgres/tsconfig.json
@ -1,15 +1,13 @@
 {
  "compilerOptions": {
    "target": "ES2022",
-    "lib": ["ES2022", "DOM"],
    "module": "ESNext",
    "moduleResolution": "Bundler",
    "allowImportingTsExtensions": true,
    "noEmit": true,
    "esModuleInterop": true,
    "strict": true,
-    "skipLibCheck": true,
-    "types": ["node"]
+    "skipLibCheck": true
  },
  "include": ["src"]
 }
--- a/examples/persist-sqlite/tsconfig.json
+++ b/examples/persist-sqlite/tsconfig.json
@ -1,15 +1,13 @@
 {
  "compilerOptions": {
    "target": "ES2022",
-    "lib": ["ES2022", "DOM"],
    "module": "ESNext",
    "moduleResolution": "Bundler",
    "allowImportingTsExtensions": true,
    "noEmit": true,
    "esModuleInterop": true,
    "strict": true,
-    "skipLibCheck": true,
-    "types": ["node"]
+    "skipLibCheck": true
  },
  "include": ["src"]
 }
--- a/examples/shared/src/docker.ts
+++ b/examples/shared/src/docker.ts
@ -9,7 +9,7 @@ const __dirname = path.dirname(fileURLToPath(import.meta.url));
 const REPO_ROOT = path.resolve(__dirname, "..", "..", "..");

 /** Pre-built Docker image with all agents installed. */
-export const FULL_IMAGE = "rivetdev/sandbox-agent:0.4.2-full";
+export const FULL_IMAGE = "rivetdev/sandbox-agent:0.5.0-rc.1-full";

 export interface DockerSandboxOptions {
  /** Container port used by sandbox-agent inside Docker. */
--- a/examples/skills-custom-tool/tsconfig.json
+++ b/examples/skills-custom-tool/tsconfig.json
@ -9,8 +9,7 @@
    "esModuleInterop": true,
    "strict": true,
    "skipLibCheck": true,
-    "resolveJsonModule": true,
-    "types": ["node"]
+    "resolveJsonModule": true
  },
  "include": ["src/**/*"],
  "exclude": ["node_modules", "**/*.test.ts"]
--- a/examples/skills/tsconfig.json
+++ b/examples/skills/tsconfig.json
@ -9,8 +9,7 @@
    "esModuleInterop": true,
    "strict": true,
    "skipLibCheck": true,
-    "resolveJsonModule": true,
-    "types": ["node"]
+    "resolveJsonModule": true
  },
  "include": ["src/**/*"],
  "exclude": ["node_modules", "**/*.test.ts"]
--- a/examples/sprites/package.json
+++ b/examples/sprites/package.json
@ -1,20 +0,0 @@
-{
-  "name": "@sandbox-agent/example-sprites",
-  "private": true,
-  "type": "module",
-  "scripts": {
-    "start": "tsx src/index.ts",
-    "typecheck": "tsc --noEmit"
-  },
-  "dependencies": {
-    "@fly/sprites": "latest",
-    "@sandbox-agent/example-shared": "workspace:*",
-    "sandbox-agent": "workspace:*"
-  },
-  "devDependencies": {
-    "@types/node": "latest",
-    "tsx": "latest",
-    "typescript": "latest",
-    "vitest": "^3.0.0"
-  }
-}
--- a/examples/sprites/src/index.ts
+++ b/examples/sprites/src/index.ts
@ -1,21 +0,0 @@
-import { SandboxAgent } from "sandbox-agent";
-import { sprites } from "sandbox-agent/sprites";
-
-const env: Record<string, string> = {};
-if (process.env.ANTHROPIC_API_KEY) env.ANTHROPIC_API_KEY = process.env.ANTHROPIC_API_KEY;
-if (process.env.OPENAI_API_KEY) env.OPENAI_API_KEY = process.env.OPENAI_API_KEY;
-
-const client = await SandboxAgent.start({
-  sandbox: sprites({
-    token: process.env.SPRITES_API_KEY ?? process.env.SPRITE_TOKEN ?? process.env.SPRITES_TOKEN,
-    env,
-  }),
-});
-
-console.log(`UI: ${client.inspectorUrl}`);
-console.log(await client.getHealth());
-
-process.once("SIGINT", async () => {
-  await client.destroySandbox();
-  process.exit(0);
-});
--- a/examples/sprites/tests/sprites.test.ts
+++ b/examples/sprites/tests/sprites.test.ts
@ -1,34 +0,0 @@
-import { describe, it, expect } from "vitest";
-import { SandboxAgent } from "sandbox-agent";
-import { sprites } from "sandbox-agent/sprites";
-
-const shouldRun = Boolean(process.env.SPRITES_API_KEY || process.env.SPRITE_TOKEN || process.env.SPRITES_TOKEN);
-const timeoutMs = Number.parseInt(process.env.SANDBOX_TEST_TIMEOUT_MS || "", 10) || 300_000;
-
-const testFn = shouldRun ? it : it.skip;
-
-describe("sprites provider", () => {
-  testFn(
-    "starts sandbox-agent and responds to /v1/health",
-    async () => {
-      const env: Record<string, string> = {};
-      if (process.env.ANTHROPIC_API_KEY) env.ANTHROPIC_API_KEY = process.env.ANTHROPIC_API_KEY;
-      if (process.env.OPENAI_API_KEY) env.OPENAI_API_KEY = process.env.OPENAI_API_KEY;
-
-      const sdk = await SandboxAgent.start({
-        sandbox: sprites({
-          token: process.env.SPRITES_API_KEY ?? process.env.SPRITE_TOKEN ?? process.env.SPRITES_TOKEN,
-          env,
-        }),
-      });
-
-      try {
-        const health = await sdk.getHealth();
-        expect(health.status).toBe("ok");
-      } finally {
-        await sdk.destroySandbox();
-      }
-    },
-    timeoutMs,
-  );
-});
--- a/examples/sprites/tsconfig.json
+++ b/examples/sprites/tsconfig.json
@ -1,17 +0,0 @@
-{
-  "compilerOptions": {
-    "target": "ES2022",
-    "lib": ["ES2022", "DOM"],
-    "module": "ESNext",
-    "moduleResolution": "Bundler",
-    "allowImportingTsExtensions": true,
-    "noEmit": true,
-    "esModuleInterop": true,
-    "strict": true,
-    "skipLibCheck": true,
-    "resolveJsonModule": true,
-    "types": ["node"]
-  },
-  "include": ["src/**/*"],
-  "exclude": ["node_modules", "**/*.test.ts"]
-}
--- a/examples/vercel/src/index.ts
+++ b/examples/vercel/src/index.ts
@ -19,6 +19,7 @@ console.log(`UI: ${client.inspectorUrl}`);

 const session = await client.createSession({
  agent: detectAgent(),
+  cwd: "/home/vercel-sandbox",
 });

 session.onEvent((event) => {
--- a/examples/vercel/tsconfig.json
+++ b/examples/vercel/tsconfig.json
@ -9,8 +9,7 @@
    "esModuleInterop": true,
    "strict": true,
    "skipLibCheck": true,
-    "resolveJsonModule": true,
-    "types": ["node"]
+    "resolveJsonModule": true
  },
  "include": ["src/**/*"],
  "exclude": ["node_modules", "**/*.test.ts"]
--- a/foundry/CLAUDE.md
+++ b/foundry/CLAUDE.md
@ -72,26 +72,6 @@ Local Docker sandboxes use the `rivetdev/sandbox-agent:foundry-base-latest` imag
 - The image must be built with `--platform linux/amd64`. The Rust build is memory-intensive; Docker Desktop needs at least 8GB RAM allocated.
 - When updating the base image contents (new system packages, agent versions), rebuild and push with the publish script, then update the `foundry-base-latest` tag.

-## Production GitHub App + OAuth App
-
-Foundry uses two separate GitHub entities in production:
-
- **OAuth App** (`GITHUB_CLIENT_ID` / `GITHUB_CLIENT_SECRET`) — handles "Sign in with GitHub" via Better Auth. This is a standard OAuth App.
- **GitHub App** (`GITHUB_APP_ID` / `GITHUB_APP_CLIENT_ID` / `GITHUB_APP_CLIENT_SECRET` / `GITHUB_APP_PRIVATE_KEY`) — handles webhooks, installation tokens for repo access, and GitHub API sync (repos, PRs). Must be manually installed on each org.
-
-Key env vars and where they connect:
-
- `GITHUB_REDIRECT_URI` — OAuth callback, must point to `https://api.sandboxagent.dev/v1/auth/callback/github`
- `GITHUB_WEBHOOK_SECRET` — must match the secret configured on the GitHub App's Webhook settings page exactly. Mismatches cause silent 500s on webhook delivery (signature verification fails inside the actor, surfaced as a generic RivetKit `internal_error`).
- `BETTER_AUTH_URL` — must be the **API** URL (`https://api.sandboxagent.dev`), not the frontend URL. Better Auth uses this internally for sign-out and session management calls.
- `APP_URL` — the **frontend** URL (`https://foundry.sandboxagent.dev`).
-
-Troubleshooting:
-
- **"GitHub App not installed"** — The GitHub App must be manually installed on each org. Sign-in does not auto-install it. Go to the GitHub App settings → Install App tab. The sign-in flow can only detect existing installations, not create them.
- **Webhooks not arriving** — Check the GitHub App → Advanced tab for delivery history. If deliveries show 500, the webhook secret likely doesn't match `GITHUB_WEBHOOK_SECRET`. Test with: `echo -n '{"test":true}' | openssl dgst -sha256 -hmac "$SECRET"` and curl the endpoint with the computed signature.
- **Deleting all actors wipes GitHub App installation state.** After a full actor reset, you must trigger a webhook (e.g. redeliver from GitHub App Advanced tab, or re-install the app) to repopulate installation records.
-
 ## Railway Logs

 - Production Foundry Railway logs can be read from a linked checkout with `railway logs --deployment --lines 200` or `railway logs <deployment-id> --deployment --lines 200`.
--- a/foundry/docker/backend.Dockerfile
+++ b/foundry/docker/backend.Dockerfile
@ -19,7 +19,6 @@ RUN pnpm --filter @sandbox-agent/foundry-backend deploy --prod /out
 FROM oven/bun:1.2 AS runtime
 ENV NODE_ENV=production
 ENV HOME=/home/task
-ENV RIVET_RUNNER_VERSION_FILE=/etc/foundry/rivet-runner-version
 WORKDIR /app
 RUN apt-get update \
  && apt-get install -y --no-install-recommends \
@ -32,8 +31,6 @@ RUN addgroup --system --gid 1001 task \
  && adduser --system --uid 1001 --home /home/task --ingroup task task \
  && mkdir -p /home/task \
  && chown -R task:task /home/task /app
-RUN mkdir -p /etc/foundry \
-  && date +%s > /etc/foundry/rivet-runner-version
 COPY --from=build /out ./
 USER task
 EXPOSE 7741
--- a/foundry/docker/backend.dev.Dockerfile
+++ b/foundry/docker/backend.dev.Dockerfile
@ -21,9 +21,6 @@ RUN curl -fsSL "https://releases.rivet.dev/sandbox-agent/${SANDBOX_AGENT_VERSION

 ENV PATH="/root/.local/bin:${PATH}"
 ENV SANDBOX_AGENT_BIN="/root/.local/bin/sandbox-agent"
-ENV RIVET_RUNNER_VERSION_FILE=/etc/foundry/rivet-runner-version
-RUN mkdir -p /etc/foundry \
-  && date +%s > /etc/foundry/rivet-runner-version

 WORKDIR /app

--- a/foundry/docker/backend.preview.Dockerfile
+++ b/foundry/docker/backend.preview.Dockerfile
@ -20,9 +20,6 @@ RUN curl -fsSL "https://releases.rivet.dev/sandbox-agent/${SANDBOX_AGENT_VERSION

 ENV PATH="/root/.local/bin:${PATH}"
 ENV SANDBOX_AGENT_BIN="/root/.local/bin/sandbox-agent"
-ENV RIVET_RUNNER_VERSION_FILE=/etc/foundry/rivet-runner-version
-RUN mkdir -p /etc/foundry \
-  && date +%s > /etc/foundry/rivet-runner-version

 WORKDIR /workspace/quebec

--- a/foundry/packages/backend/src/actors/index.ts
+++ b/foundry/packages/backend/src/actors/index.ts
@ -6,15 +6,16 @@ import { auditLog } from "./audit-log/index.js";
 import { taskSandbox } from "./sandbox/index.js";
 import { organization } from "./organization/index.js";
 import { logger } from "../logging.js";
-import { resolveRunnerVersion } from "../config/runner-version.js";

-const runnerVersion = resolveRunnerVersion();
+const RUNNER_VERSION = Math.floor(Date.now() / 1000);

 export const registry = setup({
  serverless: {
    basePath: "/v1/rivet",
  },
-  runner: { version: runnerVersion },
+  runner: {
+    version: RUNNER_VERSION,
+  },
  logging: {
    baseLogger: logger,
  },
--- a/foundry/packages/backend/src/actors/logging.ts
+++ b/foundry/packages/backend/src/actors/logging.ts
@ -22,16 +22,6 @@ export function resolveErrorStack(error: unknown): string | undefined {
  return undefined;
 }

-export function logActorInfo(scope: string, message: string, context?: Record<string, unknown>): void {
-  logger.info(
-    {
-      scope,
-      ...(context ?? {}),
-    },
-    message,
-  );
-}
-
 export function logActorWarning(scope: string, message: string, context?: Record<string, unknown>): void {
  logger.warn(
    {
--- a/foundry/packages/backend/src/actors/sandbox/index.ts
+++ b/foundry/packages/backend/src/actors/sandbox/index.ts
@ -13,12 +13,7 @@ import { logActorWarning, resolveErrorMessage } from "../logging.js";
 import { expectQueueResponse } from "../../services/queue.js";
 import { resolveSandboxProviderId } from "../../sandbox-config.js";

-/**
- * Default repo CWD inside the sandbox. The actual path is resolved dynamically
- * via `$HOME/repo` because different sandbox providers run as different users
- * (e.g. E2B uses `/home/user`, local Docker uses `/home/sandbox`).
- */
-const DEFAULT_SANDBOX_REPO_CWD = "/home/user/repo";
+const SANDBOX_REPO_CWD = "/home/sandbox/repo";
 const DEFAULT_LOCAL_SANDBOX_IMAGE = "rivetdev/sandbox-agent:foundry-base-latest";
 const DEFAULT_LOCAL_SANDBOX_PORT = 2468;
 const dockerClient = new Dockerode({ socketPath: "/var/run/docker.sock" });
@ -212,7 +207,7 @@ const baseTaskSandbox = sandboxActor({
    if (sandboxProviderId === "e2b") {
      return e2b({
        create: () => ({
-          template: config.sandboxProviders.e2b.template ?? "sandbox-agent-full-0.5.x",
+          template: config.sandboxProviders.e2b.template ?? "sandbox-agent-full-0.3.x",
          envs: sandboxEnvObject(),
          // TEMPORARY: Default E2B timeout is 5 minutes which is too short.
          // Set to 1 hour as a stopgap. Remove this once the E2B provider in
@ -269,7 +264,7 @@ async function providerForConnection(c: any): Promise<any | null> {
    sandboxProviderId === "e2b"
      ? e2b({
          create: () => ({
-            template: config.sandboxProviders.e2b.template ?? "sandbox-agent-full-0.5.x",
+            template: config.sandboxProviders.e2b.template ?? "sandbox-agent-full-0.3.x",
            envs: sandboxEnvObject(),
          }),
          installAgents: ["claude", "codex"],
@ -302,43 +297,6 @@ async function listWorkspaceModelGroupsForSandbox(c: any): Promise<WorkspaceMode

 const baseActions = baseTaskSandbox.config.actions as Record<string, (c: any, ...args: any[]) => Promise<any>>;

-// ---------------------------------------------------------------------------
-// Dynamic repo CWD resolution
-// ---------------------------------------------------------------------------
-
-let cachedRepoCwd: string | null = null;
-
-/**
- * Resolve the repo CWD inside the sandbox by querying `$HOME`.
- * Different providers run as different users (E2B: `/home/user`, local Docker:
- * `/home/sandbox`), so the path must be resolved dynamically. The result is
- * cached for the lifetime of this sandbox actor instance.
- */
-async function resolveRepoCwd(c: any): Promise<string> {
-  if (cachedRepoCwd) return cachedRepoCwd;
-
-  try {
-    const result = await baseActions.runProcess(c, {
-      command: "bash",
-      args: ["-lc", "echo $HOME"],
-      cwd: "/",
-      timeoutMs: 10_000,
-    });
-    const home = (result.stdout ?? result.result ?? "").trim();
-    if (home && home.startsWith("/")) {
-      cachedRepoCwd = `${home}/repo`;
-      return cachedRepoCwd;
-    }
-  } catch (error) {
-    logActorWarning("taskSandbox", "failed to resolve $HOME, using default", {
-      error: resolveErrorMessage(error),
-    });
-  }
-
-  cachedRepoCwd = DEFAULT_SANDBOX_REPO_CWD;
-  return cachedRepoCwd;
-}
-
 // ---------------------------------------------------------------------------
 // Queue names for sandbox actor
 // ---------------------------------------------------------------------------
@ -570,9 +528,8 @@ export const taskSandbox = actor({
      }
    },

-    async repoCwd(c: any): Promise<{ cwd: string }> {
-      const resolved = await resolveRepoCwd(c);
-      return { cwd: resolved };
+    async repoCwd(): Promise<{ cwd: string }> {
+      return { cwd: SANDBOX_REPO_CWD };
    },

    // Long-running action — kept as direct action to avoid blocking the
@ -643,4 +600,4 @@ export const taskSandbox = actor({
  run: workflow(runSandboxWorkflow),
 });

-export { DEFAULT_SANDBOX_REPO_CWD, resolveRepoCwd };
+export { SANDBOX_REPO_CWD };
--- a/foundry/packages/backend/src/actors/task/workspace.ts
+++ b/foundry/packages/backend/src/actors/task/workspace.ts
@ -1,6 +1,6 @@
 // @ts-nocheck
 import { randomUUID } from "node:crypto";
-import { basename } from "node:path";
+import { basename, dirname } from "node:path";
 import { asc, eq } from "drizzle-orm";
 import {
  DEFAULT_WORKSPACE_MODEL_GROUPS,
@ -10,7 +10,8 @@ import {
 } from "@sandbox-agent/foundry-shared";
 import { getActorRuntimeContext } from "../context.js";
 import { getOrCreateOrganization, getOrCreateTaskSandbox, getOrCreateUser, getTaskSandbox, selfTask } from "../handles.js";
-import { logActorInfo, logActorWarning, resolveErrorMessage } from "../logging.js";
+import { logActorWarning, resolveErrorMessage } from "../logging.js";
+import { SANDBOX_REPO_CWD } from "../sandbox/index.js";
 import { resolveSandboxProviderId } from "../../sandbox-config.js";
 import { getBetterAuthService } from "../../services/better-auth.js";
 import { resolveOrganizationGithubAuth } from "../../services/github-auth.js";
@ -182,9 +183,9 @@ async function injectGitCredentials(sandbox: any, login: string, email: string,
    "set -euo pipefail",
    `git config --global user.name ${JSON.stringify(login)}`,
    `git config --global user.email ${JSON.stringify(email)}`,
-    `git config --global credential.helper 'store --file=$HOME/.git-token'`,
-    `printf '%s\\n' ${JSON.stringify(`https://${login}:${token}@github.com`)} > $HOME/.git-token`,
-    `chmod 600 $HOME/.git-token`,
+    `git config --global credential.helper 'store --file=/home/sandbox/.git-token'`,
+    `printf '%s\\n' ${JSON.stringify(`https://${login}:${token}@github.com`)} > /home/sandbox/.git-token`,
+    `chmod 600 /home/sandbox/.git-token`,
  ];
  const result = await sandbox.runProcess({
    command: "bash",
@ -575,10 +576,6 @@ async function getTaskSandboxRuntime(
  const sandbox = await getOrCreateTaskSandbox(c, c.state.organizationId, sandboxId, {});
  const actorId = typeof sandbox.resolve === "function" ? await sandbox.resolve().catch(() => null) : null;
  const switchTarget = sandboxProviderId === "local" ? `sandbox://local/${sandboxId}` : `sandbox://e2b/${sandboxId}`;
-
-  // Resolve the actual repo CWD from the sandbox's $HOME (differs by provider).
-  const repoCwdResult = await sandbox.repoCwd();
-  const cwd = repoCwdResult?.cwd ?? "$HOME/repo";
  const now = Date.now();

  await c.db
@ -588,7 +585,7 @@ async function getTaskSandboxRuntime(
      sandboxProviderId,
      sandboxActorId: typeof actorId === "string" ? actorId : null,
      switchTarget,
-      cwd,
+      cwd: SANDBOX_REPO_CWD,
      createdAt: now,
      updatedAt: now,
    })
@ -598,7 +595,7 @@ async function getTaskSandboxRuntime(
        sandboxProviderId,
        sandboxActorId: typeof actorId === "string" ? actorId : null,
        switchTarget,
-        cwd,
+        cwd: SANDBOX_REPO_CWD,
        updatedAt: now,
      },
    })
@ -609,7 +606,7 @@ async function getTaskSandboxRuntime(
    .set({
      activeSandboxId: sandboxId,
      activeSwitchTarget: switchTarget,
-      activeCwd: cwd,
+      activeCwd: SANDBOX_REPO_CWD,
      updatedAt: now,
    })
    .where(eq(taskRuntime.id, 1))
@ -620,7 +617,7 @@ async function getTaskSandboxRuntime(
    sandboxId,
    sandboxProviderId,
    switchTarget,
-    cwd,
+    cwd: SANDBOX_REPO_CWD,
  };
 }

@ -639,35 +636,27 @@ async function ensureSandboxRepo(c: any, sandbox: any, record: any, opts?: { ski
  // If the repo was already prepared and the caller allows skipping fetch, just return.
  // The clone, fetch, and checkout already happened on a prior call.
  if (opts?.skipFetchIfPrepared && sandboxRepoPrepared) {
-    logActorInfo("task.sandbox", "ensureSandboxRepo skipped (already prepared)");
    return;
  }

-  const repoStart = performance.now();
-
-  const t0 = performance.now();
  const auth = await resolveOrganizationGithubAuth(c, c.state.organizationId);
  const metadata = await getRepositoryMetadata(c);
-  logActorInfo("task.sandbox", "resolveAuth+metadata", { durationMs: Math.round(performance.now() - t0) });
-
  const baseRef = metadata.defaultBranch ?? "main";
-  // Use $HOME inside the shell script so the path resolves correctly regardless
-  // of which user the sandbox runs as (E2B: "user", local Docker: "sandbox").
+  const sandboxRepoRoot = dirname(SANDBOX_REPO_CWD);
  const script = [
    "set -euo pipefail",
-    'REPO_DIR="$HOME/repo"',
-    'mkdir -p "$HOME"',
+    `mkdir -p ${JSON.stringify(sandboxRepoRoot)}`,
    "git config --global credential.helper '!f() { echo username=x-access-token; echo password=${GH_TOKEN:-$GITHUB_TOKEN}; }; f'",
-    `if [ ! -d "$REPO_DIR/.git" ]; then rm -rf "$REPO_DIR" && git clone ${JSON.stringify(metadata.remoteUrl)} "$REPO_DIR"; fi`,
-    'cd "$REPO_DIR"',
+    `if [ ! -d ${JSON.stringify(`${SANDBOX_REPO_CWD}/.git`)} ]; then rm -rf ${JSON.stringify(SANDBOX_REPO_CWD)} && git clone ${JSON.stringify(
+      metadata.remoteUrl,
+    )} ${JSON.stringify(SANDBOX_REPO_CWD)}; fi`,
+    `cd ${JSON.stringify(SANDBOX_REPO_CWD)}`,
    "git fetch origin --prune",
    `if git show-ref --verify --quiet refs/remotes/origin/${JSON.stringify(record.branchName).slice(1, -1)}; then target_ref=${JSON.stringify(
      `origin/${record.branchName}`,
    )}; else target_ref=${JSON.stringify(baseRef)}; fi`,
    `git checkout -B ${JSON.stringify(record.branchName)} \"$target_ref\"`,
  ];
-
-  const t1 = performance.now();
  const result = await sandbox.runProcess({
    command: "bash",
    args: ["-lc", script.join("; ")],
@ -680,11 +669,6 @@ async function ensureSandboxRepo(c: any, sandbox: any, record: any, opts?: { ski
      : undefined,
    timeoutMs: 5 * 60_000,
  });
-  logActorInfo("task.sandbox", "git clone/fetch/checkout", {
-    branch: record.branchName,
-    repo: metadata.remoteUrl,
-    durationMs: Math.round(performance.now() - t1),
-  });

  if ((result.exitCode ?? 0) !== 0) {
    throw new Error(`sandbox repo preparation failed (${result.exitCode ?? 1}): ${[result.stdout, result.stderr].filter(Boolean).join("")}`);
@ -693,13 +677,10 @@ async function ensureSandboxRepo(c: any, sandbox: any, record: any, opts?: { ski
  // On first repo preparation, inject the task owner's git credentials into the sandbox
  // so that push/commit operations are authenticated and attributed to the correct user.
  if (!sandboxRepoPrepared && opts?.authSessionId) {
-    const t2 = performance.now();
    await maybeSwapTaskOwner(c, opts.authSessionId, sandbox);
-    logActorInfo("task.sandbox", "maybeSwapTaskOwner", { durationMs: Math.round(performance.now() - t2) });
  }

  sandboxRepoPrepared = true;
-  logActorInfo("task.sandbox", "ensureSandboxRepo complete", { totalDurationMs: Math.round(performance.now() - repoStart) });
 }

 async function executeInSandbox(
@ -1283,7 +1264,6 @@ export async function createWorkspaceSession(c: any, model?: string, authSession
 }

 export async function ensureWorkspaceSession(c: any, sessionId: string, model?: string, authSessionId?: string): Promise<void> {
-  const ensureStart = performance.now();
  const meta = await readSessionMeta(c, sessionId);
  if (!meta || meta.closed) {
    return;
@ -1303,18 +1283,10 @@ export async function ensureWorkspaceSession(c: any, sessionId: string, model?:
  });

  try {
-    const t0 = performance.now();
    const runtime = await getTaskSandboxRuntime(c, record);
-    logActorInfo("task.session", "getTaskSandboxRuntime", { sessionId, durationMs: Math.round(performance.now() - t0) });
-
-    const t1 = performance.now();
    await ensureSandboxRepo(c, runtime.sandbox, record);
-    logActorInfo("task.session", "ensureSandboxRepo", { sessionId, durationMs: Math.round(performance.now() - t1) });
-
    const resolvedModel = model ?? meta.model ?? (await resolveDefaultModel(c, authSessionId));
    const resolvedAgent = await resolveSandboxAgentForModel(c, resolvedModel);
-
-    const t2 = performance.now();
    await runtime.sandbox.createSession({
      id: meta.sandboxSessionId ?? sessionId,
      agent: resolvedAgent,
@ -1323,14 +1295,12 @@ export async function ensureWorkspaceSession(c: any, sessionId: string, model?:
        cwd: runtime.cwd,
      },
    });
-    logActorInfo("task.session", "createSession", { sessionId, agent: resolvedAgent, model: resolvedModel, durationMs: Math.round(performance.now() - t2) });

    await updateSessionMeta(c, sessionId, {
      sandboxSessionId: meta.sandboxSessionId ?? sessionId,
      status: "ready",
      errorMessage: null,
    });
-    logActorInfo("task.session", "ensureWorkspaceSession complete", { sessionId, totalDurationMs: Math.round(performance.now() - ensureStart) });
    fireRefreshSessionTranscript(c, meta.sandboxSessionId ?? sessionId);
  } catch (error) {
    await updateSessionMeta(c, sessionId, {
@ -1445,19 +1415,12 @@ export async function changeWorkspaceModel(c: any, sessionId: string, model: str
 }

 export async function sendWorkspaceMessage(c: any, sessionId: string, text: string, attachments: Array<any>, authSessionId?: string): Promise<void> {
-  const sendStart = performance.now();
  const meta = requireSendableSessionMeta(await readSessionMeta(c, sessionId), sessionId);
  const record = await ensureWorkspaceSeeded(c);
-
-  const t0 = performance.now();
  const runtime = await getTaskSandboxRuntime(c, record);
-  logActorInfo("task.message", "getTaskSandboxRuntime", { sessionId, durationMs: Math.round(performance.now() - t0) });
-
-  const t1 = performance.now();
  // Skip git fetch on subsequent messages — the repo was already prepared during session
  // creation. This avoids a 5-30s network round-trip to GitHub on every prompt.
  await ensureSandboxRepo(c, runtime.sandbox, record, { skipFetchIfPrepared: true, authSessionId });
-  logActorInfo("task.message", "ensureSandboxRepo", { sessionId, durationMs: Math.round(performance.now() - t1) });

  // Check if the task owner needs to swap. If a different user is sending this message,
  // update the owner record and inject their git credentials into the sandbox.
@ -1487,12 +1450,10 @@ export async function sendWorkspaceMessage(c: any, sessionId: string, text: stri
  await syncWorkspaceSessionStatus(c, meta.sandboxSessionId, "running", Date.now());

  try {
-    const t2 = performance.now();
    await runtime.sandbox.sendPrompt({
      sessionId: meta.sandboxSessionId,
      prompt: prompt.join("\n\n"),
    });
-    logActorInfo("task.message", "sendPrompt", { sessionId, durationMs: Math.round(performance.now() - t2) });
    await syncWorkspaceSessionStatus(c, meta.sandboxSessionId, "idle", Date.now());
  } catch (error) {
    await updateSessionMeta(c, sessionId, {
@ -1502,7 +1463,6 @@ export async function sendWorkspaceMessage(c: any, sessionId: string, text: stri
    await syncWorkspaceSessionStatus(c, meta.sandboxSessionId, "error", Date.now());
    throw error;
  }
-  logActorInfo("task.message", "sendWorkspaceMessage complete", { sessionId, totalDurationMs: Math.round(performance.now() - sendStart) });
 }

 export async function stopWorkspaceSession(c: any, sessionId: string): Promise<void> {
--- a/foundry/packages/backend/src/config/runner-version.ts
+++ b/foundry/packages/backend/src/config/runner-version.ts
@ -1,33 +0,0 @@
-import { readFileSync } from "node:fs";
-
-function parseRunnerVersion(rawValue: string | undefined): number | undefined {
-  const value = rawValue?.trim();
-  if (!value) {
-    return undefined;
-  }
-
-  const parsed = Number.parseInt(value, 10);
-  if (Number.isNaN(parsed)) {
-    return undefined;
-  }
-
-  return parsed;
-}
-
-export function resolveRunnerVersion(): number | undefined {
-  const envVersion = parseRunnerVersion(process.env.RIVET_RUNNER_VERSION);
-  if (envVersion !== undefined) {
-    return envVersion;
-  }
-
-  const versionFilePath = process.env.RIVET_RUNNER_VERSION_FILE;
-  if (!versionFilePath) {
-    return undefined;
-  }
-
-  try {
-    return parseRunnerVersion(readFileSync(versionFilePath, "utf8"));
-  } catch {
-    return undefined;
-  }
-}
--- a/foundry/packages/backend/src/index.ts
+++ b/foundry/packages/backend/src/index.ts
@ -141,59 +141,6 @@ export async function startBackend(options: BackendStartOptions = {}): Promise<v
  };
  app.use("/v1/*", cors(corsConfig));
  app.use("/v1", cors(corsConfig));
-
-  // On-demand memory snapshot endpoint for diagnosing spikes (dev only).
-  // Usage: curl http://127.0.0.1:7741/debug/memory
-  // Trigger GC first: curl http://127.0.0.1:7741/debug/memory?gc=1
-  // Write JSC heap snapshot: curl http://127.0.0.1:7741/debug/memory?heap=1
-  //   (writes /tmp/foundry-heap-<timestamp>.json, inspect with chrome://tracing)
-  app.get("/debug/memory", async (c) => {
-    if (process.env.NODE_ENV !== "development") {
-      return c.json({ error: "debug endpoints disabled in production" }, 403);
-    }
-    const wantGc = c.req.query("gc") === "1";
-    if (wantGc && typeof Bun !== "undefined") {
-      // Bun.gc(true) triggers a synchronous full GC sweep in JavaScriptCore.
-      Bun.gc(true);
-    }
-    const mem = process.memoryUsage();
-    const rssMb = Math.round(mem.rss / 1024 / 1024);
-    const heapUsedMb = Math.round(mem.heapUsed / 1024 / 1024);
-    const heapTotalMb = Math.round(mem.heapTotal / 1024 / 1024);
-    const externalMb = Math.round(mem.external / 1024 / 1024);
-    const nonHeapMb = rssMb - heapUsedMb - externalMb;
-    // Bun.heapStats() gives JSC-specific breakdown: object counts, typed array
-    // bytes, extra memory (native allocations tracked by JSC). Useful for
-    // distinguishing JS object bloat from native/WASM memory.
-    // eslint-disable-next-line @typescript-eslint/no-explicit-any
-    const BunAny = Bun as any;
-    const heapStats = typeof BunAny.heapStats === "function" ? BunAny.heapStats() : null;
-    const snapshot = {
-      rssMb,
-      heapUsedMb,
-      heapTotalMb,
-      externalMb,
-      nonHeapMb,
-      gcTriggered: wantGc,
-      rssBytes: mem.rss,
-      heapUsedBytes: mem.heapUsed,
-      heapTotalBytes: mem.heapTotal,
-      externalBytes: mem.external,
-      ...(heapStats ? { bunHeapStats: heapStats } : {}),
-    };
-    // Optionally write a full JSC heap snapshot for offline analysis.
-    let heapSnapshotPath: string | null = null;
-    const wantHeap = c.req.query("heap") === "1";
-    if (wantHeap && typeof Bun !== "undefined") {
-      heapSnapshotPath = `/tmp/foundry-heap-${Date.now()}.json`;
-      // Bun.generateHeapSnapshot("v8") returns a V8-compatible JSON string.
-      const heapJson = Bun.generateHeapSnapshot("v8");
-      await Bun.write(heapSnapshotPath, heapJson);
-    }
-    logger.info(snapshot, "memory_usage_debug");
-    return c.json({ ...snapshot, ...(heapSnapshotPath ? { heapSnapshotPath } : {}) });
-  });
-
  app.use("*", async (c, next) => {
    const requestId = c.req.header("x-request-id")?.trim() || randomUUID();
    const start = performance.now();
@ -407,11 +354,6 @@ export async function startBackend(options: BackendStartOptions = {}): Promise<v
    },
    hostname: config.backend.host,
    port: config.backend.port,
-    // Bun defaults to 10s idle timeout. Actor RPCs go through the gateway
-    // tunnel (not direct HTTP), and the SSE stream has a 1s ping interval
-    // (RUNNER_SSE_PING_INTERVAL in rivetkit), so the idle timeout likely
-    // never fires in practice. Set high as a safety net regardless.
-    idleTimeout: 255,
  });

  logger.info(
@ -422,42 +364,6 @@ export async function startBackend(options: BackendStartOptions = {}): Promise<v
    "backend_started",
  );

-  // Periodic memory usage reporting for diagnosing memory spikes (dev only).
-  // Logs JS heap, RSS, and external (native/WASM) separately so we can tell
-  // whether spikes come from JS objects, Bun/JSC internals, or native addons
-  // like SQLite/WASM.
-  if (process.env.NODE_ENV === "development") {
-    let prevRss = 0;
-    setInterval(() => {
-      const mem = process.memoryUsage();
-      const rssMb = Math.round(mem.rss / 1024 / 1024);
-      const heapUsedMb = Math.round(mem.heapUsed / 1024 / 1024);
-      const heapTotalMb = Math.round(mem.heapTotal / 1024 / 1024);
-      const externalMb = Math.round(mem.external / 1024 / 1024);
-      // Non-heap RSS: memory not accounted for by JS heap or external buffers.
-      // Large values here point to native allocations (WASM, mmap, child process
-      // bookkeeping, Bun's internal arena, etc.).
-      const nonHeapMb = rssMb - heapUsedMb - externalMb;
-      const deltaRss = rssMb - prevRss;
-      prevRss = rssMb;
-      logger.info(
-        {
-          rssMb,
-          heapUsedMb,
-          heapTotalMb,
-          externalMb,
-          nonHeapMb,
-          deltaRssMb: deltaRss,
-          rssBytes: mem.rss,
-          heapUsedBytes: mem.heapUsed,
-          heapTotalBytes: mem.heapTotal,
-          externalBytes: mem.external,
-        },
-        "memory_usage",
-      );
-    }, 60_000);
-  }
-
  process.on("SIGINT", async () => {
    server.stop();
    process.exit(0);
--- a/foundry/packages/client/package.json
+++ b/foundry/packages/client/package.json
@ -6,7 +6,7 @@
  "main": "dist/index.js",
  "types": "dist/index.d.ts",
  "scripts": {
-    "build": "tsup src/index.ts --format esm --dts --tsconfig tsconfig.build.json",
+    "build": "tsup src/index.ts --format esm --dts",
    "typecheck": "tsc --noEmit",
    "test": "vitest run",
    "test:e2e:full": "HF_ENABLE_DAEMON_FULL_E2E=1 vitest run test/e2e/full-integration-e2e.test.ts",
--- a/foundry/packages/client/src/subscription/remote-manager.ts
+++ b/foundry/packages/client/src/subscription/remote-manager.ts
@ -4,11 +4,6 @@ import { topicDefinitions, type TopicData, type TopicDefinition, type TopicKey,

 const GRACE_PERIOD_MS = 30_000;

-/** Initial retry delay in ms. */
-const RETRY_BASE_MS = 1_000;
-/** Maximum retry delay in ms. */
-const RETRY_MAX_MS = 30_000;
-
 /**
 * Remote implementation of SubscriptionManager.
 * Each cache entry owns one actor connection plus one materialized snapshot.
@ -85,12 +80,9 @@ class TopicEntry<TData, TParams, TEvent> {
  private unsubscribeEvent: (() => void) | null = null;
  private unsubscribeError: (() => void) | null = null;
  private teardownTimer: ReturnType<typeof setTimeout> | null = null;
-  private retryTimer: ReturnType<typeof setTimeout> | null = null;
-  private retryAttempt = 0;
  private startPromise: Promise<void> | null = null;
  private eventPromise: Promise<void> = Promise.resolve();
  private started = false;
-  private disposed = false;

  constructor(
    private readonly topicKey: TopicKey,
@ -144,9 +136,7 @@ class TopicEntry<TData, TParams, TEvent> {
  }

  dispose(): void {
-    this.disposed = true;
    this.cancelTeardown();
-    this.cancelRetry();
    this.unsubscribeEvent?.();
    this.unsubscribeError?.();
    if (this.conn) {
@ -158,55 +148,6 @@ class TopicEntry<TData, TParams, TEvent> {
    this.error = null;
    this.lastRefreshAt = null;
    this.started = false;
-    this.retryAttempt = 0;
-  }
-
-  private cancelRetry(): void {
-    if (this.retryTimer) {
-      clearTimeout(this.retryTimer);
-      this.retryTimer = null;
-    }
-  }
-
-  /**
-   * Schedules a retry with exponential backoff. Cleans up any existing
-   * connection state before reconnecting.
-   */
-  private scheduleRetry(): void {
-    if (this.disposed || this.listenerCount === 0) {
-      return;
-    }
-
-    const delay = Math.min(RETRY_BASE_MS * 2 ** this.retryAttempt, RETRY_MAX_MS);
-    this.retryAttempt++;
-
-    this.retryTimer = setTimeout(() => {
-      this.retryTimer = null;
-      if (this.disposed || this.listenerCount === 0) {
-        return;
-      }
-
-      // Tear down the old connection before retrying
-      this.cleanupConnection();
-      this.started = false;
-      this.startPromise = this.start().finally(() => {
-        this.startPromise = null;
-      });
-    }, delay);
-  }
-
-  /**
-   * Cleans up connection resources without resetting data/status/retry state.
-   */
-  private cleanupConnection(): void {
-    this.unsubscribeEvent?.();
-    this.unsubscribeError?.();
-    this.unsubscribeEvent = null;
-    this.unsubscribeError = null;
-    if (this.conn) {
-      void this.conn.dispose();
-    }
-    this.conn = null;
  }

  private async start(): Promise<void> {
@ -223,20 +164,17 @@ class TopicEntry<TData, TParams, TEvent> {
        this.status = "error";
        this.error = error instanceof Error ? error : new Error(String(error));
        this.notify();
-        this.scheduleRetry();
      });
      this.data = await this.definition.fetchInitial(this.backend, this.params);
      this.status = "connected";
      this.lastRefreshAt = Date.now();
      this.started = true;
-      this.retryAttempt = 0;
      this.notify();
    } catch (error) {
      this.status = "error";
      this.error = error instanceof Error ? error : new Error(String(error));
      this.started = false;
      this.notify();
-      this.scheduleRetry();
    }
  }

--- a/foundry/packages/client/tsconfig.build.json
+++ b/foundry/packages/client/tsconfig.build.json
@ -1,6 +0,0 @@
-{
-  "extends": "./tsconfig.json",
-  "compilerOptions": {
-    "ignoreDeprecations": "6.0"
-  }
-}
--- a/foundry/packages/frontend/src/components/mock-layout.tsx
+++ b/foundry/packages/frontend/src/components/mock-layout.tsx
@ -187,7 +187,6 @@ function toTaskModel(
    diffs: detail?.diffs ?? {},
    fileTree: detail?.fileTree ?? [],
    minutesUsed: detail?.minutesUsed ?? 0,
-    sandboxes: detail?.sandboxes ?? [],
    activeSandboxId: detail?.activeSandboxId ?? null,
    primaryUserLogin: detail?.primaryUserLogin ?? summary.primaryUserLogin ?? null,
    primaryUserAvatarUrl: detail?.primaryUserAvatarUrl ?? summary.primaryUserAvatarUrl ?? null,
--- a/foundry/packages/shared/package.json
+++ b/foundry/packages/shared/package.json
@ -6,7 +6,7 @@
  "main": "dist/index.js",
  "types": "dist/index.d.ts",
  "scripts": {
-    "build": "tsup src/index.ts --format esm --dts --tsconfig tsconfig.build.json",
+    "build": "tsup src/index.ts --format esm --dts",
    "typecheck": "tsc --noEmit",
    "test": "vitest run"
  },
--- a/foundry/packages/shared/tsconfig.build.json
+++ b/foundry/packages/shared/tsconfig.build.json
@ -1,6 +0,0 @@
-{
-  "extends": "./tsconfig.json",
-  "compilerOptions": {
-    "ignoreDeprecations": "6.0"
-  }
-}
--- a/foundry/research/friction/sandbox-agent.mdx
+++ b/foundry/research/friction/sandbox-agent.mdx
@ -55,7 +55,7 @@ Upgrading backend integration from legacy sandbox-agent session endpoints to `sa

 ### Friction / Issue

-`0.2.0` no longer exposes the legacy session REST endpoints used by the backend integration; direct session create/status polling via those paths returns `404`.
+`0.2.0` no longer exposes `/v1/sessions` endpoints used by the backend integration; direct session create/status polling via legacy REST paths returns `404`.

 ### Attempted Fix / Workaround

@ -65,5 +65,5 @@ Upgrading backend integration from legacy sandbox-agent session endpoints to `sa

 ### Outcome

- Backend no longer depends on removed legacy session REST endpoints.
+- Backend no longer depends on removed `/v1/sessions` endpoints.
 - Daytona flow is aligned with `sandbox-agent 0.2.0` runtime and SDK usage.
--- a/frontend/packages/website/src/components/GetStarted.tsx
+++ b/frontend/packages/website/src/components/GetStarted.tsx
@ -103,7 +103,7 @@ function SdkCodeHighlighted() {
  );
 }

-const sandboxCommand = `curl -fsSL https://releases.rivet.dev/sandbox-agent/0.4.x/install.sh | sh`;
+const sandboxCommand = `curl -fsSL https://releases.rivet.dev/sandbox-agent/0.3.x/install.sh | sh`;

 const sourceCommands = `git clone https://github.com/rivet-dev/sandbox-agent
 cd sandbox-agent
@ -196,7 +196,7 @@ export function GetStarted() {
                    <span className="text-zinc-300">curl -fsSL \</span>
                    {"\n"}
                    <span className="text-zinc-300">{"    "}</span>
-                    <span className="text-green-400">https://releases.rivet.dev/sandbox-agent/0.4.x/install.sh</span>
+                    <span className="text-green-400">https://releases.rivet.dev/sandbox-agent/0.3.x/install.sh</span>
                    <span className="text-zinc-300"> | </span>
                    <span className="text-blue-400">sh</span>
                  </code>
--- a/1
+++ b/1
@ -186,3 +186,4 @@ foundry-format:
 [group('foundry')]
 foundry-docker-build tag='foundry:local':
 	docker build -f foundry/docker/backend.Dockerfile -t {{tag}} .
+
--- a/pnpm-lock.yaml
+++ b/pnpm-lock.yaml
@ -450,31 +450,6 @@ importers:
        specifier: latest
        version: 5.9.3

-  examples/sprites:
-    dependencies:
-      '@fly/sprites':
-        specifier: latest
-        version: 0.0.1
-      '@sandbox-agent/example-shared':
-        specifier: workspace:*
-        version: link:../shared
-      sandbox-agent:
-        specifier: workspace:*
-        version: link:../../sdks/typescript
-    devDependencies:
-      '@types/node':
-        specifier: latest
-        version: 25.5.0
-      tsx:
-        specifier: latest
-        version: 4.21.0
-      typescript:
-        specifier: latest
-        version: 6.0.2
-      vitest:
-        specifier: ^3.0.0
-        version: 3.2.4(@types/debug@4.1.12)(@types/node@25.5.0)(jiti@1.21.7)(jsdom@26.1.0)(tsx@4.21.0)(yaml@2.8.2)
-
  examples/vercel:
    dependencies:
      '@sandbox-agent/example-shared':
@ -556,7 +531,7 @@ importers:
        version: 1.3.10
      tsup:
        specifier: ^8.5.0
-        version: 8.5.1(jiti@1.21.7)(postcss@8.5.6)(tsx@4.21.0)(typescript@6.0.2)(yaml@2.8.2)
+        version: 8.5.1(jiti@1.21.7)(postcss@8.5.6)(tsx@4.21.0)(typescript@5.9.3)(yaml@2.8.2)

  foundry/packages/client:
    dependencies:
@ -578,7 +553,7 @@ importers:
        version: 19.2.14
      tsup:
        specifier: ^8.5.0
-        version: 8.5.1(jiti@1.21.7)(postcss@8.5.6)(tsx@4.21.0)(typescript@6.0.2)(yaml@2.8.2)
+        version: 8.5.1(jiti@1.21.7)(postcss@8.5.6)(tsx@4.21.0)(typescript@5.9.3)(yaml@2.8.2)

  foundry/packages/frontend:
    dependencies:
@ -639,7 +614,7 @@ importers:
        version: 0.1.27(@types/react@19.2.14)(react@19.2.4)
      tsup:
        specifier: ^8.5.0
-        version: 8.5.1(jiti@1.21.7)(postcss@8.5.6)(tsx@4.21.0)(typescript@6.0.2)(yaml@2.8.2)
+        version: 8.5.1(jiti@1.21.7)(postcss@8.5.6)(tsx@4.21.0)(typescript@5.9.3)(yaml@2.8.2)
      vite:
        specifier: ^7.1.3
        version: 7.3.1(@types/node@25.5.0)(jiti@1.21.7)(tsx@4.21.0)(yaml@2.8.2)
@ -658,7 +633,7 @@ importers:
    devDependencies:
      tsup:
        specifier: ^8.5.0
-        version: 8.5.1(jiti@1.21.7)(postcss@8.5.6)(tsx@4.21.0)(typescript@6.0.2)(yaml@2.8.2)
+        version: 8.5.1(jiti@1.21.7)(postcss@8.5.6)(tsx@4.21.0)(typescript@5.9.3)(yaml@2.8.2)

  frontend/packages/inspector:
    dependencies:
@ -796,6 +771,25 @@ importers:
        specifier: ^5.7.0
        version: 5.9.3

+  scripts/sandbox-testing:
+    dependencies:
+      '@daytonaio/sdk':
+        specifier: latest
+        version: 0.151.0(ws@8.19.0)
+      '@e2b/code-interpreter':
+        specifier: latest
+        version: 2.3.3
+    devDependencies:
+      '@types/node':
+        specifier: latest
+        version: 25.5.0
+      tsx:
+        specifier: latest
+        version: 4.21.0
+      typescript:
+        specifier: latest
+        version: 5.9.3
+
  sdks/acp-http-client:
    dependencies:
      '@agentclientprotocol/sdk':
@ -994,9 +988,6 @@ importers:
      '@e2b/code-interpreter':
        specifier: '>=1.0.0'
        version: 2.3.3
-      '@fly/sprites':
-        specifier: '>=0.0.1'
-        version: 0.0.1
      '@types/dockerode':
        specifier: ^4.0.0
        version: 4.0.1
@ -2496,10 +2487,6 @@ packages:
    resolution: {integrity: sha512-vBZP4NlzfOlerQTnba4aqZoMhE/a9HY7HRqoOPaETQcSQuWEIyZMHGfVu6w9wGtGK5fED5qRs2DteVCjOH60sA==}
    engines: {node: '>=14'}

-  '@fly/sprites@0.0.1':
-    resolution: {integrity: sha512-1s+dIVi/pTMP4Aj4Mkg+4LoZ/+a0Kp6l9piPRxvpgEKm11b/eRiZgJwVytwAHeI/vtg2fuwcFExjtXOEfny/TA==}
-    engines: {node: '>=24.0.0'}
-
  '@grpc/grpc-js@1.14.3':
    resolution: {integrity: sha512-Iq8QQQ/7X3Sac15oB6p0FmUg/klxQvXLeileoqrTRGJYLV+/9tubbr9ipz0GKHjmXVsgFPo/+W+2cA8eNcR+XA==}
    engines: {node: '>=12.10.0'}
@ -6950,11 +6937,6 @@ packages:
    engines: {node: '>=14.17'}
    hasBin: true

-  typescript@6.0.2:
-    resolution: {integrity: sha512-bGdAIrZ0wiGDo5l8c++HWtbaNCWTS4UTv7RaTH/ThVIgjkveJt83m74bBHMJkuCbslY8ixgLBVZJIOiQlQTjfQ==}
-    engines: {node: '>=14.17'}
-    hasBin: true
-
  ufo@1.6.3:
    resolution: {integrity: sha512-yDJTmhydvl5lJzBmy/hyOAA0d+aqCBuwl818haVdYCRrWV84o7YyeVm4QlVHStqNrrJSTb6jKuFAVqAFsr+K3Q==}

@ -8993,8 +8975,6 @@ snapshots:

  '@fastify/busboy@2.1.1': {}

-  '@fly/sprites@0.0.1': {}
-
  '@grpc/grpc-js@1.14.3':
    dependencies:
      '@grpc/proto-loader': 0.8.0
@ -14164,34 +14144,6 @@ snapshots:
      - tsx
      - yaml

-  tsup@8.5.1(jiti@1.21.7)(postcss@8.5.6)(tsx@4.21.0)(typescript@6.0.2)(yaml@2.8.2):
-    dependencies:
-      bundle-require: 5.1.0(esbuild@0.27.3)
-      cac: 6.7.14
-      chokidar: 4.0.3
-      consola: 3.4.2
-      debug: 4.4.3
-      esbuild: 0.27.3
-      fix-dts-default-cjs-exports: 1.0.1
-      joycon: 3.1.1
-      picocolors: 1.1.1
-      postcss-load-config: 6.0.1(jiti@1.21.7)(postcss@8.5.6)(tsx@4.21.0)(yaml@2.8.2)
-      resolve-from: 5.0.0
-      rollup: 4.56.0
-      source-map: 0.7.6
-      sucrase: 3.35.1
-      tinyexec: 0.3.2
-      tinyglobby: 0.2.15
-      tree-kill: 1.2.2
-    optionalDependencies:
-      postcss: 8.5.6
-      typescript: 6.0.2
-    transitivePeerDependencies:
-      - jiti
-      - supports-color
-      - tsx
-      - yaml
-
  tsx@4.21.0:
    dependencies:
      esbuild: 0.27.3
@ -14242,8 +14194,6 @@ snapshots:

  typescript@5.9.3: {}

-  typescript@6.0.2: {}
-
  ufo@1.6.3: {}

  ultrahtml@1.6.0: {}
--- a/pnpm-workspace.yaml
+++ b/pnpm-workspace.yaml
@ -10,5 +10,6 @@ packages:
  - "sdks/gigacode/platforms/*"
  - "resources/vercel-ai-sdk-schemas"
  - "scripts/release"
+  - "scripts/sandbox-testing"
  - "examples/*"
  - "server/packages/sandbox-agent/tests/opencode-compat"
--- a/research/acp/friction.md
+++ b/research/acp/friction.md
@ -81,7 +81,7 @@ Update this file continuously during the migration.
 - Date: 2026-02-10
 - Area: Session lifecycle surface
 - Issue: ACP stable does not include v1-equivalent methods for session listing, explicit session termination/delete, or event-log polling.
- Impact: Direct lift-and-shift of the legacy session REST list, terminate, and event-polling behavior is not possible with ACP core only.
+- Impact: Direct lift-and-shift of `/v1/sessions`, `/terminate`, and `/events` polling is not possible with ACP core only.
 - Proposed direction: Define `_sandboxagent/session/*` extension methods for these control operations, while keeping core prompt flow on standard ACP methods.
 - Decision: Open.
 - Owner: Unassigned.
--- a/research/acp/inspector-unimplemented.md
+++ b/research/acp/inspector-unimplemented.md
@ -11,4 +11,4 @@ This tracks legacy inspector behaviors that do not yet have full parity on ACP v
 5. TDOO: Agent mode discovery before creating a session is not implemented (inspector currently returns cached-or-empty mode lists).
 6. TDOO: Agent model discovery before creating a session is not implemented (inspector currently returns cached-or-empty model lists).
 7. TDOO: Session listing only reflects sessions created by this inspector client instance (not full server/global session inventory).
-8. TDOO: Event history shown in inspector is synthesized from ACP traffic handled by the inspector compatibility layer, not the old canonical session-events backend history.
+8. TDOO: Event history shown in inspector is synthesized from ACP traffic handled by the inspector compatibility layer, not the old canonical `/v1/sessions/*/events` backend history.
--- a/research/acp/merge-acp.md
+++ b/research/acp/merge-acp.md
@ -20,8 +20,8 @@ Static v1 endpoints today:

 - `GET /v1/agents`
 - `POST /v1/agents/:agent/install`
- legacy session list endpoint
- legacy session detail endpoint
+- `GET /v1/sessions`
+- `GET /v1/sessions/:session_id`
 - `GET /v1/fs/entries`
 - `GET /v1/fs/file`
 - `PUT /v1/fs/file`
@ -76,8 +76,8 @@ Interpretation for clients: all agent/session operations and non-binary filesyst
 | --- | --- | --- |
 | `GET /v1/agents` | `_sandboxagent/agent/list` | Response keeps current `AgentListResponse` shape for low migration risk. |
 | `POST /v1/agents/:agent/install` | `_sandboxagent/agent/install` | Params include `agent`, `reinstall`, `agentVersion`, `agentProcessVersion`. |
-| legacy session list endpoint | `_sandboxagent/session/list` | Return current `SessionListResponse` shape (not ACP unstable list shape). |
-| legacy session detail endpoint | `_sandboxagent/session/get` | Return current `SessionInfo` shape; error on missing session. |
+| `GET /v1/sessions` | `_sandboxagent/session/list` | Return current `SessionListResponse` shape (not ACP unstable list shape). |
+| `GET /v1/sessions/:session_id` | `_sandboxagent/session/get` | Return current `SessionInfo` shape; error on missing session. |
 | `GET /v1/fs/entries` | `_sandboxagent/fs/list_entries` | Preserve path + optional `sessionId` resolution semantics. |
 | `GET /v1/fs/file` | keep HTTP + `_sandboxagent/fs/read_file` | HTTP is primary because responses may require large streaming reads; ACP variant exists for compatibility/smaller payloads. |
 | `PUT /v1/fs/file` | keep HTTP + `_sandboxagent/fs/write_file` | HTTP is primary for large binary writes; ACP variant exists for compatibility/smaller payloads. |
@ -143,7 +143,7 @@ Package boundary after migration:

 - `acp-http-client` remains protocol-pure ACP transport and generic `extMethod`/`extNotification`.
 - `sandbox-agent` remains the typed wrapper that maps convenience methods to `_sandboxagent/...` extension methods.
- No direct legacy agents/session REST fetches or non-binary `/v1/fs/*` fetches in SDK runtime code.
+- No direct `/v1/agents*`, `/v1/sessions*`, or non-binary `/v1/fs/*` fetches in SDK runtime code.
 - Binary file transfer keeps direct HTTP fetches on the three endpoints listed above.
 - SDK policy: prefer HTTP for `readFsFile`/`writeFsFile`/`uploadFsBatch` even if ACP extension variants exist.

@ -184,17 +184,17 @@ Alternative (optional): introduce a runtime-only control connection mode that do
 - TypeScript SDK (`sdks/typescript/src/client.ts`):
  - Repoint `listAgents`, `installAgent`, `listSessions`, `getSession`, `listFsEntries`, `deleteFsEntry`, `mkdirFs`, `moveFs`, and `statFs` to ACP extension calls.
  - Keep `readFsFile`, `writeFsFile`, and `uploadFsBatch` on HTTP endpoints.
-  - Remove direct runtime fetch usage for legacy agents/session REST endpoints and non-binary `/v1/fs/*`.
+  - Remove direct runtime fetch usage for `/v1/agents*`, `/v1/sessions*`, and non-binary `/v1/fs/*`.
  - Keep method names stable for callers.
  - Move these methods to connected-only semantics (`NotConnectedError` when disconnected).
 - CLI (`server/packages/sandbox-agent/src/cli.rs`):
-  - Make `api agents list/install` call ACP extension methods (via ACP post flow), not direct legacy agent HTTP calls.
+  - Make `api agents list/install` call ACP extension methods (via ACP post flow), not direct `/v1/agents*` HTTP calls.
 - Inspector flow/docs:
  - Stop depending on `GET /v1/agents` in startup path; use ACP extension instead.

 ### Phase 3: Remove Static Endpoints (Except Health + Binary FS Transfer)

- Remove route registrations for legacy agent/session REST endpoints and `/v1/fs/entries`, `/v1/fs/entry`, `/v1/fs/mkdir`, `/v1/fs/move`, `/v1/fs/stat` from `router.rs`.
+- Remove route registrations for `/v1/agents*`, `/v1/sessions*`, `/v1/fs/entries`, `/v1/fs/entry`, `/v1/fs/mkdir`, `/v1/fs/move`, `/v1/fs/stat` from `router.rs`.
 - Keep `/v1/health`, `/v1/rpc`, `GET /v1/fs/file`, `PUT /v1/fs/file`, and `POST /v1/fs/upload-batch`.
 - Optional short deprecation period: convert removed routes to `410 Gone` with explicit extension method in `detail`.

@ -237,6 +237,6 @@ Inspector:

 ## Open Decisions

-1. Should removed legacy agent/session REST endpoints and non-binary `/v1/fs/*` return `410` for one release or be dropped immediately?
+1. Should removed `/v1/agents*`, `/v1/sessions*`, and non-binary `/v1/fs/*` return `410` for one release or be dropped immediately?
 2. Do we keep a strict response-shape parity layer for session/file methods, or normalize to ACP-native shapes?
 3. Should `/` service-root remain as informational HTTP, or be treated as out-of-scope for this “only health static + binary fs transfer” policy?
--- a/research/acp/missing-features-spec/01-questions.md
+++ b/research/acp/missing-features-spec/01-questions.md
@ -59,11 +59,11 @@ struct PendingQuestion {
 }
 ```

-## Legacy Session REST Endpoints (from `router.rs`)
+## v1 HTTP Endpoints (from `router.rs`)

 ```
-session question reply endpoint   -> 204 No Content
-session question reject endpoint  -> 204 No Content
+POST /v1/sessions/{session_id}/questions/{question_id}/reply   -> 204 No Content
+POST /v1/sessions/{session_id}/questions/{question_id}/reject   -> 204 No Content
 ```

 ### `reply_question` handler
@ -122,7 +122,7 @@ Key flow:

 1. Agent emits `question.requested` event with `QuestionEventData { status: Requested, question_id, prompt, options }`
 2. Client renders question UI
-3. Client calls the legacy session question reply or reject endpoint with `{ answers: [["selected"]] }`
+3. Client calls `POST /v1/sessions/{id}/questions/{qid}/reply` with `{ answers: [["selected"]] }` or `POST .../reject`
 4. System emits `question.resolved` event with `QuestionEventData { status: Answered, response: Some("...") }` or `{ status: Rejected }`

 ## v1 Agent Capability
--- a/research/acp/missing-features-spec/07-session-termination.md
+++ b/research/acp/missing-features-spec/07-session-termination.md
@ -4,7 +4,7 @@

 ## Summary

-The legacy session REST API had an explicit terminate endpoint. ACP only has `session/cancel` (turn cancellation, not session kill) and `DELETE /v1/rpc` (connection close, not session termination). Need explicit session destroy/terminate semantics.
+The legacy v1 REST API had explicit session termination (`POST /v1/sessions/{id}/terminate`). ACP only has `session/cancel` (turn cancellation, not session kill) and `DELETE /v1/rpc` (connection close, not session termination). Need explicit session destroy/terminate semantics.

 ## Current v1 State

@ -20,7 +20,7 @@ The legacy session REST API had an explicit terminate endpoint. ACP only has `se
 ### HTTP Endpoint

 ```
-legacy session terminate endpoint
+POST /v1/sessions/{id}/terminate
 ```

 ### Handler (from `router.rs`)
--- a/research/acp/missing-features-spec/08-model-variants.md
+++ b/research/acp/missing-features-spec/08-model-variants.md
@ -49,7 +49,7 @@ Returned `AgentModelsResponse` with full model list including variants.
 ### Session Creation with Variant

 ```
-legacy session create endpoint
+POST /v1/sessions
 ```

 Body included `variant: Option<String>` to select a specific model variant at session creation time.
--- a/research/acp/missing-features-spec/10-include-raw.md
+++ b/research/acp/missing-features-spec/10-include-raw.md
@ -34,7 +34,7 @@ pub struct UniversalEvent {
 ### v1 Usage

 ```
-legacy event polling endpoint with `include_raw=true`
+GET /v1/sessions/{id}/events?include_raw=true
 ```

 When `include_raw=true`, each `UniversalEvent` included the verbatim JSON the agent process emitted before normalization into the universal schema.
--- a/research/acp/missing-features-spec/16-session-info.md
+++ b/research/acp/missing-features-spec/16-session-info.md
@ -1,10 +1,10 @@
 # Feature 16: Session Info

-**Implementation approach:** New session-info HTTP endpoints
+**Implementation approach:** New HTTP endpoints (`GET /v1/sessions`, `GET /v1/sessions/{id}`)

 ## Summary

-v1 `SessionInfo` tracked `event_count`, `created_at`, `updated_at`, and full `mcp` config. v1 has session data in the ACP runtime's `MetaSession` struct but no HTTP endpoints to query it. Add HTTP endpoints for session listing and detail.
+The legacy `SessionInfo` tracked `event_count`, `created_at`, `updated_at`, and full `mcp` config. The current v1 ACP runtime has session data in its `MetaSession` struct but no HTTP endpoints to query it. Add REST endpoints for session listing and detail.

 ## Current v1 State

@ -117,8 +117,8 @@ fn build_session_info(state: &SessionState) -> SessionInfo {
 ### New HTTP Endpoints

 ```
-session list endpoint         -> SessionListResponse
-session detail endpoint       -> SessionInfo
+GET /v1/sessions              -> SessionListResponse
+GET /v1/sessions/{id}         -> SessionInfo
 ```

 These are control-plane HTTP endpoints (not ACP), providing session visibility without requiring an active ACP connection.
@ -156,7 +156,7 @@ Need to add:

 | File | Change |
 |------|--------|
-| `server/packages/sandbox-agent/src/router.rs` | Add session list and session detail handlers; add response types |
+| `server/packages/sandbox-agent/src/router.rs` | Add `GET /v1/sessions` and `GET /v1/sessions/{id}` handlers; add response types |
 | `server/packages/sandbox-agent/src/acp_runtime/mod.rs` | Add `created_at` to `MetaSession`; add `ended` tracking; expose `list_sessions()` and `get_session()` public methods |
 | `sdks/typescript/src/client.ts` | Add `listSessions()` and `getSession(id)` methods |
 | `server/packages/sandbox-agent/tests/v1_api.rs` | Add session listing and detail tests |
@ -165,6 +165,6 @@ Need to add:

 | Doc | Change |
 |-----|--------|
-| `docs/openapi.json` | Add session list and session detail endpoint specs |
+| `docs/openapi.json` | Add `/v1/sessions` and `/v1/sessions/{id}` endpoint specs |
 | `docs/cli.mdx` | Add CLI `sessions list` and `sessions info` commands |
 | `docs/sdks/typescript.mdx` | Document session listing SDK methods |
--- a/research/acp/missing-features-spec/17-error-termination-metadata.md
+++ b/research/acp/missing-features-spec/17-error-termination-metadata.md
@ -171,7 +171,7 @@ When an agent process terminates with an error:
 ### Session Info Integration

 Termination metadata should be accessible via:
- the session info endpoint (Feature #16) — include `terminationInfo` in response when session has ended
+- `GET /v1/sessions/{id}` (Feature #16) — include `terminationInfo` in response when session has ended
 - `session/list` ACP response — include termination status in session entries

 ### Files to Modify
--- a/research/acp/missing-features-spec/plan.md
+++ b/research/acp/missing-features-spec/plan.md
@ -36,7 +36,7 @@ Session-level features that build on Phase A runtime tracking.

 | Order | Feature                                                      | Spec | Approach                                             | Effort |
 |:-----:|--------------------------------------------------------------|:----:|------------------------------------------------------|:------:|
-| B1    | [Session Info](./16-session-info.md)                         | #16  | New session info HTTP endpoints                     | Medium |
+| B1    | [Session Info](./16-session-info.md)                         | #16  | New `GET /v1/sessions` and `GET /v1/sessions/{id}`  | Medium |
 | B2    | [Session Termination](./07-session-termination.md)           | #7   | Idempotent `_sandboxagent/session/terminate`         | Medium |
 | B3    | [Error Termination Metadata](./17-error-termination-metadata.md) | #17  | Stderr capture + `_sandboxagent/session/ended` event | Medium |

--- a/research/acp/old-rest-openapi-list.md
+++ b/research/acp/old-rest-openapi-list.md
@ -17,16 +17,16 @@
 | /v1/fs/stat | UNIMPLEMENTED |
 | /v1/fs/upload-batch | UNIMPLEMENTED |
 | /v1/health | UNIMPLEMENTED |
-| legacy session list route | session/list (UNSTABLE) |
-| legacy session create/load/resume route | session/new \| session/load \| session/resume (UNSTABLE) |
-| legacy session events polling route | UNIMPLEMENTED |
-| legacy session events SSE route | session/update (notification stream) |
-| legacy session prompt route | session/prompt |
-| legacy session prompt + stream route | session/prompt + session/update notifications |
-| legacy permission reply route | session/request_permission response |
-| legacy question reject route | UNIMPLEMENTED |
-| legacy question reply route | UNIMPLEMENTED |
-| legacy session terminate route | session/cancel (turn cancellation only) |
+| /v1/sessions | session/list (UNSTABLE) |
+| /v1/sessions/{session_id} | session/new \| session/load \| session/resume (UNSTABLE) |
+| /v1/sessions/{session_id}/events | UNIMPLEMENTED |
+| /v1/sessions/{session_id}/events/sse | session/update (notification stream) |
+| /v1/sessions/{session_id}/messages | session/prompt |
+| /v1/sessions/{session_id}/messages/stream | session/prompt + session/update notifications |
+| /v1/sessions/{session_id}/permissions/{permission_id}/reply | session/request_permission response |
+| /v1/sessions/{session_id}/questions/{question_id}/reject | UNIMPLEMENTED |
+| /v1/sessions/{session_id}/questions/{question_id}/reply | UNIMPLEMENTED |
+| /v1/sessions/{session_id}/terminate | session/cancel (turn cancellation only) |
 | AgentCapabilities | initialize.result.agentCapabilities |
 | AgentCapabilities.commandExecution | UNIMPLEMENTED |
 | AgentCapabilities.errorEvents | UNIMPLEMENTED |
@ -427,7 +427,7 @@

 - `UNIMPLEMENTED` means there is no ACP-standard field/method with equivalent semantics in `schema.unstable.json`; implementation would require ACP extension methods (`_...`) and/or `_meta` payloads.
 - Rows mapped to `_meta[...]` are ACP-compatible extensions, not standard interoperable ACP fields; both sides must agree on names and semantics.
- Legacy event polling has no ACP equivalent; ACP is stream-first via `session/update` notifications over streamable HTTP.
+- Legacy event polling (`/v1/sessions/{session_id}/events`) has no ACP equivalent; ACP is stream-first via `session/update` notifications over streamable HTTP.
 - Session lifecycle differs: ACP has `session/new`, `session/load`, `session/resume` (UNSTABLE), and `session/fork` (UNSTABLE), but no standard explicit "close session" method.
 - Permission handling is request/response (`session/request_permission`) tied to JSON-RPC request IDs; it does not use standalone REST reply endpoints.
 - Question/answer HITL flow in the old schema has no standard ACP equivalent today (separate from permission prompts).
--- a/research/acp/spec.md
+++ b/research/acp/spec.md
@ -233,6 +233,8 @@ Non-ACP endpoints retained in v1:
 - `GET /v1/health`
 - `GET /v1/agents` (capabilities + install status)
 - `POST /v1/agents/{agent}/install`
+- `GET /v1/sessions`
+- `GET /v1/sessions/{id}`
 - `GET /v1/fs/file`
 - `PUT /v1/fs/file`
 - `POST /v1/fs/upload-batch`
--- a/research/acp/v1-schema-to-acp-mapping.md
+++ b/research/acp/v1-schema-to-acp-mapping.md
@ -54,16 +54,16 @@ Extension namespace used in this spec:
 | `POST /v1/fs/move` | `POST /v1/fs/move` | HTTP platform API | Port v1 behavior. |
 | `GET /v1/fs/stat` | `GET /v1/fs/stat` | HTTP platform API | Port v1 behavior. |
 | `POST /v1/fs/upload-batch` | `POST /v1/fs/upload-batch` | HTTP platform API | Tar upload/extract behavior from v1. |
-| legacy session list route | session/list | HTTP control-plane | Session inventory without ACP connection requirement. |
-| legacy session create route | `session/new` | Standard | Path `session_id` becomes alias in `_meta["sandboxagent.dev"].requestedSessionId`. |
-| legacy session prompt route | `session/prompt` | Standard | Asynchronous behavior comes from transport (request + stream). |
-| legacy session prompt + stream route | `session/prompt` + consume `session/update` on SSE | Standard | Streaming is transport-level, not a distinct ACP method. |
-| legacy session terminate route | `_sandboxagent/session/terminate` | Extension | Idempotent termination semantics distinct from `DELETE /v1/rpc`. |
-| legacy event polling route | `_sandboxagent/session/events` (poll view over ACP stream) | Extension | Optional compatibility helper; canonical v1 is stream consumption. |
-| legacy event SSE route | `GET /v1/rpc` SSE stream | Standard transport | Filter by sessionId client-side or via connection/session binding. |
-| legacy permission reply route | JSON-RPC response to pending `session/request_permission` request id | Standard | Bridge `permission_id` to request `id` in transport state. |
-| legacy question reply route | JSON-RPC response to pending `_sandboxagent/session/request_question` | Extension | ACP stable has no generic question/HITL request method. |
-| legacy question reject route | JSON-RPC response to pending `_sandboxagent/session/request_question` | Extension | Encode rejection in response outcome. |
+| `GET /v1/sessions` | `GET /v1/sessions` | HTTP control-plane | Session inventory without ACP connection requirement. |
+| `POST /v1/sessions/{session_id}` | `session/new` | Standard | Path `session_id` becomes alias in `_meta["sandboxagent.dev"].requestedSessionId`. |
+| `POST /v1/sessions/{session_id}/messages` | `session/prompt` | Standard | Asynchronous behavior comes from transport (request + stream). |
+| `POST /v1/sessions/{session_id}/messages/stream` | `session/prompt` + consume `session/update` on SSE | Standard | Streaming is transport-level, not a distinct ACP method. |
+| `POST /v1/sessions/{session_id}/terminate` | `_sandboxagent/session/terminate` | Extension | Idempotent termination semantics distinct from `DELETE /v1/rpc`. |
+| `GET /v1/sessions/{session_id}/events` | `_sandboxagent/session/events` (poll view over ACP stream) | Extension | Optional compatibility helper; canonical v1 is stream consumption. |
+| `GET /v1/sessions/{session_id}/events/sse` | `GET /v1/rpc` SSE stream | Standard transport | Filter by sessionId client-side or via connection/session binding. |
+| `POST /v1/sessions/{session_id}/permissions/{permission_id}/reply` | JSON-RPC response to pending `session/request_permission` request id | Standard | Bridge `permission_id` to request `id` in transport state. |
+| `POST /v1/sessions/{session_id}/questions/{question_id}/reply` | JSON-RPC response to pending `_sandboxagent/session/request_question` | Extension | ACP stable has no generic question/HITL request method. |
+| `POST /v1/sessions/{session_id}/questions/{question_id}/reject` | JSON-RPC response to pending `_sandboxagent/session/request_question` | Extension | Encode rejection in response outcome. |

 ### 3.1 `CreateSessionRequest` field mapping

--- a/scripts/release/update_version.ts
+++ b/scripts/release/update_version.ts
@ -45,6 +45,7 @@ const VERSION_REFERENCE_FILES = [
  "scripts/release/main.ts",
  "scripts/release/promote-artifacts.ts",
  "scripts/release/sdk.ts",
+  "scripts/sandbox-testing/test-sandbox.ts",
 ];

 export async function updateVersion(opts: ReleaseOpts) {
@ -147,7 +148,7 @@ async function updateVersionReferences(opts: ReleaseOpts, oldVersion: string, ol

    const original = content;

-    // Replace minor channel references (e.g. sandbox-agent@0.5.x -> sandbox-agent@0.5.x)
+    // Replace minor channel references (e.g. sandbox-agent@0.3.x -> sandbox-agent@0.4.x)
    content = content.replaceAll(`sandbox-agent@${oldMinorChannel}`, `sandbox-agent@${newMinorChannel}`);
    content = content.replaceAll(`@sandbox-agent/cli@${oldMinorChannel}`, `@sandbox-agent/cli@${newMinorChannel}`);
    content = content.replaceAll(`@sandbox-agent/react@${oldMinorChannel}`, `@sandbox-agent/react@${newMinorChannel}`);
@ -155,13 +156,6 @@ async function updateVersionReferences(opts: ReleaseOpts, oldVersion: string, ol
    // Replace install script URL channel
    content = content.replaceAll(`releases.rivet.dev/sandbox-agent/${oldMinorChannel}/`, `releases.rivet.dev/sandbox-agent/${newMinorChannel}/`);

-    // If references drifted (for example Cargo.toml version was bumped without updating docs),
-    // normalize any other pinned minor-channel references to the release's channel.
-    content = content.replaceAll(/sandbox-agent@0\.\d+\.x/g, `sandbox-agent@${newMinorChannel}`);
-    content = content.replaceAll(/@sandbox-agent\/cli@0\.\d+\.x/g, `@sandbox-agent/cli@${newMinorChannel}`);
-    content = content.replaceAll(/@sandbox-agent\/react@0\.\d+\.x/g, `@sandbox-agent/react@${newMinorChannel}`);
-    content = content.replaceAll(/releases\.rivet\.dev\/sandbox-agent\/0\.\d+\.x\//g, `releases.rivet.dev/sandbox-agent/${newMinorChannel}/`);
-
    // Replace Docker image tags (rivetdev/sandbox-agent:<anything>-full -> rivetdev/sandbox-agent:<version>-full)
    content = content.replaceAll(
      new RegExp(`rivetdev/sandbox-agent:[0-9]+\\.[0-9]+\\.[0-9]+(?:-[a-zA-Z0-9.]+)?-full`, "g"),
@ -180,7 +174,7 @@ async function updateVersionReferences(opts: ReleaseOpts, oldVersion: string, ol
  }

  if (modifiedFiles.length > 0) {
-    await $({ cwd: opts.root })`git add -f ${modifiedFiles}`;
+    await $({ cwd: opts.root })`git add ${modifiedFiles}`;
    console.log(`\nUpdated ${modifiedFiles.length} files with version references.`);
  } else {
    console.log(`\nNo version reference files needed updates.`);
--- a/scripts/sandbox-testing/package.json
+++ b/scripts/sandbox-testing/package.json
@ -0,0 +1,21 @@
+{
+  "name": "@sandbox-agent/testing",
+  "private": true,
+  "type": "module",
+  "scripts": {
+    "test": "tsx test-sandbox.ts",
+    "test:docker": "tsx test-sandbox.ts docker",
+    "test:daytona": "tsx test-sandbox.ts daytona",
+    "test:mock": "tsx test-sandbox.ts docker --agent=mock",
+    "test:verbose": "tsx test-sandbox.ts docker --verbose"
+  },
+  "dependencies": {
+    "@daytonaio/sdk": "latest",
+    "@e2b/code-interpreter": "latest"
+  },
+  "devDependencies": {
+    "@types/node": "latest",
+    "tsx": "latest",
+    "typescript": "latest"
+  }
+}
--- a/scripts/sandbox-testing/test-sandbox.ts
+++ b/scripts/sandbox-testing/test-sandbox.ts
@ -0,0 +1,720 @@
+#!/usr/bin/env npx tsx
+/**
+ * Sandbox Testing Script
+ *
+ * Tests sandbox-agent on various cloud sandbox providers.
+ * Usage: npx tsx test-sandbox.ts [provider] [options]
+ *
+ * Providers: daytona, e2b, docker
+ *
+ * Options:
+ *   --skip-build          Skip cargo build step
+ *   --use-release         Use pre-built release binary from releases.rivet.dev
+ *   --agent=<name>        Test specific agent (claude, codex, mock)
+ *   --skip-agent-install  Skip pre-installing agents (tests on-demand install like Daytona example)
+ *   --keep-alive          Don't cleanup sandbox after test
+ *   --verbose             Show all logs
+ */
+
+import { execSync, spawn } from "node:child_process";
+import { existsSync, readFileSync, mkdtempSync, writeFileSync, rmSync } from "node:fs";
+import { homedir, tmpdir } from "node:os";
+import { join, dirname } from "node:path";
+import { fileURLToPath } from "node:url";
+
+// ES modules have no built-in __dirname, so derive it from this module's URL.
+const __dirname = dirname(fileURLToPath(import.meta.url));
+// Two directories above the directory containing this script.
+const ROOT_DIR = join(__dirname, "../..");
+const SERVER_DIR = join(ROOT_DIR, "server");
+
+// Parse args
+const args = process.argv.slice(2);
+// The first argument that does not start with "--" selects the provider; defaults to "docker".
+const provider = args.find((a) => !a.startsWith("--")) || "docker";
+const skipBuild = args.includes("--skip-build");
+const useRelease = args.includes("--use-release");
+const skipAgentInstall = args.includes("--skip-agent-install");
+const keepAlive = args.includes("--keep-alive");
+const verbose = args.includes("--verbose");
+// Only the `--agent=<name>` form is recognised; a space-separated `--agent <name>` is not parsed here.
+const agentArg = args.find((a) => a.startsWith("--agent="))?.split("=")[1];
+
+// Colors
+// Console logger with ANSI-coloured level prefixes. `debug` prints only when --verbose was passed.
+const log = {
+  info: (msg: string) => console.log(`\x1b[34m[INFO]\x1b[0m ${msg}`),
+  success: (msg: string) => console.log(`\x1b[32m[OK]\x1b[0m ${msg}`),
+  error: (msg: string) => console.log(`\x1b[31m[ERROR]\x1b[0m ${msg}`),
+  warn: (msg: string) => console.log(`\x1b[33m[WARN]\x1b[0m ${msg}`),
+  debug: (msg: string) => verbose && console.log(`\x1b[90m[DEBUG]\x1b[0m ${msg}`),
+  section: (msg: string) => console.log(`\n\x1b[1m=== ${msg} ===\x1b[0m`),
+};
+
+/**
+ * Resolve the Anthropic and OpenAI API keys used by the tests.
+ *
+ * Environment variables take precedence. Any key still missing is looked up by
+ * running `sandbox-agent credentials extract-env --export` from a locally built
+ * binary (release build preferred, debug build as fallback) and parsing its
+ * `export KEY="value"` lines. The CLI lookup is best-effort: failures are only
+ * reported through `log.debug`.
+ *
+ * @returns The keys that could be found; a key that was not found stays `undefined`.
+ */
+function extractCredentials(): { anthropicApiKey?: string; openaiApiKey?: string } {
+  // First check environment variables
+  const envCreds = {
+    anthropicApiKey: process.env.ANTHROPIC_API_KEY,
+    openaiApiKey: process.env.OPENAI_API_KEY,
+  };
+
+  // If both are set in env, use them
+  if (envCreds.anthropicApiKey && envCreds.openaiApiKey) {
+    return envCreds;
+  }
+
+  // Try to extract using sandbox-agent CLI
+  try {
+    const binaryPath = join(ROOT_DIR, "target/release/sandbox-agent");
+    const debugBinaryPath = join(ROOT_DIR, "target/debug/sandbox-agent");
+    const binary = existsSync(binaryPath) ? binaryPath : existsSync(debugBinaryPath) ? debugBinaryPath : null;
+
+    if (binary) {
+      // The command is run through a shell, so quote the path: a checkout
+      // directory containing spaces would otherwise be split into several words.
+      const output = execSync(`"${binary}" credentials extract-env --export`, {
+        encoding: "utf-8",
+        stdio: ["pipe", "pipe", "pipe"],
+      });
+
+      // Parse export statements: export KEY="value"
+      for (const line of output.split("\n")) {
+        const match = line.match(/^export (\w+)="(.*)"/);
+        if (match) {
+          const [, key, value] = match;
+          // Never override a key that was already provided via the environment.
+          if (key === "ANTHROPIC_API_KEY" && !envCreds.anthropicApiKey) {
+            envCreds.anthropicApiKey = value;
+          } else if (key === "OPENAI_API_KEY" && !envCreds.openaiApiKey) {
+            envCreds.openaiApiKey = value;
+          }
+        }
+      }
+      log.debug(`Extracted credentials via sandbox-agent CLI`);
+    }
+  } catch (err) {
+    log.debug(`Failed to extract credentials via CLI: ${err}`);
+  }
+
+  return envCreds;
+}
+
+/**
+ * Returns the Anthropic API key reported by extractCredentials(), or
+ * `undefined` when none was found. Each call runs extractCredentials() again.
+ */
+function getAnthropicApiKey(): string | undefined {
+  return extractCredentials().anthropicApiKey;
+}
+
+/**
+ * Returns the OpenAI API key reported by extractCredentials(), or
+ * `undefined` when none was found. Each call runs extractCredentials() again.
+ */
+function getOpenAiApiKey(): string | undefined {
+  return extractCredentials().openaiApiKey;
+}
+
+/**
+ * Decide which sandbox-agent binary the tests should install.
+ *
+ * - `--use-release`: nothing is built; the sentinel string "RELEASE" is returned.
+ * - `--skip-build`: an already-built release binary is required and returned.
+ * - otherwise: `cargo build --release -p sandbox-agent` is run from the
+ *   workspace root and the resulting binary path is returned.
+ *
+ * @returns The local binary path, or the literal "RELEASE".
+ * @throws Error if `--skip-build` is set but no binary exists, or if the build fails.
+ */
+async function buildSandboxAgent(): Promise<string> {
+  log.section("Building sandbox-agent");
+
+  if (useRelease) {
+    log.info("Using pre-built release from releases.rivet.dev");
+    return "RELEASE";
+  }
+
+  // Cargo writes into the workspace-root target dir, not the server target dir.
+  const localBinary = join(ROOT_DIR, "target/release/sandbox-agent");
+
+  if (!skipBuild) {
+    log.info("Running cargo build --release...");
+    const cargoStdio = verbose ? "inherit" : "pipe";
+    try {
+      execSync("cargo build --release -p sandbox-agent", { cwd: ROOT_DIR, stdio: cargoStdio });
+    } catch (buildErr) {
+      throw new Error(`Build failed: ${buildErr}`);
+    }
+    log.success(`Built: ${localBinary}`);
+    return localBinary;
+  }
+
+  // --skip-build: the binary has to be there already.
+  if (existsSync(localBinary)) {
+    log.info(`Using existing binary: ${localBinary}`);
+    return localBinary;
+  }
+  throw new Error(`Binary not found at ${localBinary}. Run without --skip-build.`);
+}
+
+// Provider interface
+/** A backend that can create sandboxes for the tests to run in. */
+interface SandboxProvider {
+  /** Provider name (for example "docker"). */
+  name: string;
+  /** Names of environment variables that main() requires to be set before create() is called. */
+  requiredEnv: string[];
+  /** Create a new sandbox; `envVars` are handed to the sandbox as its environment. */
+  create(opts: { envVars: Record<string, string> }): Promise<Sandbox>;
+}
+
+/** Handle to one created sandbox. */
+interface Sandbox {
+  /** Provider-specific identifier of the sandbox. */
+  id: string;
+  /** Run a shell command inside the sandbox and report its output and exit code. */
+  exec(cmd: string): Promise<{ stdout: string; stderr: string; exitCode: number }>;
+  /** Copy a local file to `remotePath` in the sandbox (the providers in this file also mark it executable). */
+  upload(localPath: string, remotePath: string): Promise<void>;
+  /** URL under which the given sandbox port can be reached from the test process. */
+  getBaseUrl(port: number): Promise<string>;
+  /** Destroy the sandbox. */
+  cleanup(): Promise<void>;
+}
+
+// Docker provider
+// Uses Ubuntu because Claude Code and sandbox-agent are glibc binaries
+//
+// All docker CLI calls go through the host shell (execSync), so anything that
+// is not a fixed token must be quoted or kept off the command line entirely.
+const dockerProvider: SandboxProvider = {
+  name: "docker",
+  requiredEnv: [],
+  /**
+   * Start a detached ubuntu:22.04 container with container port 3000 published
+   * on a random host port, install curl + CA certificates, and return a handle.
+   *
+   * @throws if the container cannot be started or the dependency install fails
+   *         (in the latter case the half-initialised container is removed first).
+   */
+  async create({ envVars }) {
+    const id = `sandbox-test-${Date.now()}`;
+    const quietStdio = verbose ? "inherit" : "pipe";
+
+    // Wrap `s` in double quotes for a POSIX host shell, escaping the four
+    // characters that stay special inside double quotes: " \ $ and backtick.
+    const shellQuote = (s: string): string => '"' + s.replace(/(["\\$`])/g, "\\$1") + '"';
+
+    // Pass only the variable NAMES to `docker run -e`; docker then copies the
+    // values from the docker CLI's own environment. This keeps API keys out of
+    // the command line and avoids any quoting problems with their values.
+    const envArgs = Object.keys(envVars)
+      .map((k) => `-e ${k}`)
+      .join(" ");
+
+    log.info(`Creating Docker container: ${id}`);
+    execSync(`docker run -d --name ${id} ${envArgs} -p 0:3000 ubuntu:22.04 tail -f /dev/null`, {
+      stdio: quietStdio,
+      env: { ...process.env, ...envVars },
+    });
+
+    // Install dependencies
+    try {
+      execSync(`docker exec ${id} sh -c "apt-get update && apt-get install -y curl ca-certificates"`, {
+        stdio: quietStdio,
+      });
+    } catch (err) {
+      // The caller never receives a handle on failure, so remove the container here.
+      try {
+        execSync(`docker rm -f ${id}`, { stdio: "pipe" });
+      } catch {
+        // Best-effort removal; the install error below is the one worth reporting.
+      }
+      throw err;
+    }
+
+    return {
+      id,
+      async exec(cmd) {
+        try {
+          const stdout = execSync(`docker exec ${id} sh -c ${shellQuote(cmd)}`, {
+            encoding: "utf-8",
+            stdio: ["pipe", "pipe", "pipe"],
+          });
+          return { stdout, stderr: "", exitCode: 0 };
+        } catch (err: any) {
+          // execSync throws on a non-zero exit; translate that into a result object.
+          return { stdout: err.stdout || "", stderr: err.stderr || "", exitCode: err.status || 1 };
+        }
+      },
+      async upload(localPath, remotePath) {
+        execSync(`docker cp "${localPath}" ${id}:${remotePath}`, { stdio: quietStdio });
+        execSync(`docker exec ${id} chmod +x ${remotePath}`, { stdio: quietStdio });
+      },
+      async getBaseUrl(port) {
+        // `docker port` prints host:port mappings; the text after the last ":" is the host port.
+        const portMapping = execSync(`docker port ${id} ${port}`, { encoding: "utf-8" }).trim();
+        const hostPort = portMapping.split(":").pop();
+        return `http://localhost:${hostPort}`;
+      },
+      async cleanup() {
+        log.info(`Cleaning up container: ${id}`);
+        execSync(`docker rm -f ${id}`, { stdio: "pipe" });
+      },
+    };
+  },
+};
+
+// Daytona provider
+// Creates an ubuntu:22.04 sandbox through the Daytona SDK (loaded lazily so the
+// SDK is only imported when this provider is selected).
+const daytonaProvider: SandboxProvider = {
+  name: "daytona",
+  requiredEnv: ["DAYTONA_API_KEY"],
+  async create({ envVars }) {
+    const { Daytona } = await import("@daytonaio/sdk");
+    const daytona = new Daytona();
+
+    log.info("Creating Daytona sandbox...");
+    // NOTE: Tier 1/2 sandboxes have restricted network that cannot be overridden
+    // networkAllowList requires CIDR notation (IP ranges), not domain names
+    const sandbox = await daytona.create({
+      image: "ubuntu:22.04",
+      envVars,
+    });
+    const id = sandbox.id;
+
+    // Install curl
+    // NOTE(review): the result of this command is not inspected, so a failed
+    // install is only noticed later when curl is actually needed.
+    await sandbox.process.executeCommand("apt-get update && apt-get install -y curl ca-certificates");
+
+    return {
+      id,
+      async exec(cmd) {
+        const result = await sandbox.process.executeCommand(cmd);
+        // Daytona SDK returns: { exitCode, result: string, artifacts: { stdout: string } }
+        // stderr is always reported as empty here; a missing exit code is treated as 0.
+        return {
+          stdout: result.result || "",
+          stderr: "",
+          exitCode: result.exitCode ?? 0,
+        };
+      },
+      async upload(localPath, remotePath) {
+        const content = readFileSync(localPath);
+        // Daytona SDK signature: uploadFile(Buffer, remotePath)
+        await sandbox.fs.uploadFile(content, remotePath);
+        await sandbox.process.executeCommand(`chmod +x ${remotePath}`);
+      },
+      async getBaseUrl(port) {
+        // Second argument is presumably the URL lifetime in seconds (4 hours) — TODO confirm against the SDK.
+        const preview = await sandbox.getSignedPreviewUrl(port, 4 * 60 * 60);
+        return preview.url;
+      },
+      async cleanup() {
+        log.info(`Cleaning up Daytona sandbox: ${id}`);
+        // The argument is presumably a timeout in seconds — TODO confirm against the SDK.
+        await sandbox.delete(60);
+      },
+    };
+  },
+};
+
+// E2B provider
+// Creates a sandbox through the E2B code-interpreter SDK (loaded lazily so the
+// SDK is only imported when this provider is selected).
+const e2bProvider: SandboxProvider = {
+  name: "e2b",
+  requiredEnv: ["E2B_API_KEY"],
+  async create({ envVars }) {
+    const { Sandbox } = await import("@e2b/code-interpreter");
+
+    log.info("Creating E2B sandbox...");
+    let sandbox;
+    try {
+      sandbox = await Sandbox.create({
+        allowInternetAccess: true,
+        envs: envVars,
+      });
+    } catch (err: any) {
+      // Log the provider error for context, then let the caller handle it.
+      log.error(`E2B sandbox creation failed: ${err.message || err}`);
+      throw err;
+    }
+    const id = sandbox.sandboxId;
+
+    // Install curl (E2B uses Debian which has glibc, sandbox-agent will auto-detect)
+    const installResult = await sandbox.commands.run("sudo apt-get update && sudo apt-get install -y curl ca-certificates");
+    log.debug(`Install output: ${installResult.stdout} ${installResult.stderr}`);
+
+    return {
+      id,
+      async exec(cmd) {
+        // NOTE(review): confirm whether commands.run() rejects on a non-zero exit
+        // code; if it does, this method throws instead of returning exitCode.
+        const result = await sandbox.commands.run(cmd);
+        return {
+          stdout: result.stdout || "",
+          stderr: result.stderr || "",
+          exitCode: result.exitCode,
+        };
+      },
+      async upload(localPath, remotePath) {
+        const content = readFileSync(localPath);
+        await sandbox.files.write(remotePath, content);
+        await sandbox.commands.run(`chmod +x ${remotePath}`);
+      },
+      async getBaseUrl(port) {
+        return `https://${sandbox.getHost(port)}`;
+      },
+      async cleanup() {
+        log.info(`Cleaning up E2B sandbox: ${id}`);
+        await sandbox.kill();
+      },
+    };
+  },
+};
+
+/**
+ * Look up a sandbox provider by its command-line name.
+ *
+ * @param name One of "docker", "daytona" or "e2b".
+ * @returns The matching provider.
+ * @throws Error for any other name.
+ */
+function getProvider(name: string): SandboxProvider {
+  const registry = new Map<string, SandboxProvider>([
+    ["docker", dockerProvider],
+    ["daytona", daytonaProvider],
+    ["e2b", e2bProvider],
+  ]);
+
+  const found = registry.get(name);
+  if (found === undefined) {
+    throw new Error(`Unknown provider: ${name}. Available: docker, daytona, e2b`);
+  }
+  return found;
+}
+
+/**
+ * Put the sandbox-agent binary into the sandbox and verify that it runs.
+ *
+ * @param sandbox    Target sandbox.
+ * @param binaryPath Local binary to upload, or the sentinel "RELEASE" to run
+ *                   the published install script inside the sandbox instead.
+ * @throws Error if the install script fails or `sandbox-agent --version` does
+ *         not exit successfully afterwards.
+ */
+async function installSandboxAgent(sandbox: Sandbox, binaryPath: string): Promise<void> {
+  log.section("Installing sandbox-agent");
+
+  if (binaryPath === "RELEASE") {
+    log.info("Installing from releases.rivet.dev...");
+    const result = await sandbox.exec("curl -fsSL https://releases.rivet.dev/sandbox-agent/0.3.x/install.sh | sh");
+    log.debug(`Install output: ${result.stdout}`);
+    if (result.exitCode !== 0) {
+      throw new Error(`Install failed: ${result.stderr}`);
+    }
+  } else {
+    log.info(`Uploading local binary: ${binaryPath}`);
+    await sandbox.upload(binaryPath, "/usr/local/bin/sandbox-agent");
+  }
+
+  // Verify installation: a binary that is missing or cannot execute must fail
+  // here rather than be reported as installed with an empty version string.
+  const version = await sandbox.exec("sandbox-agent --version");
+  if (version.exitCode !== 0) {
+    throw new Error(`sandbox-agent --version failed (exit code ${version.exitCode}): ${version.stderr || version.stdout}`);
+  }
+  log.success(`Installed: ${version.stdout.trim()}`);
+}
+
+/**
+ * Pre-install the requested agents inside the sandbox.
+ *
+ * "claude" and "codex" are installed with `sandbox-agent install-agent`; "mock"
+ * needs no install. Any other name is skipped with a warning so the later
+ * session test can still exercise on-demand handling of that agent.
+ *
+ * @throws Error if installing "claude" or "codex" exits with a non-zero code.
+ */
+async function installAgents(sandbox: Sandbox, agents: string[]): Promise<void> {
+  log.section("Installing agents");
+
+  for (const agent of agents) {
+    if (agent === "claude" || agent === "codex") {
+      log.info(`Installing ${agent}...`);
+      const result = await sandbox.exec(`sandbox-agent install-agent ${agent}`);
+      if (result.exitCode !== 0) throw new Error(`Failed to install ${agent}: ${result.stderr}`);
+      log.success(`Installed ${agent}`);
+    } else if (agent === "mock") {
+      // Mock agent is built into sandbox-agent, no install needed
+      log.info("Mock agent is built-in, skipping install");
+    } else {
+      // Previously this case logged "Installing ..." and then did nothing at all.
+      log.warn(`No pre-install step known for agent "${agent}", skipping install`);
+    }
+  }
+}
+
+/**
+ * Launch `sandbox-agent server` in the background on port 3000 inside the
+ * sandbox and poll `GET /v1/health` once per second, up to 30 times, until it
+ * answers with `{ status: "ok" }`.
+ *
+ * @returns The base URL under which the server is reachable.
+ * @throws Error if the server never reports healthy; the server log is printed first.
+ */
+async function startServerAndCheckHealth(sandbox: Sandbox): Promise<string> {
+  log.section("Starting server");
+
+  // Output goes to /tmp/sandbox-agent.log so it can be shown if startup fails.
+  await sandbox.exec("nohup sandbox-agent server --no-token --host 0.0.0.0 --port 3000 >/tmp/sandbox-agent.log 2>&1 &");
+  log.info("Server started in background");
+
+  const baseUrl = await sandbox.getBaseUrl(3000);
+  log.info(`Base URL: ${baseUrl}`);
+
+  // One probe; any network or parse failure simply counts as "not healthy yet".
+  const isHealthy = async (): Promise<boolean> => {
+    try {
+      const res = await fetch(`${baseUrl}/v1/health`);
+      if (!res.ok) return false;
+      const payload = await res.json();
+      return payload.status === "ok";
+    } catch {
+      return false;
+    }
+  };
+
+  log.info("Waiting for health check...");
+  let attemptsLeft = 30;
+  while (attemptsLeft-- > 0) {
+    if (await isHealthy()) {
+      log.success("Health check passed!");
+      return baseUrl;
+    }
+    await new Promise((r) => setTimeout(r, 1000));
+  }
+
+  // Out of attempts: surface the server log before failing.
+  const serverLog = await sandbox.exec("cat /tmp/sandbox-agent.log");
+  log.error("Server logs:\n" + serverLog.stdout);
+  throw new Error("Health check failed after 30 seconds");
+}
+
+/**
+ * Post a message to a session and consume the streamed (SSE) reply,
+ * auto-approving every permission request seen on the stream.
+ *
+ * Text from `item.delta` events is echoed to stdout and accumulated. `error`
+ * and `agent.unparsed` events are remembered and turned into an exception once
+ * the stream has ended. Lines that are not `data: ` lines, the `[DONE]`
+ * marker, and payloads that are not valid JSON are ignored.
+ *
+ * @param baseUrl   Base URL of the sandbox-agent server.
+ * @param sessionId Session to send the message to.
+ * @param message   Message text.
+ * @returns The concatenated response text (may be empty).
+ * @throws Error if the request is rejected or the stream reported an error event.
+ */
+async function sendMessage(baseUrl: string, sessionId: string, message: string): Promise<string> {
+  log.info(`Sending message: "${message.slice(0, 60)}${message.length > 60 ? "..." : ""}"`);
+  const msgRes = await fetch(`${baseUrl}/v1/sessions/${sessionId}/messages/stream`, {
+    method: "POST",
+    headers: { "Content-Type": "application/json" },
+    body: JSON.stringify({ message }),
+  });
+  if (!msgRes.ok || !msgRes.body) {
+    throw new Error(`Failed to send message: ${await msgRes.text()}`);
+  }
+
+  const reader = msgRes.body.getReader();
+  const decoder = new TextDecoder();
+  let buffer = "";
+
+  // Mutable stream state, kept in one object because it is updated from the helpers below.
+  const state = {
+    responseText: "",
+    receivedText: false,
+    hasError: false,
+    errorMessage: "",
+  };
+  // Queue rather than a single slot: one network chunk can carry several
+  // permission requests, and each of them has to be answered.
+  const pendingPermissions: string[] = [];
+
+  // Interpret one line of the SSE stream.
+  const handleLine = (line: string): void => {
+    if (!line.startsWith("data: ")) return;
+    const data = line.slice(6);
+    if (data === "[DONE]") return;
+
+    try {
+      const event = JSON.parse(data);
+      log.debug(`Event: ${event.type}`);
+
+      if (event.type === "item.delta") {
+        const delta = event.data?.delta;
+        const text = typeof delta === "string" ? delta : delta?.text || "";
+        if (text) {
+          if (!state.receivedText) {
+            log.info("Receiving response...");
+            state.receivedText = true;
+          }
+          process.stdout.write(text);
+          state.responseText += text;
+        }
+      }
+
+      // Handle permission requests - auto-approve
+      if (event.type === "permission.requested") {
+        const permissionId = event.data?.permission_id;
+        if (permissionId) {
+          pendingPermissions.push(permissionId);
+          log.info(`Permission requested (${permissionId}), auto-approving...`);
+        }
+      }
+
+      if (event.type === "error") {
+        state.hasError = true;
+        state.errorMessage = event.data?.message || JSON.stringify(event.data);
+        log.error(`Error event: ${state.errorMessage}`);
+      }
+
+      if (event.type === "agent.unparsed") {
+        state.hasError = true;
+        state.errorMessage = `Agent unparsed: ${JSON.stringify(event.data)}`;
+        log.error(state.errorMessage);
+      }
+    } catch {
+      // Best-effort parsing: a payload that is not valid JSON is skipped.
+    }
+  };
+
+  // Answer every queued permission request; failures are only warned about so
+  // the stream keeps being consumed.
+  const approvePending = async (): Promise<void> => {
+    while (pendingPermissions.length > 0) {
+      const permId = pendingPermissions.shift()!;
+      try {
+        const approveRes = await fetch(`${baseUrl}/v1/sessions/${sessionId}/permissions/${permId}/reply`, {
+          method: "POST",
+          headers: { "Content-Type": "application/json" },
+          body: JSON.stringify({ reply: "once" }),
+        });
+        if (approveRes.ok) {
+          log.success(`Permission ${permId} approved`);
+        } else {
+          log.warn(`Failed to approve permission: ${await approveRes.text()}`);
+        }
+      } catch (err) {
+        log.warn(`Error approving permission: ${err}`);
+      }
+    }
+  };
+
+  while (true) {
+    const { done, value } = await reader.read();
+    if (done) break;
+
+    buffer += decoder.decode(value, { stream: true });
+    const lines = buffer.split("\n");
+    // The last element is an incomplete line (or ""); keep it for the next chunk.
+    buffer = lines.pop() || "";
+
+    for (const line of lines) {
+      handleLine(line);
+    }
+    await approvePending();
+  }
+
+  // Flush the decoder and process a final line that was not newline-terminated.
+  buffer += decoder.decode();
+  if (buffer) {
+    handleLine(buffer);
+    await approvePending();
+  }
+
+  if (state.receivedText) {
+    console.log(); // newline after response
+  }
+
+  if (state.hasError) {
+    throw new Error(`Agent returned error: ${state.errorMessage}`);
+  }
+
+  return state.responseText;
+}
+
+/**
+ * Smoke-test one agent: create a fresh session for it, send a single message
+ * and require a non-empty reply.
+ *
+ * @throws Error if the session cannot be created or the reply is empty.
+ */
+async function testAgent(baseUrl: string, agent: string, message: string): Promise<void> {
+  log.section(`Testing ${agent} agent`);
+
+  const sessionId = crypto.randomUUID();
+  const sessionUrl = `${baseUrl}/v1/sessions/${sessionId}`;
+
+  log.info(`Creating session ${sessionId}...`);
+  const created = await fetch(sessionUrl, {
+    method: "POST",
+    headers: { "Content-Type": "application/json" },
+    body: JSON.stringify({ agent }),
+  });
+  if (!created.ok) {
+    const detail = await created.text();
+    throw new Error(`Failed to create session: ${detail}`);
+  }
+  log.success("Session created");
+
+  const reply = await sendMessage(baseUrl, sessionId, message);
+  if (reply) {
+    log.success("Received response from agent");
+    return;
+  }
+  throw new Error("No response received from agent");
+}
+
+// Test that agent can actually modify files and run commands
+//
+// Creates a new session, asks the agent to write a file and then to run a shell
+// command, and verifies both side effects by reading the files back through
+// sandbox.exec(). Throws an Error on the first failed step.
+async function testAgentActions(baseUrl: string, agent: string, sandbox: Sandbox): Promise<void> {
+  log.section(`Testing ${agent} agent actions (file + command)`);
+
+  const sessionId = crypto.randomUUID();
+  const testFile = "/tmp/sandbox-test-file.txt";
+  const expectedContent = "Hello from sandbox test!";
+
+  // For Claude running as root in containers, we must use default permission mode
+  // and handle permissions via the API (bypass mode is not supported as root).
+  // For other agents, we can use bypass mode.
+  const permissionMode = agent === "claude" ? "default" : "bypass";
+  log.info(`Creating session ${sessionId} with permissionMode=${permissionMode}...`);
+  const createRes = await fetch(`${baseUrl}/v1/sessions/${sessionId}`, {
+    method: "POST",
+    headers: { "Content-Type": "application/json" },
+    body: JSON.stringify({ agent, permissionMode }),
+  });
+  if (!createRes.ok) {
+    throw new Error(`Failed to create session: ${await createRes.text()}`);
+  }
+  log.success("Session created");
+
+  // Ask agent to create a file
+  const fileMessage = `Create a file at ${testFile} with exactly this content (no quotes, no extra text): ${expectedContent}`;
+  await sendMessage(baseUrl, sessionId, fileMessage);
+
+  // Wait for agent to complete action after permission approval
+  // NOTE(review): this is a fixed 5 second pause, not a completion signal, and it
+  // is only applied after the first message (not after the command message below).
+  log.info("Waiting for agent to complete action...");
+  await new Promise((r) => setTimeout(r, 5000));
+
+  // Verify file was created
+  log.info("Verifying file was created...");
+  // stderr is merged into stdout (2>&1), so a cat failure message shows up in stdout.
+  const fileCheck = await sandbox.exec(`cat ${testFile} 2>&1`);
+  if (fileCheck.exitCode !== 0) {
+    throw new Error(`File was not created: ${fileCheck.stderr || fileCheck.stdout}`);
+  }
+  // NOTE(review): the check is a substring match on "Hello from sandbox test"
+  // (without the trailing "!"), not an exact comparison with expectedContent.
+  if (!fileCheck.stdout.includes("Hello from sandbox test")) {
+    throw new Error(`File content mismatch. Expected "${expectedContent}", got "${fileCheck.stdout.trim()}"`);
+  }
+  log.success(`File created with correct content: "${fileCheck.stdout.trim()}"`);
+
+  // Ask agent to run a command and create output
+  const cmdMessage = `Run this command and tell me the output: echo "command-test-$(date +%s)" > /tmp/cmd-output.txt && cat /tmp/cmd-output.txt`;
+  await sendMessage(baseUrl, sessionId, cmdMessage);
+
+  // Verify command was executed
+  log.info("Verifying command was executed...");
+  const cmdCheck = await sandbox.exec("cat /tmp/cmd-output.txt 2>&1");
+  if (cmdCheck.exitCode !== 0) {
+    throw new Error(`Command output file not found: ${cmdCheck.stderr || cmdCheck.stdout}`);
+  }
+  // Only the fixed prefix is checked; the timestamp suffix varies per run.
+  if (!cmdCheck.stdout.includes("command-test-")) {
+    throw new Error(`Command output mismatch. Expected "command-test-*", got "${cmdCheck.stdout.trim()}"`);
+  }
+  log.success(`Command executed successfully: "${cmdCheck.stdout.trim()}"`);
+}
+
+// Check environment diagnostics
+//
+// Runs a fixed list of read-only shell commands inside the sandbox and prints
+// each command's output under a bold heading. Nothing is asserted here; the
+// output is purely informational.
+async function checkEnvironment(sandbox: Sandbox): Promise<void> {
+  log.section("Environment diagnostics");
+
+  const checks = [
+    // Values are replaced with "<set>" so API keys are not printed.
+    { name: "Environment variables", cmd: "env | grep -E 'ANTHROPIC|OPENAI|CLAUDE|CODEX' | sed 's/=.*/=<set>/'" },
+    // Check the current user's home first, then /root and /home/user (E2B) explicitly
+    {
+      name: "Agent binaries",
+      cmd: "ls -la ~/.local/share/sandbox-agent/bin/ 2>/dev/null || ls -la /root/.local/share/sandbox-agent/bin/ 2>/dev/null || ls -la /home/user/.local/share/sandbox-agent/bin/ 2>/dev/null || echo 'No agents installed'",
+    },
+    {
+      name: "Claude version",
+      cmd: "~/.local/share/sandbox-agent/bin/claude --version 2>&1 || /root/.local/share/sandbox-agent/bin/claude --version 2>&1 || echo 'Claude not installed'",
+    },
+    { name: "sandbox-agent version", cmd: "sandbox-agent --version 2>/dev/null || echo 'Not installed'" },
+    { name: "Server process", cmd: "pgrep -a sandbox-agent 2>/dev/null || ps aux | grep sandbox-agent | grep -v grep || echo 'Not running'" },
+    { name: "Server logs (last 50 lines)", cmd: "tail -50 /tmp/sandbox-agent.log 2>/dev/null || echo 'No logs'" },
+    // The two network checks print the HTTP status code returned by the endpoint,
+    // or UNREACHABLE when curl itself fails.
+    {
+      name: "Network: api.anthropic.com",
+      cmd: "curl -s -o /dev/null -w '%{http_code}' --connect-timeout 5 https://api.anthropic.com/v1/messages 2>&1 || echo 'UNREACHABLE'",
+    },
+    {
+      name: "Network: api.openai.com",
+      cmd: "curl -s -o /dev/null -w '%{http_code}' --connect-timeout 5 https://api.openai.com/v1/models 2>&1 || echo 'UNREACHABLE'",
+    },
+  ];
+
+  // Run the checks one after another so the output order matches the list above.
+  for (const { name, cmd } of checks) {
+    const result = await sandbox.exec(cmd);
+    console.log(`\n\x1b[1m${name}:\x1b[0m`);
+    console.log(result.stdout || "(empty)");
+    if (result.stderr) console.log(`stderr: ${result.stderr}`);
+  }
+}
+
+/**
+ * Script entry point.
+ *
+ * Resolves credentials, picks the agents to test, builds (or selects) the
+ * sandbox-agent binary, creates a sandbox with the chosen provider and runs the
+ * install, health and agent tests inside it.
+ *
+ * On failure the environment diagnostics are printed, the sandbox is removed
+ * unless `--keep-alive` was given, and the process exits with status 1.
+ * On success the sandbox is removed; with `--keep-alive` that happens only
+ * after the user presses Ctrl+C.
+ */
+async function main() {
+  log.section(`Sandbox Testing (provider: ${provider})`);
+
+  // Check credentials
+  const anthropicKey = getAnthropicApiKey();
+  const openaiKey = getOpenAiApiKey();
+
+  log.info(`Anthropic API key: ${anthropicKey ? "found" : "not found"}`);
+  log.info(`OpenAI API key: ${openaiKey ? "found" : "not found"}`);
+
+  // Determine which agents to test
+  let agents: string[];
+  if (agentArg) {
+    agents = [agentArg];
+  } else if (anthropicKey) {
+    agents = ["claude"];
+  } else if (openaiKey) {
+    agents = ["codex"];
+  } else {
+    agents = ["mock"];
+    log.warn("No API keys found, using mock agent only");
+  }
+  log.info(`Agents to test: ${agents.join(", ")}`);
+
+  // Get provider
+  const prov = getProvider(provider);
+
+  // Check required env vars
+  for (const envVar of prov.requiredEnv) {
+    if (!process.env[envVar]) {
+      throw new Error(`Missing required environment variable: ${envVar}`);
+    }
+  }
+
+  // Build
+  const binaryPath = await buildSandboxAgent();
+
+  // Create sandbox
+  log.section(`Creating ${prov.name} sandbox`);
+  const envVars: Record<string, string> = {};
+  if (anthropicKey) envVars.ANTHROPIC_API_KEY = anthropicKey;
+  if (openaiKey) envVars.OPENAI_API_KEY = openaiKey;
+
+  const sandbox = await prov.create({ envVars });
+  log.success(`Created sandbox: ${sandbox.id}`);
+
+  try {
+    // Install sandbox-agent
+    await installSandboxAgent(sandbox, binaryPath);
+
+    // Install agents (unless --skip-agent-install to test on-demand install like Daytona example)
+    if (skipAgentInstall) {
+      log.info("Skipping agent pre-install (testing on-demand installation)");
+    } else {
+      await installAgents(sandbox, agents);
+    }
+
+    // Check environment
+    await checkEnvironment(sandbox);
+
+    // Start server and check health
+    const baseUrl = await startServerAndCheckHealth(sandbox);
+
+    // Test each agent
+    for (const agent of agents) {
+      // Basic response test
+      const message = agent === "mock" ? "hello" : "Say hello in 10 words or less";
+      await testAgent(baseUrl, agent, message);
+
+      // For real agents, also test file/command actions with permission handling.
+      // Claude uses default permission mode and we auto-approve via API.
+      // Other agents can use bypass mode.
+      if (agent !== "mock") {
+        await testAgentActions(baseUrl, agent, sandbox);
+      }
+    }
+
+    log.section("All tests passed!");
+
+    if (keepAlive) {
+      log.info(`Sandbox ${sandbox.id} is still running. Press Ctrl+C to cleanup.`);
+      log.info(`Base URL: ${await sandbox.getBaseUrl(3000)}`);
+      // A pending promise alone does not keep the Node.js event loop alive, so
+      // hold it open with a timer and resolve on Ctrl+C. Handling SIGINT here
+      // also lets the cleanup below run instead of the process being killed.
+      await new Promise<void>((resolve) => {
+        const holdOpen = setInterval(() => {}, 60000);
+        process.once("SIGINT", () => {
+          clearInterval(holdOpen);
+          resolve();
+        });
+      });
+    }
+  } catch (err) {
+    log.error(`Test failed: ${err}`);
+
+    // Show diagnostics on failure
+    try {
+      await checkEnvironment(sandbox);
+    } catch {
+      // Diagnostics are best-effort; the original failure is what matters.
+    }
+
+    // With --keep-alive the failed sandbox is deliberately left for inspection.
+    if (!keepAlive) {
+      await sandbox.cleanup();
+    }
+    process.exit(1);
+  }
+
+  // Success path: reached immediately, or after Ctrl+C when --keep-alive was given.
+  await sandbox.cleanup();
+}
+
+// Entry point: report any error that escapes main() and exit with a non-zero status.
+main().catch((err) => {
+  log.error(err.message || err);
+  process.exit(1);
+});
--- a/sdks/acp-http-client/package.json
+++ b/sdks/acp-http-client/package.json
@ -1,6 +1,6 @@
 {
  "name": "acp-http-client",
-  "version": "0.4.2",
+  "version": "0.5.0-rc.1",
  "description": "Protocol-faithful ACP JSON-RPC over streamable HTTP client.",
  "license": "Apache-2.0",
  "repository": {
--- a/sdks/cli-shared/package.json
+++ b/sdks/cli-shared/package.json
@ -1,6 +1,6 @@
 {
  "name": "@sandbox-agent/cli-shared",
-  "version": "0.4.2",
+  "version": "0.5.0-rc.1",
  "description": "Shared helpers for sandbox-agent CLI and SDK",
  "license": "Apache-2.0",
  "repository": {
--- a/sdks/cli/package.json
+++ b/sdks/cli/package.json
@ -1,6 +1,6 @@
 {
  "name": "@sandbox-agent/cli",
-  "version": "0.4.2",
+  "version": "0.5.0-rc.1",
  "description": "CLI for sandbox-agent - run AI coding agents in sandboxes",
  "license": "Apache-2.0",
  "repository": {
--- a/sdks/cli/platforms/darwin-arm64/package.json
+++ b/sdks/cli/platforms/darwin-arm64/package.json
@ -1,6 +1,6 @@
 {
  "name": "@sandbox-agent/cli-darwin-arm64",
-  "version": "0.4.2",
+  "version": "0.5.0-rc.1",
  "description": "sandbox-agent CLI binary for macOS ARM64",
  "license": "Apache-2.0",
  "repository": {
--- a/sdks/cli/platforms/darwin-x64/package.json
+++ b/sdks/cli/platforms/darwin-x64/package.json
@ -1,6 +1,6 @@
 {
  "name": "@sandbox-agent/cli-darwin-x64",
-  "version": "0.4.2",
+  "version": "0.5.0-rc.1",
  "description": "sandbox-agent CLI binary for macOS x64",
  "license": "Apache-2.0",
  "repository": {
--- a/sdks/cli/platforms/linux-arm64/package.json
+++ b/sdks/cli/platforms/linux-arm64/package.json
@ -1,6 +1,6 @@
 {
  "name": "@sandbox-agent/cli-linux-arm64",
-  "version": "0.4.2",
+  "version": "0.5.0-rc.1",
  "description": "sandbox-agent CLI binary for Linux arm64",
  "license": "Apache-2.0",
  "repository": {
--- a/sdks/cli/platforms/linux-x64/package.json
+++ b/sdks/cli/platforms/linux-x64/package.json
@ -1,6 +1,6 @@
 {
  "name": "@sandbox-agent/cli-linux-x64",
-  "version": "0.4.2",
+  "version": "0.5.0-rc.1",
  "description": "sandbox-agent CLI binary for Linux x64",
  "license": "Apache-2.0",
  "repository": {
--- a/sdks/cli/platforms/win32-x64/package.json
+++ b/sdks/cli/platforms/win32-x64/package.json
@ -1,6 +1,6 @@
 {
  "name": "@sandbox-agent/cli-win32-x64",
-  "version": "0.4.2",
+  "version": "0.5.0-rc.1",
  "description": "sandbox-agent CLI binary for Windows x64",
  "license": "Apache-2.0",
  "repository": {
--- a/sdks/gigacode/package.json
+++ b/sdks/gigacode/package.json
@ -1,6 +1,6 @@
 {
  "name": "@sandbox-agent/gigacode",
-  "version": "0.4.2",
+  "version": "0.5.0-rc.1",
  "description": "Gigacode CLI (sandbox-agent with OpenCode attach by default)",
  "license": "Apache-2.0",
  "repository": {
--- a/Show more
+++ b/Show more