docs: clean up orphaned docs and add session event types

Delete orphaned docs not in docs.json navigation (gigacode.mdx, foundry-self-hosting.mdx, session-transcript-schema.mdx, pi-support-plan.md). Remove outdated musl/glibc troubleshooting section. Add event types documentation with example payloads to agent-sessions.mdx. Co-Authored-By: Claude Opus 4.6 (1M context) <noreply@anthropic.com>
chore(release): update version to 0.4.2
2026-04-15 06:04:43 +00:00 · 2026-03-25 19:11:19 -07:00 · 2026-03-25 18:07:26 -07:00 · 2026-03-25 17:00:51 -04:00 · 2026-03-25 16:54:40 -04:00 · 2026-03-25 13:20:57 -07:00
131 changed files with 1663 additions and 2228 deletions
--- a/.claude/commands/post-release-testing.md
+++ b/.claude/commands/post-release-testing.md
@ -43,7 +43,7 @@ Manually verify the install script works in a fresh environment:
 ```bash
 docker run --rm alpine:latest sh -c "
  apk add --no-cache curl ca-certificates libstdc++ libgcc bash &&
-  curl -fsSL https://releases.rivet.dev/sandbox-agent/0.3.x/install.sh | sh &&
+  curl -fsSL https://releases.rivet.dev/sandbox-agent/0.4.x/install.sh | sh &&
  sandbox-agent --version
 "
 ```
--- a/CLAUDE.md
+++ b/CLAUDE.md
@ -20,7 +20,7 @@
 - For HTTP/CLI docs/examples, source of truth is:
  - `server/packages/sandbox-agent/src/router.rs`
  - `server/packages/sandbox-agent/src/cli.rs`
- Keep docs aligned to implemented endpoints/commands only (for example ACP under `/v1/acp`, not legacy `/v1/sessions` APIs).
+- Keep docs aligned to implemented endpoints/commands only (for example ACP under `/v1/acp`, not legacy session REST APIs).

 ## Change Tracking

@ -78,4 +78,3 @@
  - `scripts/release/main.ts`
  - `scripts/release/promote-artifacts.ts`
  - `scripts/release/sdk.ts`
-  - `scripts/sandbox-testing/test-sandbox.ts`
--- a/Cargo.toml
+++ b/Cargo.toml
@ -4,7 +4,7 @@ members = ["server/packages/*", "gigacode"]
 exclude = ["factory/packages/desktop/src-tauri", "foundry/packages/desktop/src-tauri"]

 [workspace.package]
-version = "0.5.0-rc.1"
+version = "0.4.2"
 edition = "2021"
 authors = [ "Rivet Gaming, LLC <developer@rivet.gg>" ]
 license = "Apache-2.0"
@ -13,13 +13,13 @@ description = "Universal API for automatic coding agents in sandboxes. Supports

 [workspace.dependencies]
 # Internal crates
-sandbox-agent = { version = "0.5.0-rc.1", path = "server/packages/sandbox-agent" }
-sandbox-agent-error = { version = "0.5.0-rc.1", path = "server/packages/error" }
-sandbox-agent-agent-management = { version = "0.5.0-rc.1", path = "server/packages/agent-management" }
-sandbox-agent-agent-credentials = { version = "0.5.0-rc.1", path = "server/packages/agent-credentials" }
-sandbox-agent-opencode-adapter = { version = "0.5.0-rc.1", path = "server/packages/opencode-adapter" }
-sandbox-agent-opencode-server-manager = { version = "0.5.0-rc.1", path = "server/packages/opencode-server-manager" }
-acp-http-adapter = { version = "0.5.0-rc.1", path = "server/packages/acp-http-adapter" }
+sandbox-agent = { version = "0.4.2", path = "server/packages/sandbox-agent" }
+sandbox-agent-error = { version = "0.4.2", path = "server/packages/error" }
+sandbox-agent-agent-management = { version = "0.4.2", path = "server/packages/agent-management" }
+sandbox-agent-agent-credentials = { version = "0.4.2", path = "server/packages/agent-credentials" }
+sandbox-agent-opencode-adapter = { version = "0.4.2", path = "server/packages/opencode-adapter" }
+sandbox-agent-opencode-server-manager = { version = "0.4.2", path = "server/packages/opencode-server-manager" }
+acp-http-adapter = { version = "0.4.2", path = "server/packages/acp-http-adapter" }

 # Serialization
 serde = { version = "1.0", features = ["derive"] }
--- a/README.md
+++ b/README.md
@ -80,11 +80,11 @@ Import the SDK directly into your Node or browser application. Full type safety
 **Install**

 ```bash
-npm install sandbox-agent@0.3.x
+npm install sandbox-agent@0.4.x
 ```

 ```bash
-bun add sandbox-agent@0.3.x
+bun add sandbox-agent@0.4.x
 # Optional: allow Bun to run postinstall scripts for native binaries (required for SandboxAgent.start()).
 bun pm trust @sandbox-agent/cli-linux-x64 @sandbox-agent/cli-linux-arm64 @sandbox-agent/cli-darwin-arm64 @sandbox-agent/cli-darwin-x64 @sandbox-agent/cli-win32-x64
 ```
@ -135,7 +135,7 @@ Run as an HTTP server and connect from any language. Deploy to E2B, Daytona, Ver

 ```bash
 # Install it
-curl -fsSL https://releases.rivet.dev/sandbox-agent/0.3.x/install.sh | sh
+curl -fsSL https://releases.rivet.dev/sandbox-agent/0.4.x/install.sh | sh
 # Run it
 sandbox-agent server --token "$SANDBOX_TOKEN" --host 127.0.0.1 --port 2468
 ```
@ -159,12 +159,12 @@ sandbox-agent server --no-token --host 127.0.0.1 --port 2468
 Install the CLI wrapper (optional but convenient):

 ```bash
-npm install -g @sandbox-agent/cli@0.3.x
+npm install -g @sandbox-agent/cli@0.4.x
 ```

 ```bash
 # Allow Bun to run postinstall scripts for native binaries.
-bun add -g @sandbox-agent/cli@0.3.x
+bun add -g @sandbox-agent/cli@0.4.x
 bun pm -g trust @sandbox-agent/cli-linux-x64 @sandbox-agent/cli-linux-arm64 @sandbox-agent/cli-darwin-arm64 @sandbox-agent/cli-darwin-x64 @sandbox-agent/cli-win32-x64
 ```

@ -179,11 +179,11 @@ sandbox-agent api sessions send-message-stream my-session --message "Hello" --en
 You can also use npx like:

 ```bash
-npx @sandbox-agent/cli@0.3.x --help
+npx @sandbox-agent/cli@0.4.x --help
 ```

 ```bash
-bunx @sandbox-agent/cli@0.3.x --help
+bunx @sandbox-agent/cli@0.4.x --help
 ```

 [CLI documentation](https://sandboxagent.dev/docs/cli)
--- a/docs/agent-sessions.mdx
+++ b/docs/agent-sessions.mdx
@ -51,6 +51,108 @@ await session.prompt([
 unsubscribe();
 ```

+### Event types
+
+Each event's `payload` contains a session update. The `sessionUpdate` field identifies the type.
+
+<AccordionGroup>
+<Accordion title="agent_message_chunk">
+Streamed text or content from the agent's response.
+
+```json
+{
+  "sessionUpdate": "agent_message_chunk",
+  "content": { "type": "text", "text": "Here's how the repository is structured..." }
+}
+```
+</Accordion>
+
+<Accordion title="agent_thought_chunk">
+Internal reasoning from the agent (chain-of-thought / extended thinking).
+
+```json
+{
+  "sessionUpdate": "agent_thought_chunk",
+  "content": { "type": "text", "text": "I should start by looking at the project structure..." }
+}
+```
+</Accordion>
+
+<Accordion title="user_message_chunk">
+Echo of the user's prompt being processed.
+
+```json
+{
+  "sessionUpdate": "user_message_chunk",
+  "content": { "type": "text", "text": "Summarize the repository structure." }
+}
+```
+</Accordion>
+
+<Accordion title="tool_call">
+The agent invoked a tool (file edit, terminal command, etc.).
+
+```json
+{
+  "sessionUpdate": "tool_call",
+  "toolCallId": "tc_abc123",
+  "title": "Read file",
+  "status": "in_progress",
+  "rawInput": { "path": "/src/index.ts" }
+}
+```
+</Accordion>
+
+<Accordion title="tool_call_update">
+Progress or result update for an in-progress tool call.
+
+```json
+{
+  "sessionUpdate": "tool_call_update",
+  "toolCallId": "tc_abc123",
+  "status": "completed",
+  "content": [{ "type": "text", "text": "import express from 'express';\n..." }]
+}
+```
+</Accordion>
+
+<Accordion title="plan">
+The agent's execution plan for the current task.
+
+```json
+{
+  "sessionUpdate": "plan",
+  "entries": [
+    { "content": "Read the project structure", "status": "completed" },
+    { "content": "Identify main entrypoints", "status": "in_progress" },
+    { "content": "Write summary", "status": "pending" }
+  ]
+}
+```
+</Accordion>
+
+<Accordion title="usage_update">
+Token usage metrics for the current turn.
+
+```json
+{
+  "sessionUpdate": "usage_update"
+}
+```
+</Accordion>
+
+<Accordion title="session_info_update">
+Session metadata changed (e.g. agent-generated title).
+
+```json
+{
+  "sessionUpdate": "session_info_update",
+  "title": "Repository structure analysis"
+}
+```
+</Accordion>
+</AccordionGroup>
+
 ## Fetch persisted event history

 ```ts
--- a/docs/architecture.mdx
+++ b/docs/architecture.mdx
@ -56,7 +56,7 @@ Agents are installed lazily on first use. To avoid the cold-start delay, pre-ins
 sandbox-agent install-agent --all
 ```

-The `rivetdev/sandbox-agent:0.5.0-rc.1-full` Docker image ships with all agents pre-installed.
+The `rivetdev/sandbox-agent:0.4.2-full` Docker image ships with all agents pre-installed.

 ## Production-ready agent orchestration

--- a/docs/deploy/boxlite.mdx
+++ b/docs/deploy/boxlite.mdx
@ -20,7 +20,7 @@ that BoxLite can load directly (BoxLite has its own image store separate from Do
 ```dockerfile
 FROM node:22-bookworm-slim
 RUN apt-get update && apt-get install -y curl ca-certificates && rm -rf /var/lib/apt/lists/*
-RUN curl -fsSL https://releases.rivet.dev/sandbox-agent/0.3.x/install.sh | sh
+RUN curl -fsSL https://releases.rivet.dev/sandbox-agent/0.4.x/install.sh | sh
 RUN sandbox-agent install-agent claude
 RUN sandbox-agent install-agent codex
 ```
--- a/docs/deploy/cloudflare.mdx
+++ b/docs/deploy/cloudflare.mdx
@ -25,7 +25,7 @@ cd my-sandbox
 ```dockerfile
 FROM cloudflare/sandbox:0.7.0

-RUN curl -fsSL https://releases.rivet.dev/sandbox-agent/0.3.x/install.sh | sh
+RUN curl -fsSL https://releases.rivet.dev/sandbox-agent/0.4.x/install.sh | sh
 RUN sandbox-agent install-agent claude && sandbox-agent install-agent codex

 EXPOSE 8000
@ -36,7 +36,7 @@ EXPOSE 8000
 For standalone scripts, use the `cloudflare` provider:

 ```bash
-npm install sandbox-agent@0.3.x @cloudflare/sandbox
+npm install sandbox-agent@0.4.x @cloudflare/sandbox
 ```

 ```typescript
--- a/docs/deploy/computesdk.mdx
+++ b/docs/deploy/computesdk.mdx
@ -14,7 +14,7 @@ description: "Deploy Sandbox Agent using ComputeSDK's provider-agnostic sandbox
 ## TypeScript example

 ```bash
-npm install sandbox-agent@0.3.x computesdk
+npm install sandbox-agent@0.4.x computesdk
 ```

 ```typescript
@ -27,7 +27,11 @@ if (process.env.OPENAI_API_KEY) envs.OPENAI_API_KEY = process.env.OPENAI_API_KEY

 const sdk = await SandboxAgent.start({
  sandbox: computesdk({
-    create: { envs },
+    create: {
+      envs,
+      image: process.env.COMPUTESDK_IMAGE,
+      templateId: process.env.COMPUTESDK_TEMPLATE_ID,
+    },
  }),
 });

@ -43,6 +47,7 @@ try {
 ```

 The `computesdk` provider handles sandbox creation, Sandbox Agent installation, agent setup, and server startup automatically. ComputeSDK routes to your configured provider behind the scenes.
+The `create` option now forwards the full ComputeSDK sandbox-create payload, including provider-specific fields such as `image` and `templateId` when the selected provider supports them.

 Before calling `SandboxAgent.start()`, configure ComputeSDK with your provider:

--- a/docs/deploy/daytona.mdx
+++ b/docs/deploy/daytona.mdx
@ -16,7 +16,7 @@ See [Daytona network limits](https://www.daytona.io/docs/en/network-limits/).
 ## TypeScript example

 ```bash
-npm install sandbox-agent@0.3.x @daytonaio/sdk
+npm install sandbox-agent@0.4.x @daytonaio/sdk
 ```

 ```typescript
@ -44,7 +44,7 @@ try {
 }
 ```

-The `daytona` provider uses the `rivetdev/sandbox-agent:0.5.0-rc.1-full` image by default and starts the server automatically.
+The `daytona` provider uses the `rivetdev/sandbox-agent:0.4.2-full` image by default and starts the server automatically.

 ## Using snapshots for faster startup

@ -61,7 +61,7 @@ if (!hasSnapshot) {
    name: SNAPSHOT,
    image: Image.base("ubuntu:22.04").runCommands(
      "apt-get update && apt-get install -y curl ca-certificates",
-      "curl -fsSL https://releases.rivet.dev/sandbox-agent/0.3.x/install.sh | sh",
+      "curl -fsSL https://releases.rivet.dev/sandbox-agent/0.4.x/install.sh | sh",
      "sandbox-agent install-agent claude",
      "sandbox-agent install-agent codex",
    ),
--- a/docs/deploy/docker.mdx
+++ b/docs/deploy/docker.mdx
@ -15,11 +15,11 @@ Run the published full image with all supported agents pre-installed:
 docker run --rm -p 3000:3000 \
  -e ANTHROPIC_API_KEY="$ANTHROPIC_API_KEY" \
  -e OPENAI_API_KEY="$OPENAI_API_KEY" \
-  rivetdev/sandbox-agent:0.5.0-rc.1-full \
+  rivetdev/sandbox-agent:0.4.2-full \
  server --no-token --host 0.0.0.0 --port 3000
 ```

-The `0.5.0-rc.1-full` tag pins the exact version. The moving `full` tag is also published for contributors who want the latest full image.
+The `0.4.2-full` tag pins the exact version. The moving `full` tag is also published for contributors who want the latest full image.

 If you also want the desktop API inside the container, install desktop dependencies before starting the server:

@ -31,7 +31,7 @@ docker run --rm -p 3000:3000 \
    apt-get update && \
    DEBIAN_FRONTEND=noninteractive apt-get install -y curl ca-certificates bash libstdc++6 && \
    rm -rf /var/lib/apt/lists/* && \
-    curl -fsSL https://releases.rivet.dev/sandbox-agent/0.3.x/install.sh | sh && \
+    curl -fsSL https://releases.rivet.dev/sandbox-agent/0.4.x/install.sh | sh && \
    sandbox-agent install desktop --yes && \
    sandbox-agent server --no-token --host 0.0.0.0 --port 3000"
 ```
@ -52,7 +52,7 @@ const docker = new Docker();
 const PORT = 3000;

 const container = await docker.createContainer({
-  Image: "rivetdev/sandbox-agent:0.5.0-rc.1-full",
+  Image: "rivetdev/sandbox-agent:0.4.2-full",
  Cmd: ["server", "--no-token", "--host", "0.0.0.0", "--port", `${PORT}`],
  Env: [
    `ANTHROPIC_API_KEY=${process.env.ANTHROPIC_API_KEY}`,
@ -86,7 +86,7 @@ RUN apt-get update && apt-get install -y --no-install-recommends \
    bash ca-certificates curl git && \
    rm -rf /var/lib/apt/lists/*

-RUN curl -fsSL https://releases.rivet.dev/sandbox-agent/0.3.x/install.sh | sh && \
+RUN curl -fsSL https://releases.rivet.dev/sandbox-agent/0.4.x/install.sh | sh && \
    sandbox-agent install-agent --all

 RUN useradd -m -s /bin/bash sandbox
--- a/docs/deploy/e2b.mdx
+++ b/docs/deploy/e2b.mdx
@ -11,7 +11,7 @@ description: "Deploy Sandbox Agent inside an E2B sandbox."
 ## TypeScript example

 ```bash
-npm install sandbox-agent@0.3.x @e2b/code-interpreter
+npm install sandbox-agent@0.4.x @e2b/code-interpreter
 ```

 ```typescript
@ -21,9 +21,11 @@ import { e2b } from "sandbox-agent/e2b";
 const envs: Record<string, string> = {};
 if (process.env.ANTHROPIC_API_KEY) envs.ANTHROPIC_API_KEY = process.env.ANTHROPIC_API_KEY;
 if (process.env.OPENAI_API_KEY) envs.OPENAI_API_KEY = process.env.OPENAI_API_KEY;
+const template = process.env.E2B_TEMPLATE;

 const sdk = await SandboxAgent.start({
  sandbox: e2b({
+    template,
    create: { envs },
  }),
 });
@ -41,7 +43,10 @@ try {

 The `e2b` provider handles sandbox creation, Sandbox Agent installation, agent setup, and server startup automatically. Sandboxes pause by default instead of being deleted, and reconnecting with the same `sandboxId` resumes them automatically.

+Pass `template` when you want to start from a custom E2B template alias or template ID. E2B base-image selection happens when you build the template, then `sandbox-agent/e2b` uses that template at sandbox creation time.
+
 ## Faster cold starts

 For faster startup, create a custom E2B template with Sandbox Agent and target agents pre-installed.
-See [E2B Custom Templates](https://e2b.dev/docs/sandbox-template).
+Build System 2.0 also lets you choose the template's base image in code.
+See [E2B Custom Templates](https://e2b.dev/docs/sandbox-template) and [E2B Base Images](https://e2b.dev/docs/template/base-image).
--- a/docs/deploy/foundry-self-hosting.mdx
+++ b/docs/deploy/foundry-self-hosting.mdx
@ -1,155 +0,0 @@
---
-title: "Foundry Self-Hosting"
-description: "Environment, credentials, and deployment setup for Sandbox Agent Foundry auth, GitHub, and billing."
---
-
-This guide documents the deployment contract for the Foundry product surface: app auth, GitHub onboarding, repository import, and billing.
-
-It also covers the local-development bootstrap that uses `.env.development` only when `NODE_ENV=development`.
-
-## Local Development
-
-For backend local development, the Foundry backend now supports a development-only dotenv bootstrap:
-
- It loads `.env.development.local` and `.env.development`
- It does this **only** when `NODE_ENV=development`
- It does **not** load dotenv files in production
-
-The example file lives at [`/.env.development.example`](https://github.com/rivet-dev/sandbox-agent/blob/main/.env.development.example).
-
-To use it locally:
-
-```bash
-cp .env.development.example .env.development
-```
-
-Run the backend with:
-
-```bash
-just foundry-backend-start
-```
-
-That recipe sets `NODE_ENV=development`, which enables the dotenv loader.
-
-### Local Defaults
-
-These values can be safely defaulted for local development:
-
- `APP_URL=http://localhost:4173`
- `BETTER_AUTH_URL=http://localhost:7741`
- `BETTER_AUTH_SECRET=sandbox-agent-foundry-development-only-change-me`
- `GITHUB_REDIRECT_URI=http://localhost:7741/v1/auth/callback/github`
-
-These should be treated as development-only values.
-
-## Production Environment
-
-For production or self-hosting, set these as real environment variables in your deployment platform. Do not rely on dotenv file loading.
-
-### App/Auth
-
-| Variable | Required | Notes |
-|---|---:|---|
-| `APP_URL` | Yes | Public frontend origin |
-| `BETTER_AUTH_URL` | Yes | Public auth base URL |
-| `BETTER_AUTH_SECRET` | Yes | Strong random secret for auth/session signing |
-
-### GitHub OAuth
-
-| Variable | Required | Notes |
-|---|---:|---|
-| `GITHUB_CLIENT_ID` | Yes | GitHub OAuth app client id |
-| `GITHUB_CLIENT_SECRET` | Yes | GitHub OAuth app client secret |
-| `GITHUB_REDIRECT_URI` | Yes | GitHub OAuth callback URL |
-
-Use GitHub OAuth for:
-
- user sign-in
- user identity
- org selection
- access to the signed-in user’s GitHub context
-
-## GitHub App
-
-If your Foundry deployment uses GitHub App-backed organization install and repo import, also configure:
-
-| Variable | Required | Notes |
-|---|---:|---|
-| `GITHUB_APP_ID` | Yes | GitHub App id |
-| `GITHUB_APP_CLIENT_ID` | Yes | GitHub App client id |
-| `GITHUB_APP_CLIENT_SECRET` | Yes | GitHub App client secret |
-| `GITHUB_APP_PRIVATE_KEY` | Yes | PEM private key for installation auth |
-
-For `.env.development` and `.env.development.local`, store `GITHUB_APP_PRIVATE_KEY` as a quoted single-line value with `\n` escapes instead of raw multi-line PEM text.
-
-Recommended GitHub App permissions:
-
- Repository `Metadata: Read`
- Repository `Contents: Read & Write`
- Repository `Pull requests: Read & Write`
- Repository `Checks: Read`
- Repository `Commit statuses: Read`
-
-Set the webhook URL to `https://<your-backend-host>/v1/webhooks/github` and generate a webhook secret. Store the secret as `GITHUB_WEBHOOK_SECRET`.
-
-This is required, not optional. Foundry depends on GitHub App webhook delivery for installation lifecycle changes, repo access changes, and ongoing repo / pull request sync. If the GitHub App is not installed for the workspace, or webhook delivery is misconfigured, Foundry will remain in an install / reconnect state and core GitHub-backed functionality will not work correctly.
-
-Recommended webhook subscriptions:
-
- `installation`
- `installation_repositories`
- `pull_request`
- `pull_request_review`
- `pull_request_review_comment`
- `push`
- `create`
- `delete`
- `check_suite`
- `check_run`
- `status`
-
-Use the GitHub App for:
-
- installation/reconnect state
- org repo import
- repository sync
- PR creation and updates
-
-Use GitHub OAuth for:
-
- who the user is
- which orgs they can choose
-
-## Stripe
-
-For live billing, configure:
-
-| Variable | Required | Notes |
-|---|---:|---|
-| `STRIPE_SECRET_KEY` | Yes | Server-side Stripe secret key |
-| `STRIPE_PUBLISHABLE_KEY` | Yes | Client-side Stripe publishable key |
-| `STRIPE_WEBHOOK_SECRET` | Yes | Signing secret for billing webhooks |
-| `STRIPE_PRICE_TEAM` | Yes | Stripe price id for the Team plan checkout session |
-
-Stripe should own:
-
- hosted checkout
- billing portal
- subscription status
- invoice history
- webhook-driven state sync
-
-## Mock Invariant
-
-Foundry’s mock client path should continue to work end to end even when the real auth/GitHub/Stripe path exists.
-
-That includes:
-
- sign-in
- org selection/import
- settings
- billing UI
- workspace/task/session flow
- seat accrual
-
-Use mock mode for deterministic UI review and local product development. Use the real env-backed path for integration and self-hosting.
--- a/docs/deploy/local.mdx
+++ b/docs/deploy/local.mdx
@ -9,7 +9,7 @@ For local development, run Sandbox Agent directly on your machine.

 ```bash
 # Install
-curl -fsSL https://releases.rivet.dev/sandbox-agent/0.3.x/install.sh | sh
+curl -fsSL https://releases.rivet.dev/sandbox-agent/0.4.x/install.sh | sh

 # Run
 sandbox-agent server --no-token --host 127.0.0.1 --port 2468
@ -20,12 +20,12 @@ Or with npm/Bun:
 <Tabs>
  <Tab title="npx">
    ```bash
-    npx @sandbox-agent/cli@0.3.x server --no-token --host 127.0.0.1 --port 2468
+    npx @sandbox-agent/cli@0.4.x server --no-token --host 127.0.0.1 --port 2468
    ```
  </Tab>
  <Tab title="bunx">
    ```bash
-    bunx @sandbox-agent/cli@0.3.x server --no-token --host 127.0.0.1 --port 2468
+    bunx @sandbox-agent/cli@0.4.x server --no-token --host 127.0.0.1 --port 2468
    ```
  </Tab>
 </Tabs>
--- a/docs/deploy/modal.mdx
+++ b/docs/deploy/modal.mdx
@ -11,7 +11,7 @@ description: "Deploy Sandbox Agent inside a Modal sandbox."
 ## TypeScript example

 ```bash
-npm install sandbox-agent@0.3.x modal
+npm install sandbox-agent@0.4.x modal
 ```

 ```typescript
@ -21,9 +21,11 @@ import { modal } from "sandbox-agent/modal";
 const secrets: Record<string, string> = {};
 if (process.env.ANTHROPIC_API_KEY) secrets.ANTHROPIC_API_KEY = process.env.ANTHROPIC_API_KEY;
 if (process.env.OPENAI_API_KEY) secrets.OPENAI_API_KEY = process.env.OPENAI_API_KEY;
+const baseImage = process.env.MODAL_BASE_IMAGE ?? "node:22-slim";

 const sdk = await SandboxAgent.start({
  sandbox: modal({
+    image: baseImage,
    create: { secrets },
  }),
 });
@ -40,6 +42,7 @@ try {
 ```

 The `modal` provider handles app creation, image building, sandbox provisioning, agent installation, server startup, and tunnel networking automatically.
+Set `image` to change the base Docker image before Sandbox Agent and its agent binaries are layered on top. You can also pass a prebuilt Modal `Image` object.

 ## Faster cold starts

--- a/docs/deploy/vercel.mdx
+++ b/docs/deploy/vercel.mdx
@ -11,7 +11,7 @@ description: "Deploy Sandbox Agent inside a Vercel Sandbox."
 ## TypeScript example

 ```bash
-npm install sandbox-agent@0.3.x @vercel/sandbox
+npm install sandbox-agent@0.4.x @vercel/sandbox
 ```

 ```typescript
--- a/docs/docs.json
+++ b/docs/docs.json
@ -1,6 +1,6 @@
 {
  "$schema": "https://mintlify.com/docs.json",
-  "theme": "willow",
+  "theme": "mint",
  "name": "Sandbox Agent SDK",
  "appearance": {
    "default": "dark",
@ -8,8 +8,8 @@
  },
  "colors": {
    "primary": "#ff4f00",
-    "light": "#ff4f00",
-    "dark": "#ff4f00"
+    "light": "#ff6a2a",
+    "dark": "#cc3f00"
  },
  "favicon": "/favicon.svg",
  "logo": {
@ -25,17 +25,13 @@
  },
  "navbar": {
    "links": [
-      {
-        "label": "Gigacode",
-        "icon": "terminal",
-        "href": "https://github.com/rivet-dev/sandbox-agent/tree/main/gigacode"
-      },
      {
        "label": "Discord",
        "icon": "discord",
        "href": "https://discord.gg/auCecybynK"
      },
      {
+        "label": "GitHub",
        "type": "github",
        "href": "https://github.com/rivet-dev/sandbox-agent"
      }
@ -89,13 +85,10 @@
            "group": "System",
            "pages": ["file-system", "processes", "computer-use", "common-software"]
          },
-          {
-            "group": "Orchestration",
-            "pages": ["orchestration-architecture", "session-persistence", "observability", "multiplayer", "security"]
-          },
          {
            "group": "Reference",
            "pages": [
+              "troubleshooting",
              "architecture",
              "cli",
              "inspector",
@ -127,5 +120,11 @@
        ]
      }
    ]
+  },
+  "__removed": [
+	  {
+		"group": "Orchestration",
+		"pages": ["orchestration-architecture", "session-persistence", "observability", "multiplayer", "security"]
 	  }
+  ]
 }
--- a/docs/gigacode.mdx
+++ b/docs/gigacode.mdx
@ -1,6 +0,0 @@
---
-title: Gigacode
-url: "https://github.com/rivet-dev/sandbox-agent/tree/main/gigacode"
---
-
-
--- a/docs/openapi.json
+++ b/docs/openapi.json
@ -10,7 +10,7 @@
    "license": {
      "name": "Apache-2.0"
    },
-    "version": "0.5.0-rc.1"
+    "version": "0.4.2"
  },
  "servers": [
    {
--- a/docs/pi-support-plan.md
+++ b/docs/pi-support-plan.md
@ -1,210 +0,0 @@
-# Pi Agent Support Plan (pi-mono)
-
-## Implementation Status Update
-
- Runtime selection now supports two internal modes:
-  - `PerSession` (default for unknown/non-allowlisted Pi capabilities)
-  - `Shared` (allowlist-only compatibility path)
- Pi sessions now use per-session process isolation by default, enabling true concurrent Pi sessions in Inspector and API clients.
- Shared Pi server code remains available and is used only when capability checks allow multiplexing.
- Session termination for per-session Pi mode hard-kills the underlying Pi process and clears queued prompts/pending waiters.
- In-session concurrent sends are serialized with an unbounded daemon-side FIFO queue per session.
-
-## Investigation Summary
-
-### Pi CLI modes and RPC protocol
- Pi supports multiple modes including interactive, print/JSON output, RPC, and SDK usage. JSON mode outputs a stream of JSON events suitable for parsing, and RPC mode is intended for programmatic control over stdin/stdout.
- RPC mode is started with `pi --mode rpc` and supports options like `--provider`, `--model`, `--no-session`, and `--session-dir`.
- The RPC protocol is newline-delimited JSON over stdin/stdout:
-  - Commands are JSON objects written to stdin.
-  - Responses are JSON objects with `type: "response"` and optional `id`.
-  - Events are JSON objects without `id`.
- `prompt` can include images using `ImageContent` (base64 or URL) alongside text.
- JSON/print mode (`pi -p` or `pi --print --mode json`) produces JSONL for non-interactive parsing and can resume sessions with a token.
-
-### RPC commands
-RPC commands listed in `rpc.md` include:
- `new_session`, `get_state`, `list_sessions`, `delete_session`, `rename_session`, `clear_session`
- `prompt`, `queue_message`, `abort`, `get_queued_messages`
-
-### RPC event types
-RPC events listed in `rpc.md` include:
- `agent_start`, `agent_end`
- `turn_start`, `turn_end`
- `message_start`, `message_update`, `message_end`
- `tool_execution_start`, `tool_execution_update`, `tool_execution_end`
- `auto_compaction`, `auto_retry`, `hook_error`
-
-`message_update` uses `assistantMessageEvent` deltas such as:
- `start`, `text_start`, `text_delta`, `text_end`
- `thinking_start`, `thinking_delta`, `thinking_end`
- `toolcall_start`, `toolcall_delta`, `toolcall_end`
- `toolcall_args_start`, `toolcall_args_delta`, `toolcall_args_end`
- `done`, `error`
-
-`tool_execution_update` includes `partialResult`, which is described as accumulated output so far.
-
-### Schema source locations (pi-mono)
-RPC types are documented as living in:
- `packages/ai/src/types.ts` (Model types)
- `packages/agent/src/types.ts` (AgentResponse types)
- `packages/coding-agent/src/core/messages.ts` (message types)
- `packages/coding-agent/src/modes/rpc/rpc-types.ts` (RPC protocol types)
-
-### Distribution assets
-Pi releases provide platform-specific binaries such as:
- `pi-darwin-arm64`, `pi-darwin-x64`
- `pi-linux-arm64`, `pi-linux-x64`
- `pi-win-x64.zip`
-
-## Integration Decisions
- Follow the OpenCode pattern: a shared long-running process (stdio RPC) with session multiplexing.
- Primary integration path is RPC streaming (`pi --mode rpc`).
- JSON/print mode is a fallback only (diagnostics or non-interactive runs).
- Create sessions via `new_session`; store the returned `sessionId` as `native_session_id`.
- Use `get_state` as a re-sync path after server restarts.
- Use `prompt` for send-message, with optional image content.
- Convert Pi events into universal events; emit daemon synthetic `session.started` on session creation and `session.ended` only on errors/termination.
-
-## Implementation Plan
-
-### 1) Agent Identity + Capabilities
-Files:
- `server/packages/agent-management/src/agents.rs`
- `server/packages/sandbox-agent/src/router.rs`
- `docs/cli.mdx`, `docs/conversion.mdx`, `docs/session-transcript-schema.mdx`
- `README.md`, `frontend/packages/website/src/components/FAQ.tsx`
-
-Tasks:
- Add `AgentId::Pi` with string/binary name `"pi"` and parsing rules.
- Add Pi to `all_agents()` and agent lists.
- Define `AgentCapabilities` for Pi:
-  - `tool_calls=true`, `tool_results=true`
-  - `text_messages=true`, `streaming_deltas=true`, `item_started=true`
-  - `reasoning=true` (from `thinking_*` deltas)
-  - `images=true` (ImageContent in `prompt`)
-  - `permissions=false`, `questions=false`, `mcp_tools=false`
-  - `shared_process=true`, `session_lifecycle=false` (no native session events)
-  - `error_events=true` (hook_error)
-  - `command_execution=false`, `file_changes=false`, `file_attachments=false`
-
-### 2) Installer and Binary Resolution
-Files:
- `server/packages/agent-management/src/agents.rs`
-
-Tasks:
- Add `install_pi()` that:
-  - Downloads the correct release asset per platform (`pi-<platform>`).
-  - Handles `.zip` on Windows and raw binaries elsewhere.
-  - Marks binary executable.
- Add Pi to `AgentManager::install`, `is_installed`, `version`.
- Version detection: try `--version`, `version`, `-V`.
-
-### 3) Schema Extraction for Pi
-Files:
- `resources/agent-schemas/src/pi.ts` (new)
- `resources/agent-schemas/src/index.ts`
- `resources/agent-schemas/artifacts/json-schema/pi.json`
- `server/packages/extracted-agent-schemas/build.rs`
- `server/packages/extracted-agent-schemas/src/lib.rs`
-
-Tasks:
- Implement `extractPiSchema()`:
-  - Download pi-mono sources (zip/tarball) into a temp dir.
-  - Use `ts-json-schema-generator` against `packages/coding-agent/src/modes/rpc/rpc-types.ts`.
-  - Include dependent files per `rpc.md` (ai/types, agent/types, core/messages).
-  - Extract `RpcEvent`, `RpcResponse`, `RpcCommand` unions (exact type names from source).
- Add fallback schema if remote fetch fails (minimal union with event/response fields).
- Wire pi into extractor index and artifact generation.
-
-### 4) Universal Schema Conversion (Pi -> Universal)
-Files:
- `server/packages/universal-agent-schema/src/agents/pi.rs` (new)
- `server/packages/universal-agent-schema/src/agents/mod.rs`
- `server/packages/universal-agent-schema/src/lib.rs`
- `server/packages/sandbox-agent/src/router.rs`
-
-Mapping rules:
- `message_start` -> `item.started` (kind=message, role=assistant, native_item_id=messageId)
- `message_update`:
-  - `text_*` -> `item.delta` (assistant text delta)
-  - `thinking_*` -> `item.delta` with `ContentPart::Reasoning` (visibility=Private)
-  - `toolcall_*` and `toolcall_args_*` -> ignore for now (tool_execution_* is authoritative)
-  - `error` -> `item.completed` with `ItemStatus::Failed` (if no later message_end)
- `message_end` -> `item.completed` (finalize assistant message)
- `tool_execution_start` -> `item.started` (kind=tool_call, ContentPart::ToolCall)
- `tool_execution_update` -> `item.delta` for a synthetic tool_result item:
-  - Maintain a per-toolCallId buffer to compute delta from accumulated `partialResult`.
- `tool_execution_end` -> `item.completed` (kind=tool_result, output from `result.content`)
-  - If `isError=true`, set item status to failed.
- `agent_start`, `turn_start`, `turn_end`, `agent_end`, `auto_compaction`, `auto_retry`, `hook_error`:
-  - Map to `ItemKind::Status` with a label like `pi.agent_start`, `pi.auto_retry`, etc.
-  - Do not emit `session.ended` for these events.
- If event parsing fails, emit `agent.unparsed` (source=daemon, synthetic=true) and fail tests.
-
-### 5) Shared RPC Server Integration
-Files:
- `server/packages/sandbox-agent/src/router.rs`
-
-Tasks:
- Add a new managed stdio server type for Pi, similar to Codex:
-  - Create `PiServer` struct with:
-    - stdin sender
-    - pending request map keyed by request id
-    - per-session native session id mapping
-  - Extend `ManagedServerKind` to include Pi.
-  - Add `ensure_pi_server()` and `spawn_pi_server()` using `pi --mode rpc`.
-  - Add a `handle_pi_server_output()` loop to parse stdout lines into events/responses.
- Session creation:
-  - On `create_session`, ensure Pi server is running, send `new_session`, store sessionId.
-  - Register session with `server_manager.register_session` for native mapping.
- Sending messages:
-  - Use `prompt` command; include sessionId and optional images.
-  - Emit synthetic `item.started` only if Pi does not emit `message_start`.
-
-### 6) Router + Streaming Path Changes
-Files:
- `server/packages/sandbox-agent/src/router.rs`
-
-Tasks:
- Add Pi handling to:
-  - `create_session` (new_session)
-  - `send_message` (prompt)
-  - `parse_agent_line` (Pi event conversion)
-  - `agent_modes` (default to `default` unless Pi exposes a mode list)
-  - `agent_supports_resume` (true if Pi supports session resume)
-
-### 7) Tests
-Files:
- `server/packages/sandbox-agent/tests/...`
- `server/packages/universal-agent-schema/tests/...` (if present)
-
-Tasks:
- Unit tests for conversion:
-  - `message_start/update/end` -> item.started/delta/completed
-  - `tool_execution_*` -> tool call/result mapping with partialResult delta
-  - failure -> agent.unparsed
- Integration tests:
-  - Start Pi RPC server, create session, send prompt, stream events.
-  - Validate `native_session_id` mapping and event ordering.
- Update HTTP/SSE test coverage to include Pi agent if relevant.
-
-## Risk Areas / Edge Cases
- `tool_execution_update.partialResult` is cumulative; must compute deltas.
- `message_update` may emit `done`/`error` without `message_end`; handle both paths.
- No native session lifecycle events; rely on daemon synthetic events.
- Session recovery after RPC server restart requires `get_state` + re-register sessions.
-
-## Acceptance Criteria
- Pi appears in `/v1/agents`, CLI list, and docs.
- `create_session` returns `native_session_id` from Pi `new_session`.
- Streaming prompt yields universal events with proper ordering:
-  - message -> item.started/delta/completed
-  - tool execution -> tool call + tool result
- Tests pass and no synthetic data is used in test fixtures.
-
-## Sources
- https://upd.dev/badlogic/pi-mono/src/commit/d36e0ea07303d8a76d51b4a7bd5f0d6d3c490860/packages/coding-agent/docs/rpc.md
- https://buildwithpi.ai/pi-cli
- https://takopi.dev/docs/pi-cli/
- https://upd.dev/badlogic/pi-mono/releases
--- a/docs/quickstart.mdx
+++ b/docs/quickstart.mdx
@ -64,7 +64,7 @@ icon: "rocket"
        docker run -p 2468:2468 \
          -e ANTHROPIC_API_KEY="sk-ant-..." \
          -e OPENAI_API_KEY="sk-..." \
-          rivetdev/sandbox-agent:0.5.0-rc.1-full \
+          rivetdev/sandbox-agent:0.4.2-full \
          server --no-token --host 0.0.0.0 --port 2468
        ```
      </Tab>
@ -89,7 +89,7 @@ icon: "rocket"
        Install and run the binary directly.

        ```bash
-        curl -fsSL https://releases.rivet.dev/sandbox-agent/0.3.x/install.sh | sh
+        curl -fsSL https://releases.rivet.dev/sandbox-agent/0.4.x/install.sh | sh
        sandbox-agent server --no-token --host 0.0.0.0 --port 2468
        ```
      </Tab>
@ -98,7 +98,7 @@ icon: "rocket"
        Run without installing globally.

        ```bash
-        npx @sandbox-agent/cli@0.3.x server --no-token --host 0.0.0.0 --port 2468
+        npx @sandbox-agent/cli@0.4.x server --no-token --host 0.0.0.0 --port 2468
        ```
      </Tab>

@ -106,7 +106,7 @@ icon: "rocket"
        Run without installing globally.

        ```bash
-        bunx @sandbox-agent/cli@0.3.x server --no-token --host 0.0.0.0 --port 2468
+        bunx @sandbox-agent/cli@0.4.x server --no-token --host 0.0.0.0 --port 2468
        ```
      </Tab>

@ -114,7 +114,7 @@ icon: "rocket"
        Install globally, then run.

        ```bash
-        npm install -g @sandbox-agent/cli@0.3.x
+        npm install -g @sandbox-agent/cli@0.4.x
        sandbox-agent server --no-token --host 0.0.0.0 --port 2468
        ```
      </Tab>
@ -123,7 +123,7 @@ icon: "rocket"
        Install globally, then run.

        ```bash
-        bun add -g @sandbox-agent/cli@0.3.x
+        bun add -g @sandbox-agent/cli@0.4.x
        # Allow Bun to run postinstall scripts for native binaries (required for SandboxAgent.start()).
        bun pm -g trust @sandbox-agent/cli-linux-x64 @sandbox-agent/cli-linux-arm64 @sandbox-agent/cli-darwin-arm64 @sandbox-agent/cli-darwin-x64 @sandbox-agent/cli-win32-x64
        sandbox-agent server --no-token --host 0.0.0.0 --port 2468
@ -134,7 +134,7 @@ icon: "rocket"
        For local development, use `SandboxAgent.start()` to spawn and manage the server as a subprocess.

        ```bash
-        npm install sandbox-agent@0.3.x
+        npm install sandbox-agent@0.4.x
        ```

        ```typescript
@ -148,7 +148,7 @@ icon: "rocket"
        For local development, use `SandboxAgent.start()` to spawn and manage the server as a subprocess.

        ```bash
-        bun add sandbox-agent@0.3.x
+        bun add sandbox-agent@0.4.x
        # Allow Bun to run postinstall scripts for native binaries (required for SandboxAgent.start()).
        bun pm trust @sandbox-agent/cli-linux-x64 @sandbox-agent/cli-linux-arm64 @sandbox-agent/cli-darwin-arm64 @sandbox-agent/cli-darwin-x64 @sandbox-agent/cli-win32-x64
        ```
--- a/docs/react-components.mdx
+++ b/docs/react-components.mdx
@ -17,7 +17,7 @@ Current exports:
 ## Install

 ```bash
-npm install @sandbox-agent/react@0.3.x
+npm install @sandbox-agent/react@0.4.x
 ```

 ## Full example
--- a/docs/sdk-overview.mdx
+++ b/docs/sdk-overview.mdx
@ -11,12 +11,12 @@ The TypeScript SDK is centered on `sandbox-agent` and its `SandboxAgent` class.
 <Tabs>
  <Tab title="npm">
    ```bash
-    npm install sandbox-agent@0.3.x
+    npm install sandbox-agent@0.4.x
    ```
  </Tab>
  <Tab title="bun">
    ```bash
-    bun add sandbox-agent@0.3.x
+    bun add sandbox-agent@0.4.x
    # Allow Bun to run postinstall scripts for native binaries (required for SandboxAgent.start()).
    bun pm trust @sandbox-agent/cli-linux-x64 @sandbox-agent/cli-linux-arm64 @sandbox-agent/cli-darwin-arm64 @sandbox-agent/cli-darwin-x64 @sandbox-agent/cli-win32-x64
    ```
@ -26,7 +26,7 @@ The TypeScript SDK is centered on `sandbox-agent` and its `SandboxAgent` class.
 ## Optional React components

 ```bash
-npm install @sandbox-agent/react@0.3.x
+npm install @sandbox-agent/react@0.4.x
 ```

 ## Create a client
--- a/docs/session-transcript-schema.mdx
+++ b/docs/session-transcript-schema.mdx
@ -1,388 +0,0 @@
---
-title: "Session Transcript Schema"
-description: "Universal event schema for session transcripts across all agents."
---
-
-Each coding agent outputs events in its own native format. The sandbox-agent converts these into a universal event schema, giving you a consistent session transcript regardless of which agent you use.
-
-The schema is defined in [OpenAPI format](https://github.com/rivet-dev/sandbox-agent/blob/main/docs/openapi.json). See the [HTTP API Reference](/api-reference) for endpoint documentation.
-
-## Coverage Matrix
-
-This table shows which agent feature coverage appears in the universal event stream. All agents retain their full native feature coverage—this only reflects what's normalized into the schema.
-
-| Feature            | Claude | Codex | OpenCode     | Amp          | Pi (RPC)     |
-|--------------------|:------:|:-----:|:------------:|:------------:|:------------:|
-| Stability          | Stable | Stable| Experimental | Experimental | Experimental |
-| Text Messages      |   ✓    |   ✓   |      ✓       |      ✓       |      ✓       |
-| Tool Calls         |   ✓    |   ✓   |      ✓       |      ✓       |      ✓       |
-| Tool Results       |   ✓    |   ✓   |      ✓       |      ✓       |      ✓       |
-| Questions (HITL)   |   ✓    |       |      ✓       |              |              |
-| Permissions (HITL) |   ✓    |   ✓   |      ✓       |      -       |              |
-| Images             |   -    |   ✓   |      ✓       |      -       |      ✓       |
-| File Attachments   |   -    |   ✓   |      ✓       |      -       |              |
-| Session Lifecycle  |   -    |   ✓   |      ✓       |      -       |              |
-| Error Events       |   -    |   ✓   |      ✓       |      ✓       |      ✓       |
-| Reasoning/Thinking |   -    |   ✓   |      -       |      -       |      ✓       |
-| Command Execution  |   -    |   ✓   |      -       |      -       |              |
-| File Changes       |   -    |   ✓   |      -       |      -       |              |
-| MCP Tools          |   ✓    |   ✓   |      ✓       |      ✓       |              |
-| Streaming Deltas   |   ✓    |   ✓   |      ✓       |      -       |      ✓       |
-| Variants           |        |   ✓   |      ✓       |      ✓       |      ✓       |
-
-Agents: [Claude Code](https://docs.anthropic.com/en/docs/agents-and-tools/claude-code/overview) · [Codex](https://github.com/openai/codex) · [OpenCode](https://github.com/opencode-ai/opencode) · [Amp](https://ampcode.com) · [Pi](https://buildwithpi.ai/pi-cli)
-
- ✓ = Appears in session events
- \- = Agent supports natively, schema conversion coming soon
- (blank) = Not supported by agent
- Pi runtime model is router-managed per-session RPC (`pi --mode rpc`); it does not use generic subprocess streaming.
-
-<AccordionGroup>
-  <Accordion title="Text Messages">
-    Basic message exchange between user and assistant.
-  </Accordion>
-  <Accordion title="Tool Calls & Results">
-    Visibility into tool invocations (file reads, command execution, etc.) and their results. When not natively supported, tool activity is embedded in message content.
-  </Accordion>
-  <Accordion title="Questions (HITL)">
-    Interactive questions the agent asks the user. Emits `question.requested` and `question.resolved` events.
-  </Accordion>
-  <Accordion title="Permissions (HITL)">
-    Permission requests for sensitive operations. Emits `permission.requested` and `permission.resolved` events.
-  </Accordion>
-  <Accordion title="Images">
-    Support for image attachments in messages.
-  </Accordion>
-  <Accordion title="File Attachments">
-    Support for file attachments in messages.
-  </Accordion>
-  <Accordion title="Session Lifecycle">
-    Native `session.started` and `session.ended` events. When not supported, the daemon emits synthetic lifecycle events.
-  </Accordion>
-  <Accordion title="Error Events">
-    Structured error events for runtime failures.
-  </Accordion>
-  <Accordion title="Reasoning/Thinking">
-    Extended thinking or reasoning content with visibility controls.
-  </Accordion>
-  <Accordion title="Command Execution">
-    Detailed command execution events with stdout/stderr.
-  </Accordion>
-  <Accordion title="File Changes">
-    Structured file modification events with diffs.
-  </Accordion>
-  <Accordion title="MCP Tools">
-    Model Context Protocol tool support.
-  </Accordion>
-  <Accordion title="Streaming Deltas">
-    Native streaming of content deltas. When not supported, the daemon emits a single synthetic delta before `item.completed`.
-  </Accordion>
-  <Accordion title="Variants">
-    Model variants such as reasoning effort or depth. Agents may expose different variant sets per model.
-  </Accordion>
-</AccordionGroup>
-
-Want support for another agent? [Open an issue](https://github.com/rivet-dev/sandbox-agent/issues/new) to request it.
-
-## UniversalEvent
-
-Every event from the API is wrapped in a `UniversalEvent` envelope.
-
-| Field | Type | Description |
-|-------|------|-------------|
-| `event_id` | string | Unique identifier for this event |
-| `sequence` | integer | Monotonic sequence number within the session (starts at 1) |
-| `time` | string | RFC3339 timestamp |
-| `session_id` | string | Daemon-generated session identifier |
-| `native_session_id` | string? | Provider-native session/thread identifier (e.g., Codex `threadId`, OpenCode `sessionID`) |
-| `source` | string | Event origin: `agent` (native) or `daemon` (synthetic) |
-| `synthetic` | boolean | Whether this event was generated by the daemon to fill gaps |
-| `type` | string | Event type (see [Event Types](#event-types)) |
-| `data` | object | Event-specific payload |
-| `raw` | any? | Original provider payload (only when `include_raw=true`) |
-
-```json
-{
-  "event_id": "evt_abc123",
-  "sequence": 1,
-  "time": "2025-01-28T12:00:00Z",
-  "session_id": "my-session",
-  "native_session_id": "thread_xyz",
-  "source": "agent",
-  "synthetic": false,
-  "type": "item.completed",
-  "data": { ... }
-}
-```
-
-## Event Types
-
-### Session Lifecycle
-
-| Type | Description | Data |
-|------|-------------|------|
-| `session.started` | Session has started | `{ metadata?: any }` |
-| `session.ended` | Session has ended | `{ reason, terminated_by, message?, exit_code? }` |
-
-### Turn Lifecycle
-
-| Type | Description | Data |
-|------|-------------|------|
-| `turn.started` | Turn has started | `{ phase: "started", turn_id?, metadata? }` |
-| `turn.ended` | Turn has ended | `{ phase: "ended", turn_id?, metadata? }` |
-
-**SessionEndedData**
-
-| Field | Type | Values |
-|-------|------|--------|
-| `reason` | string | `completed`, `error`, `terminated` |
-| `terminated_by` | string | `agent`, `daemon` |
-| `message` | string? | Error message (only present when reason is `error`) |
-| `exit_code` | int? | Process exit code (only present when reason is `error`) |
-| `stderr` | StderrOutput? | Structured stderr output (only present when reason is `error`) |
-
-**StderrOutput**
-
-| Field | Type | Description |
-|-------|------|-------------|
-| `head` | string? | First 20 lines of stderr (if truncated) or full stderr (if not truncated) |
-| `tail` | string? | Last 50 lines of stderr (only present if truncated) |
-| `truncated` | boolean | Whether the output was truncated |
-| `total_lines` | int? | Total number of lines in stderr |
-
-### Item Lifecycle
-
-| Type | Description | Data |
-|------|-------------|------|
-| `item.started` | Item creation | `{ item }` |
-| `item.delta` | Streaming content delta | `{ item_id, native_item_id?, delta }` |
-| `item.completed` | Item finalized | `{ item }` |
-
-Items follow a consistent lifecycle: `item.started` → `item.delta` (0 or more) → `item.completed`.
-
-### HITL (Human-in-the-Loop)
-
-| Type | Description | Data |
-|------|-------------|------|
-| `permission.requested` | Permission request pending | `{ permission_id, action, status, metadata? }` |
-| `permission.resolved` | Permission decision recorded | `{ permission_id, action, status, metadata? }` |
-| `question.requested` | Question pending user input | `{ question_id, prompt, options, status }` |
-| `question.resolved` | Question answered or rejected | `{ question_id, prompt, options, status, response? }` |
-
-**PermissionEventData**
-
-| Field | Type | Description |
-|-------|------|-------------|
-| `permission_id` | string | Identifier for the permission request |
-| `action` | string | What the agent wants to do |
-| `status` | string | `requested`, `accept`, `accept_for_session`, `reject` |
-| `metadata` | any? | Additional context |
-
-**QuestionEventData**
-
-| Field | Type | Description |
-|-------|------|-------------|
-| `question_id` | string | Identifier for the question |
-| `prompt` | string | Question text |
-| `options` | string[] | Available answer options |
-| `status` | string | `requested`, `answered`, `rejected` |
-| `response` | string? | Selected answer (when resolved) |
-
-### Errors
-
-| Type | Description | Data |
-|------|-------------|------|
-| `error` | Runtime error | `{ message, code?, details? }` |
-| `agent.unparsed` | Parse failure | `{ error, location, raw_hash? }` |
-
-The `agent.unparsed` event indicates the daemon failed to parse an agent payload. This should be treated as a bug.
-
-## UniversalItem
-
-Items represent discrete units of content within a session.
-
-| Field | Type | Description |
-|-------|------|-------------|
-| `item_id` | string | Daemon-generated identifier |
-| `native_item_id` | string? | Provider-native item/message identifier |
-| `parent_id` | string? | Parent item ID (e.g., tool call/result parented to a message) |
-| `kind` | string | Item category (see below) |
-| `role` | string? | Actor role for message items |
-| `status` | string | Lifecycle status |
-| `content` | ContentPart[] | Ordered list of content parts |
-
-### ItemKind
-
-| Value | Description |
-|-------|-------------|
-| `message` | User or assistant message |
-| `tool_call` | Tool invocation |
-| `tool_result` | Tool execution result |
-| `system` | System message |
-| `status` | Status update |
-| `unknown` | Unrecognized item type |
-
-### ItemRole
-
-| Value | Description |
-|-------|-------------|
-| `user` | User message |
-| `assistant` | Assistant response |
-| `system` | System prompt |
-| `tool` | Tool-related message |
-
-### ItemStatus
-
-| Value | Description |
-|-------|-------------|
-| `in_progress` | Item is streaming or pending |
-| `completed` | Item is finalized |
-| `failed` | Item execution failed |
-
-## Content Parts
-
-The `content` array contains typed parts that make up an item's payload.
-
-### text
-
-Plain text content.
-
-```json
-{ "type": "text", "text": "Hello, world!" }
-```
-
-### json
-
-Structured JSON content.
-
-```json
-{ "type": "json", "json": { "key": "value" } }
-```
-
-### tool_call
-
-Tool invocation.
-
-| Field | Type | Description |
-|-------|------|-------------|
-| `name` | string | Tool name |
-| `arguments` | string | JSON-encoded arguments |
-| `call_id` | string | Unique call identifier |
-
-```json
-{
-  "type": "tool_call",
-  "name": "read_file",
-  "arguments": "{\"path\": \"/src/main.ts\"}",
-  "call_id": "call_abc123"
-}
-```
-
-### tool_result
-
-Tool execution result.
-
-| Field | Type | Description |
-|-------|------|-------------|
-| `call_id` | string | Matching call identifier |
-| `output` | string | Tool output |
-
-```json
-{
-  "type": "tool_result",
-  "call_id": "call_abc123",
-  "output": "File contents here..."
-}
-```
-
-### file_ref
-
-File reference with optional diff.
-
-| Field | Type | Description |
-|-------|------|-------------|
-| `path` | string | File path |
-| `action` | string | `read`, `write`, `patch` |
-| `diff` | string? | Unified diff (for patches) |
-
-```json
-{
-  "type": "file_ref",
-  "path": "/src/main.ts",
-  "action": "write",
-  "diff": "@@ -1,3 +1,4 @@\n+import { foo } from 'bar';"
-}
-```
-
-### image
-
-Image reference.
-
-| Field | Type | Description |
-|-------|------|-------------|
-| `path` | string | Image file path |
-| `mime` | string? | MIME type |
-
-```json
-{ "type": "image", "path": "/tmp/screenshot.png", "mime": "image/png" }
-```
-
-### reasoning
-
-Model reasoning/thinking content.
-
-| Field | Type | Description |
-|-------|------|-------------|
-| `text` | string | Reasoning text |
-| `visibility` | string | `public` or `private` |
-
-```json
-{ "type": "reasoning", "text": "Let me think about this...", "visibility": "public" }
-```
-
-### status
-
-Status indicator.
-
-| Field | Type | Description |
-|-------|------|-------------|
-| `label` | string | Status label |
-| `detail` | string? | Additional detail |
-
-```json
-{ "type": "status", "label": "Running tests", "detail": "3 of 10 passed" }
-```
-
-## Source & Synthetics
-
-### EventSource
-
-The `source` field indicates who emitted the event:
-
-| Value | Description |
-|-------|-------------|
-| `agent` | Native event from the agent |
-| `daemon` | Synthetic event generated by the daemon |
-
-### Synthetic Events
-
-The daemon emits synthetic events (`synthetic: true`, `source: "daemon"`) to provide a consistent event stream across all agents. Common synthetics:
-
-| Synthetic | When |
-|-----------|------|
-| `session.started` | Agent doesn't emit explicit session start |
-| `session.ended` | Agent doesn't emit explicit session end |
-| `turn.started` | Agent doesn't emit explicit turn start |
-| `turn.ended` | Agent doesn't emit explicit turn end |
-| `item.started` | Agent doesn't emit item start events |
-| `item.delta` | Agent doesn't stream deltas natively |
-| `question.*` | Claude Code plan mode (from ExitPlanMode tool) |
-
-### Raw Payloads
-
-Pass `include_raw=true` to event endpoints to receive the original agent payload in the `raw` field. Useful for debugging or accessing agent-specific data not in the universal schema.
-
-```typescript
-const events = await client.getEvents("my-session", { includeRaw: true });
-// events[0].raw contains the original agent payload
-```
--- a/docs/theme.css
+++ b/docs/theme.css
@ -20,7 +20,6 @@ body {
  color: var(--sa-text);
 }

-/*
 a {
  color: var(--sa-primary);
 }
@ -41,6 +40,13 @@ select {
  color: var(--sa-text);
 }

+code,
+pre {
+  background-color: var(--sa-card);
+  border: 1px solid var(--sa-border);
+  color: var(--sa-text);
+}
+
 .card,
 .mintlify-card,
 .docs-card {
@ -64,4 +70,3 @@ select {
 .alert-danger {
  border-color: var(--sa-danger);
 }
-*/
--- a/docs/troubleshooting.mdx
+++ b/docs/troubleshooting.mdx
@ -29,25 +29,6 @@ Verify the agent is installed:
 ls -la ~/.local/share/sandbox-agent/bin/
 ```

-### 4. Binary libc mismatch (musl vs glibc)
-
-Claude Code binaries are available in both musl and glibc variants. If you see errors like:
-
-```
-cannot execute: required file not found
-Error loading shared library libstdc++.so.6: No such file or directory
-```
-
-This means the wrong binary variant was downloaded.
-
-**For sandbox-agent 0.2.0+**: Platform detection is automatic. The correct binary (musl or glibc) is downloaded based on the runtime environment.
-
-**For sandbox-agent 0.1.x**: Use Alpine Linux which has native musl support:
-
-```dockerfile
-FROM alpine:latest
-RUN apk add --no-cache curl ca-certificates libstdc++ libgcc bash
-```

 ## Daytona Network Restrictions

--- a/examples/boxlite-python/Dockerfile
+++ b/examples/boxlite-python/Dockerfile
@ -1,5 +1,5 @@
 FROM node:22-bookworm-slim
 RUN apt-get update && apt-get install -y curl ca-certificates && rm -rf /var/lib/apt/lists/*
-RUN curl -fsSL https://releases.rivet.dev/sandbox-agent/0.3.x/install.sh | sh
+RUN curl -fsSL https://releases.rivet.dev/sandbox-agent/0.4.x/install.sh | sh
 RUN sandbox-agent install-agent claude
 RUN sandbox-agent install-agent codex
--- a/examples/boxlite/Dockerfile
+++ b/examples/boxlite/Dockerfile
@ -1,5 +1,5 @@
 FROM node:22-bookworm-slim
 RUN apt-get update && apt-get install -y curl ca-certificates && rm -rf /var/lib/apt/lists/*
-RUN curl -fsSL https://releases.rivet.dev/sandbox-agent/0.3.x/install.sh | sh
+RUN curl -fsSL https://releases.rivet.dev/sandbox-agent/0.4.x/install.sh | sh
 RUN sandbox-agent install-agent claude
 RUN sandbox-agent install-agent codex
--- a/examples/boxlite/tsconfig.json
+++ b/examples/boxlite/tsconfig.json
@ -9,7 +9,8 @@
    "esModuleInterop": true,
    "strict": true,
    "skipLibCheck": true,
-    "resolveJsonModule": true
+    "resolveJsonModule": true,
+    "types": ["node"]
  },
  "include": ["src/**/*"],
  "exclude": ["node_modules", "**/*.test.ts"]
--- a/examples/cloudflare/Dockerfile
+++ b/examples/cloudflare/Dockerfile
@ -1,7 +1,7 @@
 FROM cloudflare/sandbox:0.7.0

 # Install sandbox-agent
-RUN curl -fsSL https://releases.rivet.dev/sandbox-agent/0.3.x/install.sh | sh
+RUN curl -fsSL https://releases.rivet.dev/sandbox-agent/0.4.x/install.sh | sh

 # Pre-install agents
 RUN sandbox-agent install-agent claude && \
--- a/examples/computesdk/tsconfig.json
+++ b/examples/computesdk/tsconfig.json
@ -9,7 +9,8 @@
    "esModuleInterop": true,
    "strict": true,
    "skipLibCheck": true,
-    "resolveJsonModule": true
+    "resolveJsonModule": true,
+    "types": ["node"]
  },
  "include": ["src/**/*"],
  "exclude": ["node_modules", "**/*.test.ts"]
--- a/examples/daytona/src/index.ts
+++ b/examples/daytona/src/index.ts
@ -16,7 +16,6 @@ console.log(`UI: ${client.inspectorUrl}`);

 const session = await client.createSession({
  agent: detectAgent(),
-  cwd: "/home/daytona",
 });

 session.onEvent((event) => {
--- a/examples/daytona/tsconfig.json
+++ b/examples/daytona/tsconfig.json
@ -9,7 +9,8 @@
    "esModuleInterop": true,
    "strict": true,
    "skipLibCheck": true,
-    "resolveJsonModule": true
+    "resolveJsonModule": true,
+    "types": ["node"]
  },
  "include": ["src/**/*"],
  "exclude": ["node_modules", "**/*.test.ts"]
--- a/examples/docker/tsconfig.json
+++ b/examples/docker/tsconfig.json
@ -9,7 +9,8 @@
    "esModuleInterop": true,
    "strict": true,
    "skipLibCheck": true,
-    "resolveJsonModule": true
+    "resolveJsonModule": true,
+    "types": ["node"]
  },
  "include": ["src/**/*"],
  "exclude": ["node_modules", "**/*.test.ts"]
--- a/examples/e2b/src/e2b.ts
+++ b/examples/e2b/src/e2b.ts
@ -17,8 +17,10 @@ export async function setupE2BSandboxAgent(): Promise<{
  token?: string;
  cleanup: () => Promise<void>;
 }> {
+  const template = process.env.E2B_TEMPLATE;
  const client = await SandboxAgent.start({
    sandbox: e2b({
+      template,
      create: { envs: collectEnvVars() },
    }),
  });
--- a/examples/e2b/src/index.ts
+++ b/examples/e2b/src/index.ts
@ -5,15 +5,15 @@ import { detectAgent } from "@sandbox-agent/example-shared";
 const envs: Record<string, string> = {};
 if (process.env.ANTHROPIC_API_KEY) envs.ANTHROPIC_API_KEY = process.env.ANTHROPIC_API_KEY;
 if (process.env.OPENAI_API_KEY) envs.OPENAI_API_KEY = process.env.OPENAI_API_KEY;
+const template = process.env.E2B_TEMPLATE;

 const client = await SandboxAgent.start({
  // ✨ NEW ✨
-  sandbox: e2b({ create: { envs } }),
+  sandbox: e2b({ template, create: { envs } }),
 });

 const session = await client.createSession({
  agent: detectAgent(),
-  cwd: "/home/user",
 });

 session.onEvent((event) => {
--- a/examples/e2b/tsconfig.json
+++ b/examples/e2b/tsconfig.json
@ -9,7 +9,8 @@
    "esModuleInterop": true,
    "strict": true,
    "skipLibCheck": true,
-    "resolveJsonModule": true
+    "resolveJsonModule": true,
+    "types": ["node"]
  },
  "include": ["src/**/*"],
  "exclude": ["node_modules", "**/*.test.ts"]
--- a/examples/file-system/tsconfig.json
+++ b/examples/file-system/tsconfig.json
@ -9,7 +9,8 @@
    "esModuleInterop": true,
    "strict": true,
    "skipLibCheck": true,
-    "resolveJsonModule": true
+    "resolveJsonModule": true,
+    "types": ["node"]
  },
  "include": ["src/**/*"],
  "exclude": ["node_modules", "**/*.test.ts"]
--- a/examples/mcp-custom-tool/tsconfig.json
+++ b/examples/mcp-custom-tool/tsconfig.json
@ -9,7 +9,8 @@
    "esModuleInterop": true,
    "strict": true,
    "skipLibCheck": true,
-    "resolveJsonModule": true
+    "resolveJsonModule": true,
+    "types": ["node"]
  },
  "include": ["src/**/*"],
  "exclude": ["node_modules", "**/*.test.ts"]
--- a/examples/mcp/tsconfig.json
+++ b/examples/mcp/tsconfig.json
@ -9,7 +9,8 @@
    "esModuleInterop": true,
    "strict": true,
    "skipLibCheck": true,
-    "resolveJsonModule": true
+    "resolveJsonModule": true,
+    "types": ["node"]
  },
  "include": ["src/**/*"],
  "exclude": ["node_modules", "**/*.test.ts"]
--- a/examples/modal/tsconfig.json
+++ b/examples/modal/tsconfig.json
@ -9,7 +9,8 @@
    "esModuleInterop": true,
    "strict": true,
    "skipLibCheck": true,
-    "resolveJsonModule": true
+    "resolveJsonModule": true,
+    "types": ["node"]
  },
  "include": ["src/**/*"],
  "exclude": ["node_modules", "**/*.test.ts"]
--- a/examples/permissions/tsconfig.json
+++ b/examples/permissions/tsconfig.json
@ -1,7 +1,8 @@
 {
  "compilerOptions": {
    "target": "ES2022",
-    "lib": ["ES2022"],
+    "lib": ["ES2022", "DOM"],
+    "types": ["node"],
    "module": "ESNext",
    "moduleResolution": "Bundler",
    "allowImportingTsExtensions": true,
--- a/examples/persist-memory/tsconfig.json
+++ b/examples/persist-memory/tsconfig.json
@ -1,13 +1,15 @@
 {
  "compilerOptions": {
    "target": "ES2022",
+    "lib": ["ES2022", "DOM"],
    "module": "ESNext",
    "moduleResolution": "Bundler",
    "allowImportingTsExtensions": true,
    "noEmit": true,
    "esModuleInterop": true,
    "strict": true,
-    "skipLibCheck": true
+    "skipLibCheck": true,
+    "types": ["node"]
  },
  "include": ["src"]
 }
--- a/examples/persist-postgres/tsconfig.json
+++ b/examples/persist-postgres/tsconfig.json
@ -1,13 +1,15 @@
 {
  "compilerOptions": {
    "target": "ES2022",
+    "lib": ["ES2022", "DOM"],
    "module": "ESNext",
    "moduleResolution": "Bundler",
    "allowImportingTsExtensions": true,
    "noEmit": true,
    "esModuleInterop": true,
    "strict": true,
-    "skipLibCheck": true
+    "skipLibCheck": true,
+    "types": ["node"]
  },
  "include": ["src"]
 }
--- a/examples/persist-sqlite/tsconfig.json
+++ b/examples/persist-sqlite/tsconfig.json
@ -1,13 +1,15 @@
 {
  "compilerOptions": {
    "target": "ES2022",
+    "lib": ["ES2022", "DOM"],
    "module": "ESNext",
    "moduleResolution": "Bundler",
    "allowImportingTsExtensions": true,
    "noEmit": true,
    "esModuleInterop": true,
    "strict": true,
-    "skipLibCheck": true
+    "skipLibCheck": true,
+    "types": ["node"]
  },
  "include": ["src"]
 }
--- a/examples/shared/src/docker.ts
+++ b/examples/shared/src/docker.ts
@ -9,7 +9,7 @@ const __dirname = path.dirname(fileURLToPath(import.meta.url));
 const REPO_ROOT = path.resolve(__dirname, "..", "..", "..");

 /** Pre-built Docker image with all agents installed. */
-export const FULL_IMAGE = "rivetdev/sandbox-agent:0.5.0-rc.1-full";
+export const FULL_IMAGE = "rivetdev/sandbox-agent:0.4.2-full";

 export interface DockerSandboxOptions {
  /** Container port used by sandbox-agent inside Docker. */
--- a/examples/skills-custom-tool/tsconfig.json
+++ b/examples/skills-custom-tool/tsconfig.json
@ -9,7 +9,8 @@
    "esModuleInterop": true,
    "strict": true,
    "skipLibCheck": true,
-    "resolveJsonModule": true
+    "resolveJsonModule": true,
+    "types": ["node"]
  },
  "include": ["src/**/*"],
  "exclude": ["node_modules", "**/*.test.ts"]
--- a/examples/skills/tsconfig.json
+++ b/examples/skills/tsconfig.json
@ -9,7 +9,8 @@
    "esModuleInterop": true,
    "strict": true,
    "skipLibCheck": true,
-    "resolveJsonModule": true
+    "resolveJsonModule": true,
+    "types": ["node"]
  },
  "include": ["src/**/*"],
  "exclude": ["node_modules", "**/*.test.ts"]
--- a/examples/sprites/package.json
+++ b/examples/sprites/package.json
@ -0,0 +1,20 @@
+{
+  "name": "@sandbox-agent/example-sprites",
+  "private": true,
+  "type": "module",
+  "scripts": {
+    "start": "tsx src/index.ts",
+    "typecheck": "tsc --noEmit"
+  },
+  "dependencies": {
+    "@fly/sprites": "latest",
+    "@sandbox-agent/example-shared": "workspace:*",
+    "sandbox-agent": "workspace:*"
+  },
+  "devDependencies": {
+    "@types/node": "latest",
+    "tsx": "latest",
+    "typescript": "latest",
+    "vitest": "^3.0.0"
+  }
+}
--- a/examples/sprites/src/index.ts
+++ b/examples/sprites/src/index.ts
@ -0,0 +1,21 @@
+import { SandboxAgent } from "sandbox-agent";
+import { sprites } from "sandbox-agent/sprites";
+
+const env: Record<string, string> = {};
+if (process.env.ANTHROPIC_API_KEY) env.ANTHROPIC_API_KEY = process.env.ANTHROPIC_API_KEY;
+if (process.env.OPENAI_API_KEY) env.OPENAI_API_KEY = process.env.OPENAI_API_KEY;
+
+const client = await SandboxAgent.start({
+  sandbox: sprites({
+    token: process.env.SPRITES_API_KEY ?? process.env.SPRITE_TOKEN ?? process.env.SPRITES_TOKEN,
+    env,
+  }),
+});
+
+console.log(`UI: ${client.inspectorUrl}`);
+console.log(await client.getHealth());
+
+process.once("SIGINT", async () => {
+  await client.destroySandbox();
+  process.exit(0);
+});
--- a/examples/sprites/tests/sprites.test.ts
+++ b/examples/sprites/tests/sprites.test.ts
@ -0,0 +1,34 @@
+import { describe, it, expect } from "vitest";
+import { SandboxAgent } from "sandbox-agent";
+import { sprites } from "sandbox-agent/sprites";
+
+const shouldRun = Boolean(process.env.SPRITES_API_KEY || process.env.SPRITE_TOKEN || process.env.SPRITES_TOKEN);
+const timeoutMs = Number.parseInt(process.env.SANDBOX_TEST_TIMEOUT_MS || "", 10) || 300_000;
+
+const testFn = shouldRun ? it : it.skip;
+
+describe("sprites provider", () => {
+  testFn(
+    "starts sandbox-agent and responds to /v1/health",
+    async () => {
+      const env: Record<string, string> = {};
+      if (process.env.ANTHROPIC_API_KEY) env.ANTHROPIC_API_KEY = process.env.ANTHROPIC_API_KEY;
+      if (process.env.OPENAI_API_KEY) env.OPENAI_API_KEY = process.env.OPENAI_API_KEY;
+
+      const sdk = await SandboxAgent.start({
+        sandbox: sprites({
+          token: process.env.SPRITES_API_KEY ?? process.env.SPRITE_TOKEN ?? process.env.SPRITES_TOKEN,
+          env,
+        }),
+      });
+
+      try {
+        const health = await sdk.getHealth();
+        expect(health.status).toBe("ok");
+      } finally {
+        await sdk.destroySandbox();
+      }
+    },
+    timeoutMs,
+  );
+});
--- a/examples/sprites/tsconfig.json
+++ b/examples/sprites/tsconfig.json
@ -0,0 +1,17 @@
+{
+  "compilerOptions": {
+    "target": "ES2022",
+    "lib": ["ES2022", "DOM"],
+    "module": "ESNext",
+    "moduleResolution": "Bundler",
+    "allowImportingTsExtensions": true,
+    "noEmit": true,
+    "esModuleInterop": true,
+    "strict": true,
+    "skipLibCheck": true,
+    "resolveJsonModule": true,
+    "types": ["node"]
+  },
+  "include": ["src/**/*"],
+  "exclude": ["node_modules", "**/*.test.ts"]
+}
--- a/examples/vercel/src/index.ts
+++ b/examples/vercel/src/index.ts
@ -19,7 +19,6 @@ console.log(`UI: ${client.inspectorUrl}`);

 const session = await client.createSession({
  agent: detectAgent(),
-  cwd: "/home/vercel-sandbox",
 });

 session.onEvent((event) => {
--- a/examples/vercel/tsconfig.json
+++ b/examples/vercel/tsconfig.json
@ -9,7 +9,8 @@
    "esModuleInterop": true,
    "strict": true,
    "skipLibCheck": true,
-    "resolveJsonModule": true
+    "resolveJsonModule": true,
+    "types": ["node"]
  },
  "include": ["src/**/*"],
  "exclude": ["node_modules", "**/*.test.ts"]
--- a/foundry/CLAUDE.md
+++ b/foundry/CLAUDE.md
@ -72,6 +72,26 @@ Local Docker sandboxes use the `rivetdev/sandbox-agent:foundry-base-latest` imag
 - The image must be built with `--platform linux/amd64`. The Rust build is memory-intensive; Docker Desktop needs at least 8GB RAM allocated.
 - When updating the base image contents (new system packages, agent versions), rebuild and push with the publish script, then update the `foundry-base-latest` tag.

+## Production GitHub App + OAuth App
+
+Foundry uses two separate GitHub entities in production:
+
+- **OAuth App** (`GITHUB_CLIENT_ID` / `GITHUB_CLIENT_SECRET`) — handles "Sign in with GitHub" via Better Auth. This is a standard OAuth App.
+- **GitHub App** (`GITHUB_APP_ID` / `GITHUB_APP_CLIENT_ID` / `GITHUB_APP_CLIENT_SECRET` / `GITHUB_APP_PRIVATE_KEY`) — handles webhooks, installation tokens for repo access, and GitHub API sync (repos, PRs). Must be manually installed on each org.
+
+Key env vars and where they connect:
+
+- `GITHUB_REDIRECT_URI` — OAuth callback, must point to `https://api.sandboxagent.dev/v1/auth/callback/github`
+- `GITHUB_WEBHOOK_SECRET` — must match the secret configured on the GitHub App's Webhook settings page exactly. Mismatches cause silent 500s on webhook delivery (signature verification fails inside the actor, surfaced as a generic RivetKit `internal_error`).
+- `BETTER_AUTH_URL` — must be the **API** URL (`https://api.sandboxagent.dev`), not the frontend URL. Better Auth uses this internally for sign-out and session management calls.
+- `APP_URL` — the **frontend** URL (`https://foundry.sandboxagent.dev`).
+
+Troubleshooting:
+
+- **"GitHub App not installed"** — The GitHub App must be manually installed on each org. Sign-in does not auto-install it. Go to the GitHub App settings → Install App tab. The sign-in flow can only detect existing installations, not create them.
+- **Webhooks not arriving** — Check the GitHub App → Advanced tab for delivery history. If deliveries show 500, the webhook secret likely doesn't match `GITHUB_WEBHOOK_SECRET`. Test with: `echo -n '{"test":true}' | openssl dgst -sha256 -hmac "$SECRET"` and curl the endpoint with the computed signature.
+- **Deleting all actors wipes GitHub App installation state.** After a full actor reset, you must trigger a webhook (e.g. redeliver from GitHub App Advanced tab, or re-install the app) to repopulate installation records.
+
 ## Railway Logs

 - Production Foundry Railway logs can be read from a linked checkout with `railway logs --deployment --lines 200` or `railway logs <deployment-id> --deployment --lines 200`.
--- a/foundry/docker/backend.Dockerfile
+++ b/foundry/docker/backend.Dockerfile
@ -19,6 +19,7 @@ RUN pnpm --filter @sandbox-agent/foundry-backend deploy --prod /out
 FROM oven/bun:1.2 AS runtime
 ENV NODE_ENV=production
 ENV HOME=/home/task
+ENV RIVET_RUNNER_VERSION_FILE=/etc/foundry/rivet-runner-version
 WORKDIR /app
 RUN apt-get update \
  && apt-get install -y --no-install-recommends \
@ -31,6 +32,8 @@ RUN addgroup --system --gid 1001 task \
  && adduser --system --uid 1001 --home /home/task --ingroup task task \
  && mkdir -p /home/task \
  && chown -R task:task /home/task /app
+RUN mkdir -p /etc/foundry \
+  && date +%s > /etc/foundry/rivet-runner-version
 COPY --from=build /out ./
 USER task
 EXPOSE 7741
--- a/foundry/docker/backend.dev.Dockerfile
+++ b/foundry/docker/backend.dev.Dockerfile
@ -21,6 +21,9 @@ RUN curl -fsSL "https://releases.rivet.dev/sandbox-agent/${SANDBOX_AGENT_VERSION

 ENV PATH="/root/.local/bin:${PATH}"
 ENV SANDBOX_AGENT_BIN="/root/.local/bin/sandbox-agent"
+ENV RIVET_RUNNER_VERSION_FILE=/etc/foundry/rivet-runner-version
+RUN mkdir -p /etc/foundry \
+  && date +%s > /etc/foundry/rivet-runner-version

 WORKDIR /app

--- a/foundry/docker/backend.preview.Dockerfile
+++ b/foundry/docker/backend.preview.Dockerfile
@ -20,6 +20,9 @@ RUN curl -fsSL "https://releases.rivet.dev/sandbox-agent/${SANDBOX_AGENT_VERSION

 ENV PATH="/root/.local/bin:${PATH}"
 ENV SANDBOX_AGENT_BIN="/root/.local/bin/sandbox-agent"
+ENV RIVET_RUNNER_VERSION_FILE=/etc/foundry/rivet-runner-version
+RUN mkdir -p /etc/foundry \
+  && date +%s > /etc/foundry/rivet-runner-version

 WORKDIR /workspace/quebec

--- a/foundry/packages/backend/src/actors/index.ts
+++ b/foundry/packages/backend/src/actors/index.ts
@ -6,16 +6,15 @@ import { auditLog } from "./audit-log/index.js";
 import { taskSandbox } from "./sandbox/index.js";
 import { organization } from "./organization/index.js";
 import { logger } from "../logging.js";
+import { resolveRunnerVersion } from "../config/runner-version.js";

-const RUNNER_VERSION = Math.floor(Date.now() / 1000);
+const runnerVersion = resolveRunnerVersion();

 export const registry = setup({
  serverless: {
    basePath: "/v1/rivet",
  },
-  runner: {
-    version: RUNNER_VERSION,
-  },
+  runner: { version: runnerVersion },
  logging: {
    baseLogger: logger,
  },
--- a/foundry/packages/backend/src/actors/logging.ts
+++ b/foundry/packages/backend/src/actors/logging.ts
@ -22,6 +22,16 @@ export function resolveErrorStack(error: unknown): string | undefined {
  return undefined;
 }

+export function logActorInfo(scope: string, message: string, context?: Record<string, unknown>): void {
+  logger.info(
+    {
+      scope,
+      ...(context ?? {}),
+    },
+    message,
+  );
+}
+
 export function logActorWarning(scope: string, message: string, context?: Record<string, unknown>): void {
  logger.warn(
    {
--- a/foundry/packages/backend/src/actors/sandbox/index.ts
+++ b/foundry/packages/backend/src/actors/sandbox/index.ts
@ -13,7 +13,12 @@ import { logActorWarning, resolveErrorMessage } from "../logging.js";
 import { expectQueueResponse } from "../../services/queue.js";
 import { resolveSandboxProviderId } from "../../sandbox-config.js";

-const SANDBOX_REPO_CWD = "/home/sandbox/repo";
+/**
+ * Default repo CWD inside the sandbox. The actual path is resolved dynamically
+ * via `$HOME/repo` because different sandbox providers run as different users
+ * (e.g. E2B uses `/home/user`, local Docker uses `/home/sandbox`).
+ */
+const DEFAULT_SANDBOX_REPO_CWD = "/home/user/repo";
 const DEFAULT_LOCAL_SANDBOX_IMAGE = "rivetdev/sandbox-agent:foundry-base-latest";
 const DEFAULT_LOCAL_SANDBOX_PORT = 2468;
 const dockerClient = new Dockerode({ socketPath: "/var/run/docker.sock" });
@ -207,7 +212,7 @@ const baseTaskSandbox = sandboxActor({
    if (sandboxProviderId === "e2b") {
      return e2b({
        create: () => ({
-          template: config.sandboxProviders.e2b.template ?? "sandbox-agent-full-0.3.x",
+          template: config.sandboxProviders.e2b.template ?? "sandbox-agent-full-0.5.x",
          envs: sandboxEnvObject(),
          // TEMPORARY: Default E2B timeout is 5 minutes which is too short.
          // Set to 1 hour as a stopgap. Remove this once the E2B provider in
@ -264,7 +269,7 @@ async function providerForConnection(c: any): Promise<any | null> {
    sandboxProviderId === "e2b"
      ? e2b({
          create: () => ({
-            template: config.sandboxProviders.e2b.template ?? "sandbox-agent-full-0.3.x",
+            template: config.sandboxProviders.e2b.template ?? "sandbox-agent-full-0.5.x",
            envs: sandboxEnvObject(),
          }),
          installAgents: ["claude", "codex"],
@ -297,6 +302,43 @@ async function listWorkspaceModelGroupsForSandbox(c: any): Promise<WorkspaceMode

 const baseActions = baseTaskSandbox.config.actions as Record<string, (c: any, ...args: any[]) => Promise<any>>;

+// ---------------------------------------------------------------------------
+// Dynamic repo CWD resolution
+// ---------------------------------------------------------------------------
+
+let cachedRepoCwd: string | null = null;
+
+/**
+ * Resolve the repo CWD inside the sandbox by querying `$HOME`.
+ * Different providers run as different users (E2B: `/home/user`, local Docker:
+ * `/home/sandbox`), so the path must be resolved dynamically. The result is
+ * cached for the lifetime of this sandbox actor instance.
+ */
+async function resolveRepoCwd(c: any): Promise<string> {
+  if (cachedRepoCwd) return cachedRepoCwd;
+
+  try {
+    const result = await baseActions.runProcess(c, {
+      command: "bash",
+      args: ["-lc", "echo $HOME"],
+      cwd: "/",
+      timeoutMs: 10_000,
+    });
+    const home = (result.stdout ?? result.result ?? "").trim();
+    if (home && home.startsWith("/")) {
+      cachedRepoCwd = `${home}/repo`;
+      return cachedRepoCwd;
+    }
+  } catch (error) {
+    logActorWarning("taskSandbox", "failed to resolve $HOME, using default", {
+      error: resolveErrorMessage(error),
+    });
+  }
+
+  cachedRepoCwd = DEFAULT_SANDBOX_REPO_CWD;
+  return cachedRepoCwd;
+}
+
 // ---------------------------------------------------------------------------
 // Queue names for sandbox actor
 // ---------------------------------------------------------------------------
@ -528,8 +570,9 @@ export const taskSandbox = actor({
      }
    },

-    async repoCwd(): Promise<{ cwd: string }> {
-      return { cwd: SANDBOX_REPO_CWD };
+    async repoCwd(c: any): Promise<{ cwd: string }> {
+      const resolved = await resolveRepoCwd(c);
+      return { cwd: resolved };
    },

    // Long-running action — kept as direct action to avoid blocking the
@ -600,4 +643,4 @@ export const taskSandbox = actor({
  run: workflow(runSandboxWorkflow),
 });

-export { SANDBOX_REPO_CWD };
+export { DEFAULT_SANDBOX_REPO_CWD, resolveRepoCwd };
--- a/foundry/packages/backend/src/actors/task/workspace.ts
+++ b/foundry/packages/backend/src/actors/task/workspace.ts
@ -1,6 +1,6 @@
 // @ts-nocheck
 import { randomUUID } from "node:crypto";
-import { basename, dirname } from "node:path";
+import { basename } from "node:path";
 import { asc, eq } from "drizzle-orm";
 import {
  DEFAULT_WORKSPACE_MODEL_GROUPS,
@ -10,8 +10,7 @@ import {
 } from "@sandbox-agent/foundry-shared";
 import { getActorRuntimeContext } from "../context.js";
 import { getOrCreateOrganization, getOrCreateTaskSandbox, getOrCreateUser, getTaskSandbox, selfTask } from "../handles.js";
-import { logActorWarning, resolveErrorMessage } from "../logging.js";
-import { SANDBOX_REPO_CWD } from "../sandbox/index.js";
+import { logActorInfo, logActorWarning, resolveErrorMessage } from "../logging.js";
 import { resolveSandboxProviderId } from "../../sandbox-config.js";
 import { getBetterAuthService } from "../../services/better-auth.js";
 import { resolveOrganizationGithubAuth } from "../../services/github-auth.js";
@ -183,9 +182,9 @@ async function injectGitCredentials(sandbox: any, login: string, email: string,
    "set -euo pipefail",
    `git config --global user.name ${JSON.stringify(login)}`,
    `git config --global user.email ${JSON.stringify(email)}`,
-    `git config --global credential.helper 'store --file=/home/sandbox/.git-token'`,
-    `printf '%s\\n' ${JSON.stringify(`https://${login}:${token}@github.com`)} > /home/sandbox/.git-token`,
-    `chmod 600 /home/sandbox/.git-token`,
+    `git config --global credential.helper 'store --file=$HOME/.git-token'`,
+    `printf '%s\\n' ${JSON.stringify(`https://${login}:${token}@github.com`)} > $HOME/.git-token`,
+    `chmod 600 $HOME/.git-token`,
  ];
  const result = await sandbox.runProcess({
    command: "bash",
@ -576,6 +575,10 @@ async function getTaskSandboxRuntime(
  const sandbox = await getOrCreateTaskSandbox(c, c.state.organizationId, sandboxId, {});
  const actorId = typeof sandbox.resolve === "function" ? await sandbox.resolve().catch(() => null) : null;
  const switchTarget = sandboxProviderId === "local" ? `sandbox://local/${sandboxId}` : `sandbox://e2b/${sandboxId}`;
+
+  // Resolve the actual repo CWD from the sandbox's $HOME (differs by provider).
+  const repoCwdResult = await sandbox.repoCwd();
+  const cwd = repoCwdResult?.cwd ?? "$HOME/repo";
  const now = Date.now();

  await c.db
@ -585,7 +588,7 @@ async function getTaskSandboxRuntime(
      sandboxProviderId,
      sandboxActorId: typeof actorId === "string" ? actorId : null,
      switchTarget,
-      cwd: SANDBOX_REPO_CWD,
+      cwd,
      createdAt: now,
      updatedAt: now,
    })
@ -595,7 +598,7 @@ async function getTaskSandboxRuntime(
        sandboxProviderId,
        sandboxActorId: typeof actorId === "string" ? actorId : null,
        switchTarget,
-        cwd: SANDBOX_REPO_CWD,
+        cwd,
        updatedAt: now,
      },
    })
@ -606,7 +609,7 @@ async function getTaskSandboxRuntime(
    .set({
      activeSandboxId: sandboxId,
      activeSwitchTarget: switchTarget,
-      activeCwd: SANDBOX_REPO_CWD,
+      activeCwd: cwd,
      updatedAt: now,
    })
    .where(eq(taskRuntime.id, 1))
@ -617,7 +620,7 @@ async function getTaskSandboxRuntime(
    sandboxId,
    sandboxProviderId,
    switchTarget,
-    cwd: SANDBOX_REPO_CWD,
+    cwd,
  };
 }

@ -636,27 +639,35 @@ async function ensureSandboxRepo(c: any, sandbox: any, record: any, opts?: { ski
  // If the repo was already prepared and the caller allows skipping fetch, just return.
  // The clone, fetch, and checkout already happened on a prior call.
  if (opts?.skipFetchIfPrepared && sandboxRepoPrepared) {
+    logActorInfo("task.sandbox", "ensureSandboxRepo skipped (already prepared)");
    return;
  }

+  const repoStart = performance.now();
+
+  const t0 = performance.now();
  const auth = await resolveOrganizationGithubAuth(c, c.state.organizationId);
  const metadata = await getRepositoryMetadata(c);
+  logActorInfo("task.sandbox", "resolveAuth+metadata", { durationMs: Math.round(performance.now() - t0) });
+
  const baseRef = metadata.defaultBranch ?? "main";
-  const sandboxRepoRoot = dirname(SANDBOX_REPO_CWD);
+  // Use $HOME inside the shell script so the path resolves correctly regardless
+  // of which user the sandbox runs as (E2B: "user", local Docker: "sandbox").
  const script = [
    "set -euo pipefail",
-    `mkdir -p ${JSON.stringify(sandboxRepoRoot)}`,
+    'REPO_DIR="$HOME/repo"',
+    'mkdir -p "$HOME"',
    "git config --global credential.helper '!f() { echo username=x-access-token; echo password=${GH_TOKEN:-$GITHUB_TOKEN}; }; f'",
-    `if [ ! -d ${JSON.stringify(`${SANDBOX_REPO_CWD}/.git`)} ]; then rm -rf ${JSON.stringify(SANDBOX_REPO_CWD)} && git clone ${JSON.stringify(
-      metadata.remoteUrl,
-    )} ${JSON.stringify(SANDBOX_REPO_CWD)}; fi`,
-    `cd ${JSON.stringify(SANDBOX_REPO_CWD)}`,
+    `if [ ! -d "$REPO_DIR/.git" ]; then rm -rf "$REPO_DIR" && git clone ${JSON.stringify(metadata.remoteUrl)} "$REPO_DIR"; fi`,
+    'cd "$REPO_DIR"',
    "git fetch origin --prune",
    `if git show-ref --verify --quiet refs/remotes/origin/${JSON.stringify(record.branchName).slice(1, -1)}; then target_ref=${JSON.stringify(
      `origin/${record.branchName}`,
    )}; else target_ref=${JSON.stringify(baseRef)}; fi`,
    `git checkout -B ${JSON.stringify(record.branchName)} \"$target_ref\"`,
  ];
+
+  const t1 = performance.now();
  const result = await sandbox.runProcess({
    command: "bash",
    args: ["-lc", script.join("; ")],
@ -669,6 +680,11 @@ async function ensureSandboxRepo(c: any, sandbox: any, record: any, opts?: { ski
      : undefined,
    timeoutMs: 5 * 60_000,
  });
+  logActorInfo("task.sandbox", "git clone/fetch/checkout", {
+    branch: record.branchName,
+    repo: metadata.remoteUrl,
+    durationMs: Math.round(performance.now() - t1),
+  });

  if ((result.exitCode ?? 0) !== 0) {
    throw new Error(`sandbox repo preparation failed (${result.exitCode ?? 1}): ${[result.stdout, result.stderr].filter(Boolean).join("")}`);
@ -677,10 +693,13 @@ async function ensureSandboxRepo(c: any, sandbox: any, record: any, opts?: { ski
  // On first repo preparation, inject the task owner's git credentials into the sandbox
  // so that push/commit operations are authenticated and attributed to the correct user.
  if (!sandboxRepoPrepared && opts?.authSessionId) {
+    const t2 = performance.now();
    await maybeSwapTaskOwner(c, opts.authSessionId, sandbox);
+    logActorInfo("task.sandbox", "maybeSwapTaskOwner", { durationMs: Math.round(performance.now() - t2) });
  }

  sandboxRepoPrepared = true;
+  logActorInfo("task.sandbox", "ensureSandboxRepo complete", { totalDurationMs: Math.round(performance.now() - repoStart) });
 }

 async function executeInSandbox(
@ -1264,6 +1283,7 @@ export async function createWorkspaceSession(c: any, model?: string, authSession
 }

 export async function ensureWorkspaceSession(c: any, sessionId: string, model?: string, authSessionId?: string): Promise<void> {
+  const ensureStart = performance.now();
  const meta = await readSessionMeta(c, sessionId);
  if (!meta || meta.closed) {
    return;
@ -1283,10 +1303,18 @@ export async function ensureWorkspaceSession(c: any, sessionId: string, model?:
  });

  try {
+    const t0 = performance.now();
    const runtime = await getTaskSandboxRuntime(c, record);
+    logActorInfo("task.session", "getTaskSandboxRuntime", { sessionId, durationMs: Math.round(performance.now() - t0) });
+
+    const t1 = performance.now();
    await ensureSandboxRepo(c, runtime.sandbox, record);
+    logActorInfo("task.session", "ensureSandboxRepo", { sessionId, durationMs: Math.round(performance.now() - t1) });
+
    const resolvedModel = model ?? meta.model ?? (await resolveDefaultModel(c, authSessionId));
    const resolvedAgent = await resolveSandboxAgentForModel(c, resolvedModel);
+
+    const t2 = performance.now();
    await runtime.sandbox.createSession({
      id: meta.sandboxSessionId ?? sessionId,
      agent: resolvedAgent,
@ -1295,12 +1323,14 @@ export async function ensureWorkspaceSession(c: any, sessionId: string, model?:
        cwd: runtime.cwd,
      },
    });
+    logActorInfo("task.session", "createSession", { sessionId, agent: resolvedAgent, model: resolvedModel, durationMs: Math.round(performance.now() - t2) });

    await updateSessionMeta(c, sessionId, {
      sandboxSessionId: meta.sandboxSessionId ?? sessionId,
      status: "ready",
      errorMessage: null,
    });
+    logActorInfo("task.session", "ensureWorkspaceSession complete", { sessionId, totalDurationMs: Math.round(performance.now() - ensureStart) });
    fireRefreshSessionTranscript(c, meta.sandboxSessionId ?? sessionId);
  } catch (error) {
    await updateSessionMeta(c, sessionId, {
@ -1415,12 +1445,19 @@ export async function changeWorkspaceModel(c: any, sessionId: string, model: str
 }

 export async function sendWorkspaceMessage(c: any, sessionId: string, text: string, attachments: Array<any>, authSessionId?: string): Promise<void> {
+  const sendStart = performance.now();
  const meta = requireSendableSessionMeta(await readSessionMeta(c, sessionId), sessionId);
  const record = await ensureWorkspaceSeeded(c);
+
+  const t0 = performance.now();
  const runtime = await getTaskSandboxRuntime(c, record);
+  logActorInfo("task.message", "getTaskSandboxRuntime", { sessionId, durationMs: Math.round(performance.now() - t0) });
+
+  const t1 = performance.now();
  // Skip git fetch on subsequent messages — the repo was already prepared during session
  // creation. This avoids a 5-30s network round-trip to GitHub on every prompt.
  await ensureSandboxRepo(c, runtime.sandbox, record, { skipFetchIfPrepared: true, authSessionId });
+  logActorInfo("task.message", "ensureSandboxRepo", { sessionId, durationMs: Math.round(performance.now() - t1) });

  // Check if the task owner needs to swap. If a different user is sending this message,
  // update the owner record and inject their git credentials into the sandbox.
@ -1450,10 +1487,12 @@ export async function sendWorkspaceMessage(c: any, sessionId: string, text: stri
  await syncWorkspaceSessionStatus(c, meta.sandboxSessionId, "running", Date.now());

  try {
+    const t2 = performance.now();
    await runtime.sandbox.sendPrompt({
      sessionId: meta.sandboxSessionId,
      prompt: prompt.join("\n\n"),
    });
+    logActorInfo("task.message", "sendPrompt", { sessionId, durationMs: Math.round(performance.now() - t2) });
    await syncWorkspaceSessionStatus(c, meta.sandboxSessionId, "idle", Date.now());
  } catch (error) {
    await updateSessionMeta(c, sessionId, {
@ -1463,6 +1502,7 @@ export async function sendWorkspaceMessage(c: any, sessionId: string, text: stri
    await syncWorkspaceSessionStatus(c, meta.sandboxSessionId, "error", Date.now());
    throw error;
  }
+  logActorInfo("task.message", "sendWorkspaceMessage complete", { sessionId, totalDurationMs: Math.round(performance.now() - sendStart) });
 }

 export async function stopWorkspaceSession(c: any, sessionId: string): Promise<void> {
--- a/foundry/packages/backend/src/config/runner-version.ts
+++ b/foundry/packages/backend/src/config/runner-version.ts
@ -0,0 +1,33 @@
+import { readFileSync } from "node:fs";
+
+function parseRunnerVersion(rawValue: string | undefined): number | undefined {
+  const value = rawValue?.trim();
+  if (!value) {
+    return undefined;
+  }
+
+  const parsed = Number.parseInt(value, 10);
+  if (Number.isNaN(parsed)) {
+    return undefined;
+  }
+
+  return parsed;
+}
+
+export function resolveRunnerVersion(): number | undefined {
+  const envVersion = parseRunnerVersion(process.env.RIVET_RUNNER_VERSION);
+  if (envVersion !== undefined) {
+    return envVersion;
+  }
+
+  const versionFilePath = process.env.RIVET_RUNNER_VERSION_FILE;
+  if (!versionFilePath) {
+    return undefined;
+  }
+
+  try {
+    return parseRunnerVersion(readFileSync(versionFilePath, "utf8"));
+  } catch {
+    return undefined;
+  }
+}
--- a/foundry/packages/backend/src/index.ts
+++ b/foundry/packages/backend/src/index.ts
@ -141,6 +141,59 @@ export async function startBackend(options: BackendStartOptions = {}): Promise<v
  };
  app.use("/v1/*", cors(corsConfig));
  app.use("/v1", cors(corsConfig));
+
+  // On-demand memory snapshot endpoint for diagnosing spikes (dev only).
+  // Usage: curl http://127.0.0.1:7741/debug/memory
+  // Trigger GC first: curl http://127.0.0.1:7741/debug/memory?gc=1
+  // Write JSC heap snapshot: curl http://127.0.0.1:7741/debug/memory?heap=1
+  //   (writes /tmp/foundry-heap-<timestamp>.json, inspect with chrome://tracing)
+  app.get("/debug/memory", async (c) => {
+    if (process.env.NODE_ENV !== "development") {
+      return c.json({ error: "debug endpoints disabled in production" }, 403);
+    }
+    const wantGc = c.req.query("gc") === "1";
+    if (wantGc && typeof Bun !== "undefined") {
+      // Bun.gc(true) triggers a synchronous full GC sweep in JavaScriptCore.
+      Bun.gc(true);
+    }
+    const mem = process.memoryUsage();
+    const rssMb = Math.round(mem.rss / 1024 / 1024);
+    const heapUsedMb = Math.round(mem.heapUsed / 1024 / 1024);
+    const heapTotalMb = Math.round(mem.heapTotal / 1024 / 1024);
+    const externalMb = Math.round(mem.external / 1024 / 1024);
+    const nonHeapMb = rssMb - heapUsedMb - externalMb;
+    // Bun.heapStats() gives JSC-specific breakdown: object counts, typed array
+    // bytes, extra memory (native allocations tracked by JSC). Useful for
+    // distinguishing JS object bloat from native/WASM memory.
+    // eslint-disable-next-line @typescript-eslint/no-explicit-any
+    const BunAny = Bun as any;
+    const heapStats = typeof BunAny.heapStats === "function" ? BunAny.heapStats() : null;
+    const snapshot = {
+      rssMb,
+      heapUsedMb,
+      heapTotalMb,
+      externalMb,
+      nonHeapMb,
+      gcTriggered: wantGc,
+      rssBytes: mem.rss,
+      heapUsedBytes: mem.heapUsed,
+      heapTotalBytes: mem.heapTotal,
+      externalBytes: mem.external,
+      ...(heapStats ? { bunHeapStats: heapStats } : {}),
+    };
+    // Optionally write a full JSC heap snapshot for offline analysis.
+    let heapSnapshotPath: string | null = null;
+    const wantHeap = c.req.query("heap") === "1";
+    if (wantHeap && typeof Bun !== "undefined") {
+      heapSnapshotPath = `/tmp/foundry-heap-${Date.now()}.json`;
+      // Bun.generateHeapSnapshot("v8") returns a V8-compatible JSON string.
+      const heapJson = Bun.generateHeapSnapshot("v8");
+      await Bun.write(heapSnapshotPath, heapJson);
+    }
+    logger.info(snapshot, "memory_usage_debug");
+    return c.json({ ...snapshot, ...(heapSnapshotPath ? { heapSnapshotPath } : {}) });
+  });
+
  app.use("*", async (c, next) => {
    const requestId = c.req.header("x-request-id")?.trim() || randomUUID();
    const start = performance.now();
@ -354,6 +407,11 @@ export async function startBackend(options: BackendStartOptions = {}): Promise<v
    },
    hostname: config.backend.host,
    port: config.backend.port,
+    // Bun defaults to 10s idle timeout. Actor RPCs go through the gateway
+    // tunnel (not direct HTTP), and the SSE stream has a 1s ping interval
+    // (RUNNER_SSE_PING_INTERVAL in rivetkit), so the idle timeout likely
+    // never fires in practice. Set high as a safety net regardless.
+    idleTimeout: 255,
  });

  logger.info(
@ -364,6 +422,42 @@ export async function startBackend(options: BackendStartOptions = {}): Promise<v
    "backend_started",
  );

+  // Periodic memory usage reporting for diagnosing memory spikes (dev only).
+  // Logs JS heap, RSS, and external (native/WASM) separately so we can tell
+  // whether spikes come from JS objects, Bun/JSC internals, or native addons
+  // like SQLite/WASM.
+  if (process.env.NODE_ENV === "development") {
+    let prevRss = 0;
+    setInterval(() => {
+      const mem = process.memoryUsage();
+      const rssMb = Math.round(mem.rss / 1024 / 1024);
+      const heapUsedMb = Math.round(mem.heapUsed / 1024 / 1024);
+      const heapTotalMb = Math.round(mem.heapTotal / 1024 / 1024);
+      const externalMb = Math.round(mem.external / 1024 / 1024);
+      // Non-heap RSS: memory not accounted for by JS heap or external buffers.
+      // Large values here point to native allocations (WASM, mmap, child process
+      // bookkeeping, Bun's internal arena, etc.).
+      const nonHeapMb = rssMb - heapUsedMb - externalMb;
+      const deltaRss = rssMb - prevRss;
+      prevRss = rssMb;
+      logger.info(
+        {
+          rssMb,
+          heapUsedMb,
+          heapTotalMb,
+          externalMb,
+          nonHeapMb,
+          deltaRssMb: deltaRss,
+          rssBytes: mem.rss,
+          heapUsedBytes: mem.heapUsed,
+          heapTotalBytes: mem.heapTotal,
+          externalBytes: mem.external,
+        },
+        "memory_usage",
+      );
+    }, 60_000);
+  }
+
  process.on("SIGINT", async () => {
    server.stop();
    process.exit(0);
--- a/foundry/packages/client/package.json
+++ b/foundry/packages/client/package.json
@ -6,7 +6,7 @@
  "main": "dist/index.js",
  "types": "dist/index.d.ts",
  "scripts": {
-    "build": "tsup src/index.ts --format esm --dts",
+    "build": "tsup src/index.ts --format esm --dts --tsconfig tsconfig.build.json",
    "typecheck": "tsc --noEmit",
    "test": "vitest run",
    "test:e2e:full": "HF_ENABLE_DAEMON_FULL_E2E=1 vitest run test/e2e/full-integration-e2e.test.ts",
--- a/foundry/packages/client/src/subscription/remote-manager.ts
+++ b/foundry/packages/client/src/subscription/remote-manager.ts
@ -4,6 +4,11 @@ import { topicDefinitions, type TopicData, type TopicDefinition, type TopicKey,

 const GRACE_PERIOD_MS = 30_000;

+/** Initial retry delay in ms. */
+const RETRY_BASE_MS = 1_000;
+/** Maximum retry delay in ms. */
+const RETRY_MAX_MS = 30_000;
+
 /**
 * Remote implementation of SubscriptionManager.
 * Each cache entry owns one actor connection plus one materialized snapshot.
@ -80,9 +85,12 @@ class TopicEntry<TData, TParams, TEvent> {
  private unsubscribeEvent: (() => void) | null = null;
  private unsubscribeError: (() => void) | null = null;
  private teardownTimer: ReturnType<typeof setTimeout> | null = null;
+  private retryTimer: ReturnType<typeof setTimeout> | null = null;
+  private retryAttempt = 0;
  private startPromise: Promise<void> | null = null;
  private eventPromise: Promise<void> = Promise.resolve();
  private started = false;
+  private disposed = false;

  constructor(
    private readonly topicKey: TopicKey,
@ -136,7 +144,9 @@ class TopicEntry<TData, TParams, TEvent> {
  }

  dispose(): void {
+    this.disposed = true;
    this.cancelTeardown();
+    this.cancelRetry();
    this.unsubscribeEvent?.();
    this.unsubscribeError?.();
    if (this.conn) {
@ -148,6 +158,55 @@ class TopicEntry<TData, TParams, TEvent> {
    this.error = null;
    this.lastRefreshAt = null;
    this.started = false;
+    this.retryAttempt = 0;
+  }
+
+  private cancelRetry(): void {
+    if (this.retryTimer) {
+      clearTimeout(this.retryTimer);
+      this.retryTimer = null;
+    }
+  }
+
+  /**
+   * Schedules a retry with exponential backoff. Cleans up any existing
+   * connection state before reconnecting.
+   */
+  private scheduleRetry(): void {
+    if (this.disposed || this.listenerCount === 0) {
+      return;
+    }
+
+    const delay = Math.min(RETRY_BASE_MS * 2 ** this.retryAttempt, RETRY_MAX_MS);
+    this.retryAttempt++;
+
+    this.retryTimer = setTimeout(() => {
+      this.retryTimer = null;
+      if (this.disposed || this.listenerCount === 0) {
+        return;
+      }
+
+      // Tear down the old connection before retrying
+      this.cleanupConnection();
+      this.started = false;
+      this.startPromise = this.start().finally(() => {
+        this.startPromise = null;
+      });
+    }, delay);
+  }
+
+  /**
+   * Cleans up connection resources without resetting data/status/retry state.
+   */
+  private cleanupConnection(): void {
+    this.unsubscribeEvent?.();
+    this.unsubscribeError?.();
+    this.unsubscribeEvent = null;
+    this.unsubscribeError = null;
+    if (this.conn) {
+      void this.conn.dispose();
+    }
+    this.conn = null;
  }

  private async start(): Promise<void> {
@ -164,17 +223,20 @@ class TopicEntry<TData, TParams, TEvent> {
        this.status = "error";
        this.error = error instanceof Error ? error : new Error(String(error));
        this.notify();
+        this.scheduleRetry();
      });
      this.data = await this.definition.fetchInitial(this.backend, this.params);
      this.status = "connected";
      this.lastRefreshAt = Date.now();
      this.started = true;
+      this.retryAttempt = 0;
      this.notify();
    } catch (error) {
      this.status = "error";
      this.error = error instanceof Error ? error : new Error(String(error));
      this.started = false;
      this.notify();
+      this.scheduleRetry();
    }
  }

--- a/foundry/packages/client/tsconfig.build.json
+++ b/foundry/packages/client/tsconfig.build.json
@ -0,0 +1,6 @@
+{
+  "extends": "./tsconfig.json",
+  "compilerOptions": {
+    "ignoreDeprecations": "6.0"
+  }
+}
--- a/foundry/packages/frontend/src/components/mock-layout.tsx
+++ b/foundry/packages/frontend/src/components/mock-layout.tsx
@ -187,6 +187,7 @@ function toTaskModel(
    diffs: detail?.diffs ?? {},
    fileTree: detail?.fileTree ?? [],
    minutesUsed: detail?.minutesUsed ?? 0,
+    sandboxes: detail?.sandboxes ?? [],
    activeSandboxId: detail?.activeSandboxId ?? null,
    primaryUserLogin: detail?.primaryUserLogin ?? summary.primaryUserLogin ?? null,
    primaryUserAvatarUrl: detail?.primaryUserAvatarUrl ?? summary.primaryUserAvatarUrl ?? null,
--- a/foundry/packages/shared/package.json
+++ b/foundry/packages/shared/package.json
@ -6,7 +6,7 @@
  "main": "dist/index.js",
  "types": "dist/index.d.ts",
  "scripts": {
-    "build": "tsup src/index.ts --format esm --dts",
+    "build": "tsup src/index.ts --format esm --dts --tsconfig tsconfig.build.json",
    "typecheck": "tsc --noEmit",
    "test": "vitest run"
  },
--- a/foundry/packages/shared/tsconfig.build.json
+++ b/foundry/packages/shared/tsconfig.build.json
@ -0,0 +1,6 @@
+{
+  "extends": "./tsconfig.json",
+  "compilerOptions": {
+    "ignoreDeprecations": "6.0"
+  }
+}
--- a/foundry/research/friction/sandbox-agent.mdx
+++ b/foundry/research/friction/sandbox-agent.mdx
@ -55,7 +55,7 @@ Upgrading backend integration from legacy sandbox-agent session endpoints to `sa

 ### Friction / Issue

-`0.2.0` no longer exposes `/v1/sessions` endpoints used by the backend integration; direct session create/status polling via legacy REST paths returns `404`.
+`0.2.0` no longer exposes the legacy session REST endpoints used by the backend integration; direct session create/status polling via those paths returns `404`.

 ### Attempted Fix / Workaround

@ -65,5 +65,5 @@ Upgrading backend integration from legacy sandbox-agent session endpoints to `sa

 ### Outcome

- Backend no longer depends on removed `/v1/sessions` endpoints.
+- Backend no longer depends on removed legacy session REST endpoints.
 - Daytona flow is aligned with `sandbox-agent 0.2.0` runtime and SDK usage.
--- a/frontend/packages/website/src/components/GetStarted.tsx
+++ b/frontend/packages/website/src/components/GetStarted.tsx
@ -103,7 +103,7 @@ function SdkCodeHighlighted() {
  );
 }

-const sandboxCommand = `curl -fsSL https://releases.rivet.dev/sandbox-agent/0.3.x/install.sh | sh`;
+const sandboxCommand = `curl -fsSL https://releases.rivet.dev/sandbox-agent/0.4.x/install.sh | sh`;

 const sourceCommands = `git clone https://github.com/rivet-dev/sandbox-agent
 cd sandbox-agent
@ -196,7 +196,7 @@ export function GetStarted() {
                    <span className="text-zinc-300">curl -fsSL \</span>
                    {"\n"}
                    <span className="text-zinc-300">{"    "}</span>
-                    <span className="text-green-400">https://releases.rivet.dev/sandbox-agent/0.3.x/install.sh</span>
+                    <span className="text-green-400">https://releases.rivet.dev/sandbox-agent/0.4.x/install.sh</span>
                    <span className="text-zinc-300"> | </span>
                    <span className="text-blue-400">sh</span>
                  </code>
--- a/1
+++ b/1
@ -186,4 +186,3 @@ foundry-format:
 [group('foundry')]
 foundry-docker-build tag='foundry:local':
 	docker build -f foundry/docker/backend.Dockerfile -t {{tag}} .
-
--- a/pnpm-lock.yaml
+++ b/pnpm-lock.yaml
@ -450,6 +450,31 @@ importers:
        specifier: latest
        version: 5.9.3

+  examples/sprites:
+    dependencies:
+      '@fly/sprites':
+        specifier: latest
+        version: 0.0.1
+      '@sandbox-agent/example-shared':
+        specifier: workspace:*
+        version: link:../shared
+      sandbox-agent:
+        specifier: workspace:*
+        version: link:../../sdks/typescript
+    devDependencies:
+      '@types/node':
+        specifier: latest
+        version: 25.5.0
+      tsx:
+        specifier: latest
+        version: 4.21.0
+      typescript:
+        specifier: latest
+        version: 6.0.2
+      vitest:
+        specifier: ^3.0.0
+        version: 3.2.4(@types/debug@4.1.12)(@types/node@25.5.0)(jiti@1.21.7)(jsdom@26.1.0)(tsx@4.21.0)(yaml@2.8.2)
+
  examples/vercel:
    dependencies:
      '@sandbox-agent/example-shared':
@ -531,7 +556,7 @@ importers:
        version: 1.3.10
      tsup:
        specifier: ^8.5.0
-        version: 8.5.1(jiti@1.21.7)(postcss@8.5.6)(tsx@4.21.0)(typescript@5.9.3)(yaml@2.8.2)
+        version: 8.5.1(jiti@1.21.7)(postcss@8.5.6)(tsx@4.21.0)(typescript@6.0.2)(yaml@2.8.2)

  foundry/packages/client:
    dependencies:
@ -553,7 +578,7 @@ importers:
        version: 19.2.14
      tsup:
        specifier: ^8.5.0
-        version: 8.5.1(jiti@1.21.7)(postcss@8.5.6)(tsx@4.21.0)(typescript@5.9.3)(yaml@2.8.2)
+        version: 8.5.1(jiti@1.21.7)(postcss@8.5.6)(tsx@4.21.0)(typescript@6.0.2)(yaml@2.8.2)

  foundry/packages/frontend:
    dependencies:
@ -614,7 +639,7 @@ importers:
        version: 0.1.27(@types/react@19.2.14)(react@19.2.4)
      tsup:
        specifier: ^8.5.0
-        version: 8.5.1(jiti@1.21.7)(postcss@8.5.6)(tsx@4.21.0)(typescript@5.9.3)(yaml@2.8.2)
+        version: 8.5.1(jiti@1.21.7)(postcss@8.5.6)(tsx@4.21.0)(typescript@6.0.2)(yaml@2.8.2)
      vite:
        specifier: ^7.1.3
        version: 7.3.1(@types/node@25.5.0)(jiti@1.21.7)(tsx@4.21.0)(yaml@2.8.2)
@ -633,7 +658,7 @@ importers:
    devDependencies:
      tsup:
        specifier: ^8.5.0
-        version: 8.5.1(jiti@1.21.7)(postcss@8.5.6)(tsx@4.21.0)(typescript@5.9.3)(yaml@2.8.2)
+        version: 8.5.1(jiti@1.21.7)(postcss@8.5.6)(tsx@4.21.0)(typescript@6.0.2)(yaml@2.8.2)

  frontend/packages/inspector:
    dependencies:
@ -771,25 +796,6 @@ importers:
        specifier: ^5.7.0
        version: 5.9.3

-  scripts/sandbox-testing:
-    dependencies:
-      '@daytonaio/sdk':
-        specifier: latest
-        version: 0.151.0(ws@8.19.0)
-      '@e2b/code-interpreter':
-        specifier: latest
-        version: 2.3.3
-    devDependencies:
-      '@types/node':
-        specifier: latest
-        version: 25.5.0
-      tsx:
-        specifier: latest
-        version: 4.21.0
-      typescript:
-        specifier: latest
-        version: 5.9.3
-
  sdks/acp-http-client:
    dependencies:
      '@agentclientprotocol/sdk':
@ -988,6 +994,9 @@ importers:
      '@e2b/code-interpreter':
        specifier: '>=1.0.0'
        version: 2.3.3
+      '@fly/sprites':
+        specifier: '>=0.0.1'
+        version: 0.0.1
      '@types/dockerode':
        specifier: ^4.0.0
        version: 4.0.1
@ -2487,6 +2496,10 @@ packages:
    resolution: {integrity: sha512-vBZP4NlzfOlerQTnba4aqZoMhE/a9HY7HRqoOPaETQcSQuWEIyZMHGfVu6w9wGtGK5fED5qRs2DteVCjOH60sA==}
    engines: {node: '>=14'}

+  '@fly/sprites@0.0.1':
+    resolution: {integrity: sha512-1s+dIVi/pTMP4Aj4Mkg+4LoZ/+a0Kp6l9piPRxvpgEKm11b/eRiZgJwVytwAHeI/vtg2fuwcFExjtXOEfny/TA==}
+    engines: {node: '>=24.0.0'}
+
  '@grpc/grpc-js@1.14.3':
    resolution: {integrity: sha512-Iq8QQQ/7X3Sac15oB6p0FmUg/klxQvXLeileoqrTRGJYLV+/9tubbr9ipz0GKHjmXVsgFPo/+W+2cA8eNcR+XA==}
    engines: {node: '>=12.10.0'}
@ -6937,6 +6950,11 @@ packages:
    engines: {node: '>=14.17'}
    hasBin: true

+  typescript@6.0.2:
+    resolution: {integrity: sha512-bGdAIrZ0wiGDo5l8c++HWtbaNCWTS4UTv7RaTH/ThVIgjkveJt83m74bBHMJkuCbslY8ixgLBVZJIOiQlQTjfQ==}
+    engines: {node: '>=14.17'}
+    hasBin: true
+
  ufo@1.6.3:
    resolution: {integrity: sha512-yDJTmhydvl5lJzBmy/hyOAA0d+aqCBuwl818haVdYCRrWV84o7YyeVm4QlVHStqNrrJSTb6jKuFAVqAFsr+K3Q==}

@ -8975,6 +8993,8 @@ snapshots:

  '@fastify/busboy@2.1.1': {}

+  '@fly/sprites@0.0.1': {}
+
  '@grpc/grpc-js@1.14.3':
    dependencies:
      '@grpc/proto-loader': 0.8.0
@ -14144,6 +14164,34 @@ snapshots:
      - tsx
      - yaml

+  tsup@8.5.1(jiti@1.21.7)(postcss@8.5.6)(tsx@4.21.0)(typescript@6.0.2)(yaml@2.8.2):
+    dependencies:
+      bundle-require: 5.1.0(esbuild@0.27.3)
+      cac: 6.7.14
+      chokidar: 4.0.3
+      consola: 3.4.2
+      debug: 4.4.3
+      esbuild: 0.27.3
+      fix-dts-default-cjs-exports: 1.0.1
+      joycon: 3.1.1
+      picocolors: 1.1.1
+      postcss-load-config: 6.0.1(jiti@1.21.7)(postcss@8.5.6)(tsx@4.21.0)(yaml@2.8.2)
+      resolve-from: 5.0.0
+      rollup: 4.56.0
+      source-map: 0.7.6
+      sucrase: 3.35.1
+      tinyexec: 0.3.2
+      tinyglobby: 0.2.15
+      tree-kill: 1.2.2
+    optionalDependencies:
+      postcss: 8.5.6
+      typescript: 6.0.2
+    transitivePeerDependencies:
+      - jiti
+      - supports-color
+      - tsx
+      - yaml
+
  tsx@4.21.0:
    dependencies:
      esbuild: 0.27.3
@ -14194,6 +14242,8 @@ snapshots:

  typescript@5.9.3: {}

+  typescript@6.0.2: {}
+
  ufo@1.6.3: {}

  ultrahtml@1.6.0: {}
--- a/pnpm-workspace.yaml
+++ b/pnpm-workspace.yaml
@ -10,6 +10,5 @@ packages:
  - "sdks/gigacode/platforms/*"
  - "resources/vercel-ai-sdk-schemas"
  - "scripts/release"
-  - "scripts/sandbox-testing"
  - "examples/*"
  - "server/packages/sandbox-agent/tests/opencode-compat"
--- a/research/acp/friction.md
+++ b/research/acp/friction.md
@ -81,7 +81,7 @@ Update this file continuously during the migration.
 - Date: 2026-02-10
 - Area: Session lifecycle surface
 - Issue: ACP stable does not include v1-equivalent methods for session listing, explicit session termination/delete, or event-log polling.
- Impact: Direct lift-and-shift of `/v1/sessions`, `/terminate`, and `/events` polling is not possible with ACP core only.
+- Impact: Direct lift-and-shift of the legacy session REST list, terminate, and event-polling behavior is not possible with ACP core only.
 - Proposed direction: Define `_sandboxagent/session/*` extension methods for these control operations, while keeping core prompt flow on standard ACP methods.
 - Decision: Open.
 - Owner: Unassigned.
--- a/research/acp/inspector-unimplemented.md
+++ b/research/acp/inspector-unimplemented.md
@ -11,4 +11,4 @@ This tracks legacy inspector behaviors that do not yet have full parity on ACP v
 5. TDOO: Agent mode discovery before creating a session is not implemented (inspector currently returns cached-or-empty mode lists).
 6. TDOO: Agent model discovery before creating a session is not implemented (inspector currently returns cached-or-empty model lists).
 7. TDOO: Session listing only reflects sessions created by this inspector client instance (not full server/global session inventory).
-8. TDOO: Event history shown in inspector is synthesized from ACP traffic handled by the inspector compatibility layer, not the old canonical `/v1/sessions/*/events` backend history.
+8. TDOO: Event history shown in inspector is synthesized from ACP traffic handled by the inspector compatibility layer, not the old canonical session-events backend history.
--- a/research/acp/merge-acp.md
+++ b/research/acp/merge-acp.md
@ -20,8 +20,8 @@ Static v1 endpoints today:

 - `GET /v1/agents`
 - `POST /v1/agents/:agent/install`
- `GET /v1/sessions`
- `GET /v1/sessions/:session_id`
+- legacy session list endpoint
+- legacy session detail endpoint
 - `GET /v1/fs/entries`
 - `GET /v1/fs/file`
 - `PUT /v1/fs/file`
@ -76,8 +76,8 @@ Interpretation for clients: all agent/session operations and non-binary filesyst
 | --- | --- | --- |
 | `GET /v1/agents` | `_sandboxagent/agent/list` | Response keeps current `AgentListResponse` shape for low migration risk. |
 | `POST /v1/agents/:agent/install` | `_sandboxagent/agent/install` | Params include `agent`, `reinstall`, `agentVersion`, `agentProcessVersion`. |
-| `GET /v1/sessions` | `_sandboxagent/session/list` | Return current `SessionListResponse` shape (not ACP unstable list shape). |
-| `GET /v1/sessions/:session_id` | `_sandboxagent/session/get` | Return current `SessionInfo` shape; error on missing session. |
+| legacy session list endpoint | `_sandboxagent/session/list` | Return current `SessionListResponse` shape (not ACP unstable list shape). |
+| legacy session detail endpoint | `_sandboxagent/session/get` | Return current `SessionInfo` shape; error on missing session. |
 | `GET /v1/fs/entries` | `_sandboxagent/fs/list_entries` | Preserve path + optional `sessionId` resolution semantics. |
 | `GET /v1/fs/file` | keep HTTP + `_sandboxagent/fs/read_file` | HTTP is primary because responses may require large streaming reads; ACP variant exists for compatibility/smaller payloads. |
 | `PUT /v1/fs/file` | keep HTTP + `_sandboxagent/fs/write_file` | HTTP is primary for large binary writes; ACP variant exists for compatibility/smaller payloads. |
@ -143,7 +143,7 @@ Package boundary after migration:

 - `acp-http-client` remains protocol-pure ACP transport and generic `extMethod`/`extNotification`.
 - `sandbox-agent` remains the typed wrapper that maps convenience methods to `_sandboxagent/...` extension methods.
- No direct `/v1/agents*`, `/v1/sessions*`, or non-binary `/v1/fs/*` fetches in SDK runtime code.
+- No direct legacy agents/session REST fetches or non-binary `/v1/fs/*` fetches in SDK runtime code.
 - Binary file transfer keeps direct HTTP fetches on the three endpoints listed above.
 - SDK policy: prefer HTTP for `readFsFile`/`writeFsFile`/`uploadFsBatch` even if ACP extension variants exist.

@ -184,17 +184,17 @@ Alternative (optional): introduce a runtime-only control connection mode that do
 - TypeScript SDK (`sdks/typescript/src/client.ts`):
  - Repoint `listAgents`, `installAgent`, `listSessions`, `getSession`, `listFsEntries`, `deleteFsEntry`, `mkdirFs`, `moveFs`, and `statFs` to ACP extension calls.
  - Keep `readFsFile`, `writeFsFile`, and `uploadFsBatch` on HTTP endpoints.
-  - Remove direct runtime fetch usage for `/v1/agents*`, `/v1/sessions*`, and non-binary `/v1/fs/*`.
+  - Remove direct runtime fetch usage for legacy agents/session REST endpoints and non-binary `/v1/fs/*`.
  - Keep method names stable for callers.
  - Move these methods to connected-only semantics (`NotConnectedError` when disconnected).
 - CLI (`server/packages/sandbox-agent/src/cli.rs`):
-  - Make `api agents list/install` call ACP extension methods (via ACP post flow), not direct `/v1/agents*` HTTP calls.
+  - Make `api agents list/install` call ACP extension methods (via ACP post flow), not direct legacy agent HTTP calls.
 - Inspector flow/docs:
  - Stop depending on `GET /v1/agents` in startup path; use ACP extension instead.

 ### Phase 3: Remove Static Endpoints (Except Health + Binary FS Transfer)

- Remove route registrations for `/v1/agents*`, `/v1/sessions*`, `/v1/fs/entries`, `/v1/fs/entry`, `/v1/fs/mkdir`, `/v1/fs/move`, `/v1/fs/stat` from `router.rs`.
+- Remove route registrations for legacy agent/session REST endpoints and `/v1/fs/entries`, `/v1/fs/entry`, `/v1/fs/mkdir`, `/v1/fs/move`, `/v1/fs/stat` from `router.rs`.
 - Keep `/v1/health`, `/v1/rpc`, `GET /v1/fs/file`, `PUT /v1/fs/file`, and `POST /v1/fs/upload-batch`.
 - Optional short deprecation period: convert removed routes to `410 Gone` with explicit extension method in `detail`.

@ -237,6 +237,6 @@ Inspector:

 ## Open Decisions

-1. Should removed `/v1/agents*`, `/v1/sessions*`, and non-binary `/v1/fs/*` return `410` for one release or be dropped immediately?
+1. Should removed legacy agent/session REST endpoints and non-binary `/v1/fs/*` return `410` for one release or be dropped immediately?
 2. Do we keep a strict response-shape parity layer for session/file methods, or normalize to ACP-native shapes?
 3. Should `/` service-root remain as informational HTTP, or be treated as out-of-scope for this “only health static + binary fs transfer” policy?
--- a/research/acp/missing-features-spec/01-questions.md
+++ b/research/acp/missing-features-spec/01-questions.md
@ -59,11 +59,11 @@ struct PendingQuestion {
 }
 ```

-## v1 HTTP Endpoints (from `router.rs`)
+## Legacy Session REST Endpoints (from `router.rs`)

 ```
-POST /v1/sessions/{session_id}/questions/{question_id}/reply   -> 204 No Content
-POST /v1/sessions/{session_id}/questions/{question_id}/reject   -> 204 No Content
+session question reply endpoint   -> 204 No Content
+session question reject endpoint  -> 204 No Content
 ```

 ### `reply_question` handler
@ -122,7 +122,7 @@ Key flow:

 1. Agent emits `question.requested` event with `QuestionEventData { status: Requested, question_id, prompt, options }`
 2. Client renders question UI
-3. Client calls `POST /v1/sessions/{id}/questions/{qid}/reply` with `{ answers: [["selected"]] }` or `POST .../reject`
+3. Client calls the legacy session question reply or reject endpoint with `{ answers: [["selected"]] }`
 4. System emits `question.resolved` event with `QuestionEventData { status: Answered, response: Some("...") }` or `{ status: Rejected }`

 ## v1 Agent Capability
--- a/research/acp/missing-features-spec/07-session-termination.md
+++ b/research/acp/missing-features-spec/07-session-termination.md
@ -4,7 +4,7 @@

 ## Summary

-v1 had explicit session termination (`POST /v1/sessions/{id}/terminate`). v1 only has `session/cancel` (turn cancellation, not session kill) and `DELETE /v1/rpc` (connection close, not session termination). Need explicit session destroy/terminate semantics.
+The legacy session REST API had an explicit terminate endpoint. ACP only has `session/cancel` (turn cancellation, not session kill) and `DELETE /v1/rpc` (connection close, not session termination). Need explicit session destroy/terminate semantics.

 ## Current v1 State

@ -20,7 +20,7 @@ v1 had explicit session termination (`POST /v1/sessions/{id}/terminate`). v1 onl
 ### HTTP Endpoint

 ```
-POST /v1/sessions/{id}/terminate
+legacy session terminate endpoint
 ```

 ### Handler (from `router.rs`)
--- a/research/acp/missing-features-spec/08-model-variants.md
+++ b/research/acp/missing-features-spec/08-model-variants.md
@ -49,7 +49,7 @@ Returned `AgentModelsResponse` with full model list including variants.
 ### Session Creation with Variant

 ```
-POST /v1/sessions
+legacy session create endpoint
 ```

 Body included `variant: Option<String>` to select a specific model variant at session creation time.
--- a/research/acp/missing-features-spec/10-include-raw.md
+++ b/research/acp/missing-features-spec/10-include-raw.md
@ -34,7 +34,7 @@ pub struct UniversalEvent {
 ### v1 Usage

 ```
-GET /v1/sessions/{id}/events?include_raw=true
+legacy event polling endpoint with `include_raw=true`
 ```

 When `include_raw=true`, each `UniversalEvent` included the verbatim JSON the agent process emitted before normalization into the universal schema.
--- a/research/acp/missing-features-spec/16-session-info.md
+++ b/research/acp/missing-features-spec/16-session-info.md
@ -1,10 +1,10 @@
 # Feature 16: Session Info

-**Implementation approach:** New HTTP endpoints (`GET /v1/sessions`, `GET /v1/sessions/{id}`)
+**Implementation approach:** New session-info HTTP endpoints

 ## Summary

-v1 `SessionInfo` tracked `event_count`, `created_at`, `updated_at`, and full `mcp` config. v1 has session data in the ACP runtime's `MetaSession` struct but no HTTP endpoints to query it. Add REST endpoints for session listing and detail.
+v1 `SessionInfo` tracked `event_count`, `created_at`, `updated_at`, and full `mcp` config. v1 has session data in the ACP runtime's `MetaSession` struct but no HTTP endpoints to query it. Add HTTP endpoints for session listing and detail.

 ## Current v1 State

@ -117,8 +117,8 @@ fn build_session_info(state: &SessionState) -> SessionInfo {
 ### New HTTP Endpoints

 ```
-GET /v1/sessions              -> SessionListResponse
-GET /v1/sessions/{id}         -> SessionInfo
+session list endpoint         -> SessionListResponse
+session detail endpoint       -> SessionInfo
 ```

 These are control-plane HTTP endpoints (not ACP), providing session visibility without requiring an active ACP connection.
@ -156,7 +156,7 @@ Need to add:

 | File | Change |
 |------|--------|
-| `server/packages/sandbox-agent/src/router.rs` | Add `GET /v1/sessions` and `GET /v1/sessions/{id}` handlers; add response types |
+| `server/packages/sandbox-agent/src/router.rs` | Add session list and session detail handlers; add response types |
 | `server/packages/sandbox-agent/src/acp_runtime/mod.rs` | Add `created_at` to `MetaSession`; add `ended` tracking; expose `list_sessions()` and `get_session()` public methods |
 | `sdks/typescript/src/client.ts` | Add `listSessions()` and `getSession(id)` methods |
 | `server/packages/sandbox-agent/tests/v1_api.rs` | Add session listing and detail tests |
@ -165,6 +165,6 @@ Need to add:

 | Doc | Change |
 |-----|--------|
-| `docs/openapi.json` | Add `/v1/sessions` and `/v1/sessions/{id}` endpoint specs |
+| `docs/openapi.json` | Add session list and session detail endpoint specs |
 | `docs/cli.mdx` | Add CLI `sessions list` and `sessions info` commands |
 | `docs/sdks/typescript.mdx` | Document session listing SDK methods |
--- a/research/acp/missing-features-spec/17-error-termination-metadata.md
+++ b/research/acp/missing-features-spec/17-error-termination-metadata.md
@ -171,7 +171,7 @@ When an agent process terminates with an error:
 ### Session Info Integration

 Termination metadata should be accessible via:
- `GET /v1/sessions/{id}` (Feature #16) — include `terminationInfo` in response when session has ended
+- the session info endpoint (Feature #16) — include `terminationInfo` in response when session has ended
 - `session/list` ACP response — include termination status in session entries

 ### Files to Modify
--- a/research/acp/missing-features-spec/plan.md
+++ b/research/acp/missing-features-spec/plan.md
@ -36,7 +36,7 @@ Session-level features that build on Phase A runtime tracking.

 | Order | Feature                                                      | Spec | Approach                                             | Effort |
 |:-----:|--------------------------------------------------------------|:----:|------------------------------------------------------|:------:|
-| B1    | [Session Info](./16-session-info.md)                         | #16  | New `GET /v1/sessions` and `GET /v1/sessions/{id}`  | Medium |
+| B1    | [Session Info](./16-session-info.md)                         | #16  | New session info HTTP endpoints                     | Medium |
 | B2    | [Session Termination](./07-session-termination.md)           | #7   | Idempotent `_sandboxagent/session/terminate`         | Medium |
 | B3    | [Error Termination Metadata](./17-error-termination-metadata.md) | #17  | Stderr capture + `_sandboxagent/session/ended` event | Medium |

--- a/research/acp/old-rest-openapi-list.md
+++ b/research/acp/old-rest-openapi-list.md
@ -17,16 +17,16 @@
 | /v1/fs/stat | UNIMPLEMENTED |
 | /v1/fs/upload-batch | UNIMPLEMENTED |
 | /v1/health | UNIMPLEMENTED |
-| /v1/sessions | session/list (UNSTABLE) |
-| /v1/sessions/{session_id} | session/new \| session/load \| session/resume (UNSTABLE) |
-| /v1/sessions/{session_id}/events | UNIMPLEMENTED |
-| /v1/sessions/{session_id}/events/sse | session/update (notification stream) |
-| /v1/sessions/{session_id}/messages | session/prompt |
-| /v1/sessions/{session_id}/messages/stream | session/prompt + session/update notifications |
-| /v1/sessions/{session_id}/permissions/{permission_id}/reply | session/request_permission response |
-| /v1/sessions/{session_id}/questions/{question_id}/reject | UNIMPLEMENTED |
-| /v1/sessions/{session_id}/questions/{question_id}/reply | UNIMPLEMENTED |
-| /v1/sessions/{session_id}/terminate | session/cancel (turn cancellation only) |
+| legacy session list route | session/list (UNSTABLE) |
+| legacy session create/load/resume route | session/new \| session/load \| session/resume (UNSTABLE) |
+| legacy session events polling route | UNIMPLEMENTED |
+| legacy session events SSE route | session/update (notification stream) |
+| legacy session prompt route | session/prompt |
+| legacy session prompt + stream route | session/prompt + session/update notifications |
+| legacy permission reply route | session/request_permission response |
+| legacy question reject route | UNIMPLEMENTED |
+| legacy question reply route | UNIMPLEMENTED |
+| legacy session terminate route | session/cancel (turn cancellation only) |
 | AgentCapabilities | initialize.result.agentCapabilities |
 | AgentCapabilities.commandExecution | UNIMPLEMENTED |
 | AgentCapabilities.errorEvents | UNIMPLEMENTED |
@ -427,7 +427,7 @@

 - `UNIMPLEMENTED` means there is no ACP-standard field/method with equivalent semantics in `schema.unstable.json`; implementation would require ACP extension methods (`_...`) and/or `_meta` payloads.
 - Rows mapped to `_meta[...]` are ACP-compatible extensions, not standard interoperable ACP fields; both sides must agree on names and semantics.
- Legacy event polling (`/v1/sessions/{session_id}/events`) has no ACP equivalent; ACP is stream-first via `session/update` notifications over streamable HTTP.
+- Legacy event polling has no ACP equivalent; ACP is stream-first via `session/update` notifications over streamable HTTP.
 - Session lifecycle differs: ACP has `session/new`, `session/load`, `session/resume` (UNSTABLE), and `session/fork` (UNSTABLE), but no standard explicit "close session" method.
 - Permission handling is request/response (`session/request_permission`) tied to JSON-RPC request IDs; it does not use standalone REST reply endpoints.
 - Question/answer HITL flow in the old schema has no standard ACP equivalent today (separate from permission prompts).
--- a/research/acp/spec.md
+++ b/research/acp/spec.md
@ -233,8 +233,6 @@ Non-ACP endpoints retained in v1:
 - `GET /v1/health`
 - `GET /v1/agents` (capabilities + install status)
 - `POST /v1/agents/{agent}/install`
- `GET /v1/sessions`
- `GET /v1/sessions/{id}`
 - `GET /v1/fs/file`
 - `PUT /v1/fs/file`
 - `POST /v1/fs/upload-batch`
--- a/research/acp/v1-schema-to-acp-mapping.md
+++ b/research/acp/v1-schema-to-acp-mapping.md
@ -54,16 +54,16 @@ Extension namespace used in this spec:
 | `POST /v1/fs/move` | `POST /v1/fs/move` | HTTP platform API | Port v1 behavior. |
 | `GET /v1/fs/stat` | `GET /v1/fs/stat` | HTTP platform API | Port v1 behavior. |
 | `POST /v1/fs/upload-batch` | `POST /v1/fs/upload-batch` | HTTP platform API | Tar upload/extract behavior from v1. |
-| `GET /v1/sessions` | `GET /v1/sessions` | HTTP control-plane | Session inventory without ACP connection requirement. |
-| `POST /v1/sessions/{session_id}` | `session/new` | Standard | Path `session_id` becomes alias in `_meta["sandboxagent.dev"].requestedSessionId`. |
-| `POST /v1/sessions/{session_id}/messages` | `session/prompt` | Standard | Asynchronous behavior comes from transport (request + stream). |
-| `POST /v1/sessions/{session_id}/messages/stream` | `session/prompt` + consume `session/update` on SSE | Standard | Streaming is transport-level, not a distinct ACP method. |
-| `POST /v1/sessions/{session_id}/terminate` | `_sandboxagent/session/terminate` | Extension | Idempotent termination semantics distinct from `DELETE /v1/rpc`. |
-| `GET /v1/sessions/{session_id}/events` | `_sandboxagent/session/events` (poll view over ACP stream) | Extension | Optional compatibility helper; canonical v1 is stream consumption. |
-| `GET /v1/sessions/{session_id}/events/sse` | `GET /v1/rpc` SSE stream | Standard transport | Filter by sessionId client-side or via connection/session binding. |
-| `POST /v1/sessions/{session_id}/permissions/{permission_id}/reply` | JSON-RPC response to pending `session/request_permission` request id | Standard | Bridge `permission_id` to request `id` in transport state. |
-| `POST /v1/sessions/{session_id}/questions/{question_id}/reply` | JSON-RPC response to pending `_sandboxagent/session/request_question` | Extension | ACP stable has no generic question/HITL request method. |
-| `POST /v1/sessions/{session_id}/questions/{question_id}/reject` | JSON-RPC response to pending `_sandboxagent/session/request_question` | Extension | Encode rejection in response outcome. |
+| legacy session list route | session/list | HTTP control-plane | Session inventory without ACP connection requirement. |
+| legacy session create route | `session/new` | Standard | Path `session_id` becomes alias in `_meta["sandboxagent.dev"].requestedSessionId`. |
+| legacy session prompt route | `session/prompt` | Standard | Asynchronous behavior comes from transport (request + stream). |
+| legacy session prompt + stream route | `session/prompt` + consume `session/update` on SSE | Standard | Streaming is transport-level, not a distinct ACP method. |
+| legacy session terminate route | `_sandboxagent/session/terminate` | Extension | Idempotent termination semantics distinct from `DELETE /v1/rpc`. |
+| legacy event polling route | `_sandboxagent/session/events` (poll view over ACP stream) | Extension | Optional compatibility helper; canonical v1 is stream consumption. |
+| legacy event SSE route | `GET /v1/rpc` SSE stream | Standard transport | Filter by sessionId client-side or via connection/session binding. |
+| legacy permission reply route | JSON-RPC response to pending `session/request_permission` request id | Standard | Bridge `permission_id` to request `id` in transport state. |
+| legacy question reply route | JSON-RPC response to pending `_sandboxagent/session/request_question` | Extension | ACP stable has no generic question/HITL request method. |
+| legacy question reject route | JSON-RPC response to pending `_sandboxagent/session/request_question` | Extension | Encode rejection in response outcome. |

 ### 3.1 `CreateSessionRequest` field mapping

--- a/scripts/release/update_version.ts
+++ b/scripts/release/update_version.ts
@ -45,7 +45,6 @@ const VERSION_REFERENCE_FILES = [
  "scripts/release/main.ts",
  "scripts/release/promote-artifacts.ts",
  "scripts/release/sdk.ts",
-  "scripts/sandbox-testing/test-sandbox.ts",
 ];

 export async function updateVersion(opts: ReleaseOpts) {
@ -148,7 +147,7 @@ async function updateVersionReferences(opts: ReleaseOpts, oldVersion: string, ol

    const original = content;

-    // Replace minor channel references (e.g. sandbox-agent@0.3.x -> sandbox-agent@0.4.x)
+    // Replace minor channel references (e.g. sandbox-agent@0.5.x -> sandbox-agent@0.5.x)
    content = content.replaceAll(`sandbox-agent@${oldMinorChannel}`, `sandbox-agent@${newMinorChannel}`);
    content = content.replaceAll(`@sandbox-agent/cli@${oldMinorChannel}`, `@sandbox-agent/cli@${newMinorChannel}`);
    content = content.replaceAll(`@sandbox-agent/react@${oldMinorChannel}`, `@sandbox-agent/react@${newMinorChannel}`);
@ -156,6 +155,13 @@ async function updateVersionReferences(opts: ReleaseOpts, oldVersion: string, ol
    // Replace install script URL channel
    content = content.replaceAll(`releases.rivet.dev/sandbox-agent/${oldMinorChannel}/`, `releases.rivet.dev/sandbox-agent/${newMinorChannel}/`);

+    // If references drifted (for example Cargo.toml version was bumped without updating docs),
+    // normalize any other pinned minor-channel references to the release's channel.
+    content = content.replaceAll(/sandbox-agent@0\.\d+\.x/g, `sandbox-agent@${newMinorChannel}`);
+    content = content.replaceAll(/@sandbox-agent\/cli@0\.\d+\.x/g, `@sandbox-agent/cli@${newMinorChannel}`);
+    content = content.replaceAll(/@sandbox-agent\/react@0\.\d+\.x/g, `@sandbox-agent/react@${newMinorChannel}`);
+    content = content.replaceAll(/releases\.rivet\.dev\/sandbox-agent\/0\.\d+\.x\//g, `releases.rivet.dev/sandbox-agent/${newMinorChannel}/`);
+
    // Replace Docker image tags (rivetdev/sandbox-agent:<anything>-full -> rivetdev/sandbox-agent:<version>-full)
    content = content.replaceAll(
      new RegExp(`rivetdev/sandbox-agent:[0-9]+\\.[0-9]+\\.[0-9]+(?:-[a-zA-Z0-9.]+)?-full`, "g"),
@ -174,7 +180,7 @@ async function updateVersionReferences(opts: ReleaseOpts, oldVersion: string, ol
  }

  if (modifiedFiles.length > 0) {
-    await $({ cwd: opts.root })`git add ${modifiedFiles}`;
+    await $({ cwd: opts.root })`git add -f ${modifiedFiles}`;
    console.log(`\nUpdated ${modifiedFiles.length} files with version references.`);
  } else {
    console.log(`\nNo version reference files needed updates.`);
--- a/scripts/sandbox-testing/package.json
+++ b/scripts/sandbox-testing/package.json
@ -1,21 +0,0 @@
-{
-  "name": "@sandbox-agent/testing",
-  "private": true,
-  "type": "module",
-  "scripts": {
-    "test": "tsx test-sandbox.ts",
-    "test:docker": "tsx test-sandbox.ts docker",
-    "test:daytona": "tsx test-sandbox.ts daytona",
-    "test:mock": "tsx test-sandbox.ts docker --agent=mock",
-    "test:verbose": "tsx test-sandbox.ts docker --verbose"
-  },
-  "dependencies": {
-    "@daytonaio/sdk": "latest",
-    "@e2b/code-interpreter": "latest"
-  },
-  "devDependencies": {
-    "@types/node": "latest",
-    "tsx": "latest",
-    "typescript": "latest"
-  }
-}
--- a/scripts/sandbox-testing/test-sandbox.ts
+++ b/scripts/sandbox-testing/test-sandbox.ts
@ -1,720 +0,0 @@
-#!/usr/bin/env npx tsx
-/**
- * Sandbox Testing Script
- *
- * Tests sandbox-agent on various cloud sandbox providers.
- * Usage: npx tsx test-sandbox.ts [provider] [options]
- *
- * Providers: daytona, e2b, docker
- *
- * Options:
- *   --skip-build          Skip cargo build step
- *   --use-release         Use pre-built release binary from releases.rivet.dev
- *   --agent <name>        Test specific agent (claude, codex, mock)
- *   --skip-agent-install  Skip pre-installing agents (tests on-demand install like Daytona example)
- *   --keep-alive          Don't cleanup sandbox after test
- *   --verbose             Show all logs
- */
-
-import { execSync, spawn } from "node:child_process";
-import { existsSync, readFileSync, mkdtempSync, writeFileSync, rmSync } from "node:fs";
-import { homedir, tmpdir } from "node:os";
-import { join, dirname } from "node:path";
-import { fileURLToPath } from "node:url";
-
-const __dirname = dirname(fileURLToPath(import.meta.url));
-const ROOT_DIR = join(__dirname, "../..");
-const SERVER_DIR = join(ROOT_DIR, "server");
-
-// Parse args
-const args = process.argv.slice(2);
-const provider = args.find((a) => !a.startsWith("--")) || "docker";
-const skipBuild = args.includes("--skip-build");
-const useRelease = args.includes("--use-release");
-const skipAgentInstall = args.includes("--skip-agent-install");
-const keepAlive = args.includes("--keep-alive");
-const verbose = args.includes("--verbose");
-const agentArg = args.find((a) => a.startsWith("--agent="))?.split("=")[1];
-
-// Colors
-const log = {
-  info: (msg: string) => console.log(`\x1b[34m[INFO]\x1b[0m ${msg}`),
-  success: (msg: string) => console.log(`\x1b[32m[OK]\x1b[0m ${msg}`),
-  error: (msg: string) => console.log(`\x1b[31m[ERROR]\x1b[0m ${msg}`),
-  warn: (msg: string) => console.log(`\x1b[33m[WARN]\x1b[0m ${msg}`),
-  debug: (msg: string) => verbose && console.log(`\x1b[90m[DEBUG]\x1b[0m ${msg}`),
-  section: (msg: string) => console.log(`\n\x1b[1m=== ${msg} ===\x1b[0m`),
-};
-
-// Credentials extraction using sandbox-agent CLI
-function extractCredentials(): { anthropicApiKey?: string; openaiApiKey?: string } {
-  // First check environment variables
-  const envCreds = {
-    anthropicApiKey: process.env.ANTHROPIC_API_KEY,
-    openaiApiKey: process.env.OPENAI_API_KEY,
-  };
-
-  // If both are set in env, use them
-  if (envCreds.anthropicApiKey && envCreds.openaiApiKey) {
-    return envCreds;
-  }
-
-  // Try to extract using sandbox-agent CLI
-  try {
-    const binaryPath = join(ROOT_DIR, "target/release/sandbox-agent");
-    const debugBinaryPath = join(ROOT_DIR, "target/debug/sandbox-agent");
-    const binary = existsSync(binaryPath) ? binaryPath : existsSync(debugBinaryPath) ? debugBinaryPath : null;
-
-    if (binary) {
-      const output = execSync(`${binary} credentials extract-env --export`, {
-        encoding: "utf-8",
-        stdio: ["pipe", "pipe", "pipe"],
-      });
-
-      // Parse export statements: export KEY="value"
-      for (const line of output.split("\n")) {
-        const match = line.match(/^export (\w+)="(.*)"/);
-        if (match) {
-          const [, key, value] = match;
-          if (key === "ANTHROPIC_API_KEY" && !envCreds.anthropicApiKey) {
-            envCreds.anthropicApiKey = value;
-          } else if (key === "OPENAI_API_KEY" && !envCreds.openaiApiKey) {
-            envCreds.openaiApiKey = value;
-          }
-        }
-      }
-      log.debug(`Extracted credentials via sandbox-agent CLI`);
-    }
-  } catch (err) {
-    log.debug(`Failed to extract credentials via CLI: ${err}`);
-  }
-
-  return envCreds;
-}
-
-function getAnthropicApiKey(): string | undefined {
-  return extractCredentials().anthropicApiKey;
-}
-
-function getOpenAiApiKey(): string | undefined {
-  return extractCredentials().openaiApiKey;
-}
-
-// Build sandbox-agent
-async function buildSandboxAgent(): Promise<string> {
-  log.section("Building sandbox-agent");
-
-  if (useRelease) {
-    log.info("Using pre-built release from releases.rivet.dev");
-    return "RELEASE";
-  }
-
-  // Binary is in workspace root target dir, not server target dir
-  const binaryPath = join(ROOT_DIR, "target/release/sandbox-agent");
-
-  if (skipBuild) {
-    if (!existsSync(binaryPath)) {
-      throw new Error(`Binary not found at ${binaryPath}. Run without --skip-build.`);
-    }
-    log.info(`Using existing binary: ${binaryPath}`);
-    return binaryPath;
-  }
-
-  log.info("Running cargo build --release...");
-  try {
-    execSync("cargo build --release -p sandbox-agent", {
-      cwd: ROOT_DIR,
-      stdio: verbose ? "inherit" : "pipe",
-    });
-    log.success(`Built: ${binaryPath}`);
-    return binaryPath;
-  } catch (err) {
-    throw new Error(`Build failed: ${err}`);
-  }
-}
-
-// Provider interface
-interface SandboxProvider {
-  name: string;
-  requiredEnv: string[];
-  create(opts: { envVars: Record<string, string> }): Promise<Sandbox>;
-}
-
-interface Sandbox {
-  id: string;
-  exec(cmd: string): Promise<{ stdout: string; stderr: string; exitCode: number }>;
-  upload(localPath: string, remotePath: string): Promise<void>;
-  getBaseUrl(port: number): Promise<string>;
-  cleanup(): Promise<void>;
-}
-
-// Docker provider
-// Uses Ubuntu because Claude Code and sandbox-agent are glibc binaries
-const dockerProvider: SandboxProvider = {
-  name: "docker",
-  requiredEnv: [],
-  async create({ envVars }) {
-    const id = `sandbox-test-${Date.now()}`;
-    const envArgs = Object.entries(envVars)
-      .map(([k, v]) => `-e ${k}=${v}`)
-      .join(" ");
-
-    log.info(`Creating Docker container: ${id}`);
-    execSync(`docker run -d --name ${id} ${envArgs} -p 0:3000 ubuntu:22.04 tail -f /dev/null`, { stdio: verbose ? "inherit" : "pipe" });
-
-    // Install dependencies
-    execSync(`docker exec ${id} sh -c "apt-get update && apt-get install -y curl ca-certificates"`, {
-      stdio: verbose ? "inherit" : "pipe",
-    });
-
-    return {
-      id,
-      async exec(cmd) {
-        try {
-          const stdout = execSync(`docker exec ${id} sh -c "${cmd.replace(/"/g, '\\"')}"`, {
-            encoding: "utf-8",
-            stdio: ["pipe", "pipe", "pipe"],
-          });
-          return { stdout, stderr: "", exitCode: 0 };
-        } catch (err: any) {
-          return { stdout: err.stdout || "", stderr: err.stderr || "", exitCode: err.status || 1 };
-        }
-      },
-      async upload(localPath, remotePath) {
-        execSync(`docker cp "${localPath}" ${id}:${remotePath}`, { stdio: verbose ? "inherit" : "pipe" });
-        execSync(`docker exec ${id} chmod +x ${remotePath}`, { stdio: verbose ? "inherit" : "pipe" });
-      },
-      async getBaseUrl(port) {
-        const portMapping = execSync(`docker port ${id} ${port}`, { encoding: "utf-8" }).trim();
-        const hostPort = portMapping.split(":").pop();
-        return `http://localhost:${hostPort}`;
-      },
-      async cleanup() {
-        log.info(`Cleaning up container: ${id}`);
-        execSync(`docker rm -f ${id}`, { stdio: "pipe" });
-      },
-    };
-  },
-};
-
-// Daytona provider
-const daytonaProvider: SandboxProvider = {
-  name: "daytona",
-  requiredEnv: ["DAYTONA_API_KEY"],
-  async create({ envVars }) {
-    const { Daytona } = await import("@daytonaio/sdk");
-    const daytona = new Daytona();
-
-    log.info("Creating Daytona sandbox...");
-    // NOTE: Tier 1/2 sandboxes have restricted network that cannot be overridden
-    // networkAllowList requires CIDR notation (IP ranges), not domain names
-    const sandbox = await daytona.create({
-      image: "ubuntu:22.04",
-      envVars,
-    });
-    const id = sandbox.id;
-
-    // Install curl
-    await sandbox.process.executeCommand("apt-get update && apt-get install -y curl ca-certificates");
-
-    return {
-      id,
-      async exec(cmd) {
-        const result = await sandbox.process.executeCommand(cmd);
-        // Daytona SDK returns: { exitCode, result: string, artifacts: { stdout: string } }
-        return {
-          stdout: result.result || "",
-          stderr: "",
-          exitCode: result.exitCode ?? 0,
-        };
-      },
-      async upload(localPath, remotePath) {
-        const content = readFileSync(localPath);
-        // Daytona SDK signature: uploadFile(Buffer, remotePath)
-        await sandbox.fs.uploadFile(content, remotePath);
-        await sandbox.process.executeCommand(`chmod +x ${remotePath}`);
-      },
-      async getBaseUrl(port) {
-        const preview = await sandbox.getSignedPreviewUrl(port, 4 * 60 * 60);
-        return preview.url;
-      },
-      async cleanup() {
-        log.info(`Cleaning up Daytona sandbox: ${id}`);
-        await sandbox.delete(60);
-      },
-    };
-  },
-};
-
-// E2B provider
-const e2bProvider: SandboxProvider = {
-  name: "e2b",
-  requiredEnv: ["E2B_API_KEY"],
-  async create({ envVars }) {
-    const { Sandbox } = await import("@e2b/code-interpreter");
-
-    log.info("Creating E2B sandbox...");
-    let sandbox;
-    try {
-      sandbox = await Sandbox.create({
-        allowInternetAccess: true,
-        envs: envVars,
-      });
-    } catch (err: any) {
-      log.error(`E2B sandbox creation failed: ${err.message || err}`);
-      throw err;
-    }
-    const id = sandbox.sandboxId;
-
-    // Install curl (E2B uses Debian which has glibc, sandbox-agent will auto-detect)
-    const installResult = await sandbox.commands.run("sudo apt-get update && sudo apt-get install -y curl ca-certificates");
-    log.debug(`Install output: ${installResult.stdout} ${installResult.stderr}`);
-
-    return {
-      id,
-      async exec(cmd) {
-        const result = await sandbox.commands.run(cmd);
-        return {
-          stdout: result.stdout || "",
-          stderr: result.stderr || "",
-          exitCode: result.exitCode,
-        };
-      },
-      async upload(localPath, remotePath) {
-        const content = readFileSync(localPath);
-        await sandbox.files.write(remotePath, content);
-        await sandbox.commands.run(`chmod +x ${remotePath}`);
-      },
-      async getBaseUrl(port) {
-        return `https://${sandbox.getHost(port)}`;
-      },
-      async cleanup() {
-        log.info(`Cleaning up E2B sandbox: ${id}`);
-        await sandbox.kill();
-      },
-    };
-  },
-};
-
-// Get provider
-function getProvider(name: string): SandboxProvider {
-  switch (name) {
-    case "docker":
-      return dockerProvider;
-    case "daytona":
-      return daytonaProvider;
-    case "e2b":
-      return e2bProvider;
-    default:
-      throw new Error(`Unknown provider: ${name}. Available: docker, daytona, e2b`);
-  }
-}
-
-// Install sandbox-agent in sandbox
-async function installSandboxAgent(sandbox: Sandbox, binaryPath: string): Promise<void> {
-  log.section("Installing sandbox-agent");
-
-  if (binaryPath === "RELEASE") {
-    log.info("Installing from releases.rivet.dev...");
-    const result = await sandbox.exec("curl -fsSL https://releases.rivet.dev/sandbox-agent/0.3.x/install.sh | sh");
-    log.debug(`Install output: ${result.stdout}`);
-    if (result.exitCode !== 0) {
-      throw new Error(`Install failed: ${result.stderr}`);
-    }
-  } else {
-    log.info(`Uploading local binary: ${binaryPath}`);
-    await sandbox.upload(binaryPath, "/usr/local/bin/sandbox-agent");
-  }
-
-  // Verify installation
-  const version = await sandbox.exec("sandbox-agent --version");
-  log.success(`Installed: ${version.stdout.trim()}`);
-}
-
-// Install agents
-async function installAgents(sandbox: Sandbox, agents: string[]): Promise<void> {
-  log.section("Installing agents");
-
-  for (const agent of agents) {
-    log.info(`Installing ${agent}...`);
-
-    if (agent === "claude" || agent === "codex") {
-      const result = await sandbox.exec(`sandbox-agent install-agent ${agent}`);
-      if (result.exitCode !== 0) throw new Error(`Failed to install ${agent}: ${result.stderr}`);
-      log.success(`Installed ${agent}`);
-    } else if (agent === "mock") {
-      // Mock agent is built into sandbox-agent, no install needed
-      log.info("Mock agent is built-in, skipping install");
-    }
-  }
-}
-
-// Start server and check health
-async function startServerAndCheckHealth(sandbox: Sandbox): Promise<string> {
-  log.section("Starting server");
-
-  // Start server in background
-  await sandbox.exec("nohup sandbox-agent server --no-token --host 0.0.0.0 --port 3000 >/tmp/sandbox-agent.log 2>&1 &");
-  log.info("Server started in background");
-
-  // Get base URL
-  const baseUrl = await sandbox.getBaseUrl(3000);
-  log.info(`Base URL: ${baseUrl}`);
-
-  // Wait for health
-  log.info("Waiting for health check...");
-  for (let i = 0; i < 30; i++) {
-    try {
-      const response = await fetch(`${baseUrl}/v1/health`);
-      if (response.ok) {
-        const data = await response.json();
-        if (data.status === "ok") {
-          log.success("Health check passed!");
-          return baseUrl;
-        }
-      }
-    } catch {}
-    await new Promise((r) => setTimeout(r, 1000));
-  }
-
-  // Show logs on failure
-  const logs = await sandbox.exec("cat /tmp/sandbox-agent.log");
-  log.error("Server logs:\n" + logs.stdout);
-  throw new Error("Health check failed after 30 seconds");
-}
-
-// Send a message and wait for response, auto-approving permissions
-// Returns the response text
-async function sendMessage(baseUrl: string, sessionId: string, message: string): Promise<string> {
-  log.info(`Sending message: "${message.slice(0, 60)}${message.length > 60 ? "..." : ""}"`);
-  const msgRes = await fetch(`${baseUrl}/v1/sessions/${sessionId}/messages/stream`, {
-    method: "POST",
-    headers: { "Content-Type": "application/json" },
-    body: JSON.stringify({ message }),
-  });
-  if (!msgRes.ok || !msgRes.body) {
-    throw new Error(`Failed to send message: ${await msgRes.text()}`);
-  }
-
-  // Process SSE stream
-  const reader = msgRes.body.getReader();
-  const decoder = new TextDecoder();
-  let buffer = "";
-  let responseText = "";
-  let receivedText = false;
-  let hasError = false;
-  let errorMessage = "";
-  let pendingPermission: string | null = null;
-
-  while (true) {
-    const { done, value } = await reader.read();
-    if (done) break;
-
-    buffer += decoder.decode(value, { stream: true });
-    const lines = buffer.split("\n");
-    buffer = lines.pop() || "";
-
-    for (const line of lines) {
-      if (!line.startsWith("data: ")) continue;
-      const data = line.slice(6);
-      if (data === "[DONE]") continue;
-
-      try {
-        const event = JSON.parse(data);
-        log.debug(`Event: ${event.type}`);
-
-        if (event.type === "item.delta") {
-          const delta = event.data?.delta;
-          const text = typeof delta === "string" ? delta : delta?.text || "";
-          if (text) {
-            if (!receivedText) {
-              log.info("Receiving response...");
-              receivedText = true;
-            }
-            process.stdout.write(text);
-            responseText += text;
-          }
-        }
-
-        // Handle permission requests - auto-approve
-        if (event.type === "permission.requested") {
-          const permissionId = event.data?.permission_id;
-          if (permissionId) {
-            pendingPermission = permissionId;
-            log.info(`Permission requested (${permissionId}), auto-approving...`);
-          }
-        }
-
-        if (event.type === "error") {
-          hasError = true;
-          errorMessage = event.data?.message || JSON.stringify(event.data);
-          log.error(`Error event: ${errorMessage}`);
-        }
-
-        if (event.type === "agent.unparsed") {
-          hasError = true;
-          errorMessage = `Agent unparsed: ${JSON.stringify(event.data)}`;
-          log.error(errorMessage);
-        }
-      } catch {}
-    }
-
-    // If we have a pending permission, approve it
-    if (pendingPermission) {
-      const permId = pendingPermission;
-      pendingPermission = null;
-      try {
-        const approveRes = await fetch(`${baseUrl}/v1/sessions/${sessionId}/permissions/${permId}/reply`, {
-          method: "POST",
-          headers: { "Content-Type": "application/json" },
-          body: JSON.stringify({ reply: "once" }),
-        });
-        if (approveRes.ok) {
-          log.success(`Permission ${permId} approved`);
-        } else {
-          log.warn(`Failed to approve permission: ${await approveRes.text()}`);
-        }
-      } catch (err) {
-        log.warn(`Error approving permission: ${err}`);
-      }
-    }
-  }
-
-  if (receivedText) {
-    console.log(); // newline after response
-  }
-
-  if (hasError) {
-    throw new Error(`Agent returned error: ${errorMessage}`);
-  }
-
-  return responseText;
-}
-
-// Test agent interaction
-async function testAgent(baseUrl: string, agent: string, message: string): Promise<void> {
-  log.section(`Testing ${agent} agent`);
-
-  const sessionId = crypto.randomUUID();
-
-  // Create session
-  log.info(`Creating session ${sessionId}...`);
-  const createRes = await fetch(`${baseUrl}/v1/sessions/${sessionId}`, {
-    method: "POST",
-    headers: { "Content-Type": "application/json" },
-    body: JSON.stringify({ agent }),
-  });
-  if (!createRes.ok) {
-    throw new Error(`Failed to create session: ${await createRes.text()}`);
-  }
-  log.success("Session created");
-
-  const response = await sendMessage(baseUrl, sessionId, message);
-  if (!response) {
-    throw new Error("No response received from agent");
-  }
-  log.success("Received response from agent");
-}
-
-// Test that agent can actually modify files and run commands
-async function testAgentActions(baseUrl: string, agent: string, sandbox: Sandbox): Promise<void> {
-  log.section(`Testing ${agent} agent actions (file + command)`);
-
-  const sessionId = crypto.randomUUID();
-  const testFile = "/tmp/sandbox-test-file.txt";
-  const expectedContent = "Hello from sandbox test!";
-
-  // For Claude running as root in containers, we must use default permission mode
-  // and handle permissions via the API (bypass mode is not supported as root).
-  // For other agents, we can use bypass mode.
-  const permissionMode = agent === "claude" ? "default" : "bypass";
-  log.info(`Creating session ${sessionId} with permissionMode=${permissionMode}...`);
-  const createRes = await fetch(`${baseUrl}/v1/sessions/${sessionId}`, {
-    method: "POST",
-    headers: { "Content-Type": "application/json" },
-    body: JSON.stringify({ agent, permissionMode }),
-  });
-  if (!createRes.ok) {
-    throw new Error(`Failed to create session: ${await createRes.text()}`);
-  }
-  log.success("Session created");
-
-  // Ask agent to create a file
-  const fileMessage = `Create a file at ${testFile} with exactly this content (no quotes, no extra text): ${expectedContent}`;
-  await sendMessage(baseUrl, sessionId, fileMessage);
-
-  // Wait for agent to complete action after permission approval
-  log.info("Waiting for agent to complete action...");
-  await new Promise((r) => setTimeout(r, 5000));
-
-  // Verify file was created
-  log.info("Verifying file was created...");
-  const fileCheck = await sandbox.exec(`cat ${testFile} 2>&1`);
-  if (fileCheck.exitCode !== 0) {
-    throw new Error(`File was not created: ${fileCheck.stderr || fileCheck.stdout}`);
-  }
-  if (!fileCheck.stdout.includes("Hello from sandbox test")) {
-    throw new Error(`File content mismatch. Expected "${expectedContent}", got "${fileCheck.stdout.trim()}"`);
-  }
-  log.success(`File created with correct content: "${fileCheck.stdout.trim()}"`);
-
-  // Ask agent to run a command and create output
-  const cmdMessage = `Run this command and tell me the output: echo "command-test-$(date +%s)" > /tmp/cmd-output.txt && cat /tmp/cmd-output.txt`;
-  await sendMessage(baseUrl, sessionId, cmdMessage);
-
-  // Verify command was executed
-  log.info("Verifying command was executed...");
-  const cmdCheck = await sandbox.exec("cat /tmp/cmd-output.txt 2>&1");
-  if (cmdCheck.exitCode !== 0) {
-    throw new Error(`Command output file not found: ${cmdCheck.stderr || cmdCheck.stdout}`);
-  }
-  if (!cmdCheck.stdout.includes("command-test-")) {
-    throw new Error(`Command output mismatch. Expected "command-test-*", got "${cmdCheck.stdout.trim()}"`);
-  }
-  log.success(`Command executed successfully: "${cmdCheck.stdout.trim()}"`);
-}
-
-// Check environment diagnostics
-async function checkEnvironment(sandbox: Sandbox): Promise<void> {
-  log.section("Environment diagnostics");
-
-  const checks = [
-    { name: "Environment variables", cmd: "env | grep -E 'ANTHROPIC|OPENAI|CLAUDE|CODEX' | sed 's/=.*/=<set>/'" },
-    // Check both /root (Alpine) and /home/user (E2B/Debian) paths
-    {
-      name: "Agent binaries",
-      cmd: "ls -la ~/.local/share/sandbox-agent/bin/ 2>/dev/null || ls -la /root/.local/share/sandbox-agent/bin/ 2>/dev/null || ls -la /home/user/.local/share/sandbox-agent/bin/ 2>/dev/null || echo 'No agents installed'",
-    },
-    {
-      name: "Claude version",
-      cmd: "~/.local/share/sandbox-agent/bin/claude --version 2>&1 || /root/.local/share/sandbox-agent/bin/claude --version 2>&1 || echo 'Claude not installed'",
-    },
-    { name: "sandbox-agent version", cmd: "sandbox-agent --version 2>/dev/null || echo 'Not installed'" },
-    { name: "Server process", cmd: "pgrep -a sandbox-agent 2>/dev/null || ps aux | grep sandbox-agent | grep -v grep || echo 'Not running'" },
-    { name: "Server logs (last 50 lines)", cmd: "tail -50 /tmp/sandbox-agent.log 2>/dev/null || echo 'No logs'" },
-    {
-      name: "Network: api.anthropic.com",
-      cmd: "curl -s -o /dev/null -w '%{http_code}' --connect-timeout 5 https://api.anthropic.com/v1/messages 2>&1 || echo 'UNREACHABLE'",
-    },
-    {
-      name: "Network: api.openai.com",
-      cmd: "curl -s -o /dev/null -w '%{http_code}' --connect-timeout 5 https://api.openai.com/v1/models 2>&1 || echo 'UNREACHABLE'",
-    },
-  ];
-
-  for (const { name, cmd } of checks) {
-    const result = await sandbox.exec(cmd);
-    console.log(`\n\x1b[1m${name}:\x1b[0m`);
-    console.log(result.stdout || "(empty)");
-    if (result.stderr) console.log(`stderr: ${result.stderr}`);
-  }
-}
-
-// Main
-async function main() {
-  log.section(`Sandbox Testing (provider: ${provider})`);
-
-  // Check credentials
-  const anthropicKey = getAnthropicApiKey();
-  const openaiKey = getOpenAiApiKey();
-
-  log.info(`Anthropic API key: ${anthropicKey ? "found" : "not found"}`);
-  log.info(`OpenAI API key: ${openaiKey ? "found" : "not found"}`);
-
-  // Determine which agents to test
-  let agents: string[];
-  if (agentArg) {
-    agents = [agentArg];
-  } else if (anthropicKey) {
-    agents = ["claude"];
-  } else if (openaiKey) {
-    agents = ["codex"];
-  } else {
-    agents = ["mock"];
-    log.warn("No API keys found, using mock agent only");
-  }
-  log.info(`Agents to test: ${agents.join(", ")}`);
-
-  // Get provider
-  const prov = getProvider(provider);
-
-  // Check required env vars
-  for (const envVar of prov.requiredEnv) {
-    if (!process.env[envVar]) {
-      throw new Error(`Missing required environment variable: ${envVar}`);
-    }
-  }
-
-  // Build
-  const binaryPath = await buildSandboxAgent();
-
-  // Create sandbox
-  log.section(`Creating ${prov.name} sandbox`);
-  const envVars: Record<string, string> = {};
-  if (anthropicKey) envVars.ANTHROPIC_API_KEY = anthropicKey;
-  if (openaiKey) envVars.OPENAI_API_KEY = openaiKey;
-
-  const sandbox = await prov.create({ envVars });
-  log.success(`Created sandbox: ${sandbox.id}`);
-
-  try {
-    // Install sandbox-agent
-    await installSandboxAgent(sandbox, binaryPath);
-
-    // Install agents (unless --skip-agent-install to test on-demand install like Daytona example)
-    if (skipAgentInstall) {
-      log.info("Skipping agent pre-install (testing on-demand installation)");
-    } else {
-      await installAgents(sandbox, agents);
-    }
-
-    // Check environment
-    await checkEnvironment(sandbox);
-
-    // Start server and check health
-    const baseUrl = await startServerAndCheckHealth(sandbox);
-
-    // Test each agent
-    for (const agent of agents) {
-      // Basic response test
-      const message = agent === "mock" ? "hello" : "Say hello in 10 words or less";
-      await testAgent(baseUrl, agent, message);
-
-      // For real agents, also test file/command actions with permission handling.
-      // Claude uses default permission mode and we auto-approve via API.
-      // Other agents can use bypass mode.
-      if (agent !== "mock") {
-        await testAgentActions(baseUrl, agent, sandbox);
-      }
-    }
-
-    log.section("All tests passed!");
-
-    if (keepAlive) {
-      log.info(`Sandbox ${sandbox.id} is still running. Press Ctrl+C to cleanup.`);
-      log.info(`Base URL: ${await sandbox.getBaseUrl(3000)}`);
-      await new Promise(() => {}); // Wait forever
-    }
-  } catch (err) {
-    log.error(`Test failed: ${err}`);
-
-    // Show diagnostics on failure
-    try {
-      await checkEnvironment(sandbox);
-    } catch {}
-
-    if (!keepAlive) {
-      await sandbox.cleanup();
-    }
-    process.exit(1);
-  }
-
-  if (!keepAlive) {
-    await sandbox.cleanup();
-  }
-}
-
-main().catch((err) => {
-  log.error(err.message || err);
-  process.exit(1);
-});
--- a/sdks/acp-http-client/package.json
+++ b/sdks/acp-http-client/package.json
@ -1,6 +1,6 @@
 {
  "name": "acp-http-client",
-  "version": "0.5.0-rc.1",
+  "version": "0.4.2",
  "description": "Protocol-faithful ACP JSON-RPC over streamable HTTP client.",
  "license": "Apache-2.0",
  "repository": {
--- a/sdks/cli-shared/package.json
+++ b/sdks/cli-shared/package.json
@ -1,6 +1,6 @@
 {
  "name": "@sandbox-agent/cli-shared",
-  "version": "0.5.0-rc.1",
+  "version": "0.4.2",
  "description": "Shared helpers for sandbox-agent CLI and SDK",
  "license": "Apache-2.0",
  "repository": {
--- a/sdks/cli/package.json
+++ b/sdks/cli/package.json
@ -1,6 +1,6 @@
 {
  "name": "@sandbox-agent/cli",
-  "version": "0.5.0-rc.1",
+  "version": "0.4.2",
  "description": "CLI for sandbox-agent - run AI coding agents in sandboxes",
  "license": "Apache-2.0",
  "repository": {
--- a/sdks/cli/platforms/darwin-arm64/package.json
+++ b/sdks/cli/platforms/darwin-arm64/package.json
@ -1,6 +1,6 @@
 {
  "name": "@sandbox-agent/cli-darwin-arm64",
-  "version": "0.5.0-rc.1",
+  "version": "0.4.2",
  "description": "sandbox-agent CLI binary for macOS ARM64",
  "license": "Apache-2.0",
  "repository": {
--- a/sdks/cli/platforms/darwin-x64/package.json
+++ b/sdks/cli/platforms/darwin-x64/package.json
@ -1,6 +1,6 @@
 {
  "name": "@sandbox-agent/cli-darwin-x64",
-  "version": "0.5.0-rc.1",
+  "version": "0.4.2",
  "description": "sandbox-agent CLI binary for macOS x64",
  "license": "Apache-2.0",
  "repository": {
--- a/sdks/cli/platforms/linux-arm64/package.json
+++ b/sdks/cli/platforms/linux-arm64/package.json
@ -1,6 +1,6 @@
 {
  "name": "@sandbox-agent/cli-linux-arm64",
-  "version": "0.5.0-rc.1",
+  "version": "0.4.2",
  "description": "sandbox-agent CLI binary for Linux arm64",
  "license": "Apache-2.0",
  "repository": {
--- a/sdks/cli/platforms/linux-x64/package.json
+++ b/sdks/cli/platforms/linux-x64/package.json
@ -1,6 +1,6 @@
 {
  "name": "@sandbox-agent/cli-linux-x64",
-  "version": "0.5.0-rc.1",
+  "version": "0.4.2",
  "description": "sandbox-agent CLI binary for Linux x64",
  "license": "Apache-2.0",
  "repository": {
--- a/sdks/cli/platforms/win32-x64/package.json
+++ b/sdks/cli/platforms/win32-x64/package.json
@ -1,6 +1,6 @@
 {
  "name": "@sandbox-agent/cli-win32-x64",
-  "version": "0.5.0-rc.1",
+  "version": "0.4.2",
  "description": "sandbox-agent CLI binary for Windows x64",
  "license": "Apache-2.0",
  "repository": {
--- a/sdks/gigacode/package.json
+++ b/sdks/gigacode/package.json
@ -1,6 +1,6 @@
 {
  "name": "@sandbox-agent/gigacode",
-  "version": "0.5.0-rc.1",
+  "version": "0.4.2",
  "description": "Gigacode CLI (sandbox-agent with OpenCode attach by default)",
  "license": "Apache-2.0",
  "repository": {
--- a/Show more
+++ b/Show more
Author	SHA1	Message	Date
Nathan Flurry	bf484e7c96	docs: clean up orphaned docs and add session event types Delete orphaned docs not in docs.json navigation (gigacode.mdx, foundry-self-hosting.mdx, session-transcript-schema.mdx, pi-support-plan.md). Remove outdated musl/glibc troubleshooting section. Add event types documentation with example payloads to agent-sessions.mdx. Co-Authored-By: Claude Opus 4.6 (1M context) <noreply@anthropic.com>	2026-03-25 19:11:19 -07:00
Nathan Flurry	d55b0dfb88	chore(release): update version to 0.4.2	2026-03-25 18:07:26 -07:00
ABC	251f731232	Merge pull request #284 from rivet-dev/03-25-fix_mock_pass_sandbox_agent_bin_to_mock_agent_launcher fix(mock): pass SANDBOX_AGENT_BIN to mock agent launcher	2026-03-25 17:00:51 -04:00
abcxff	b45989a082	fix(mock): pass SANDBOX_AGENT_BIN to mock agent launcher	2026-03-25 16:54:40 -04:00
Nathan Flurry	78e84281e8	chore(release): update version to 0.4.1	2026-03-25 13:20:57 -07:00
Nathan Flurry	5da35e6dfa	feat: sprites support	2026-03-25 12:23:14 -07:00
ABC	9cd9252725	Merge pull request #283 from rivet-dev/03-25-chore_providers_move_back_to_0.4.x_install_script chore(providers): sync install script with latest 0.4.x	2026-03-25 14:24:55 -04:00
abcxff	858b9a4d2f	chore(providers): move back to 0.4.x install script	2026-03-25 14:22:57 -04:00
Nathan Flurry	4fa28061e9	Merge pull request #279 from rivet-dev/NicholasKissel/docs-dark-theme fix(docs): restore dark theme styling	2026-03-24 23:26:28 -07:00
ABCxFF	cb42971b56	chore(release): update version to 0.5.0-rc.2	2026-03-25 05:13:47 +00:00
ABC	e9fabbfe64	fix: surface agent stderr in RPC errors & add defaultCwd param (#278 )	2026-03-25 00:49:35 -04:00
ABC	32dd5914ed	Merge pull request #269 from rivet-dev/e2b-base-image-support feat(providers): add base image support and improve forward compatibility	2026-03-25 00:42:49 -04:00
ABC	fe8fbfc91c	Merge branch 'main' into e2b-base-image-support	2026-03-25 00:37:58 -04:00
Nicholas Kissel	32713ff453	fix(docs): keep dark mode strict appearance Co-Authored-By: Claude Opus 4.6 <noreply@anthropic.com>	2026-03-24 21:33:10 -07:00
abcxff	833b57deb1	fix: surface agent stderr in RPC errors and default cwd for remote providers	2026-03-25 04:26:48 +00:00
Nicholas Kissel	927e77c7e2	fix(docs): restore dark theme styling with custom CSS Re-enable theme.css with full custom styling (links, inputs, cards, code blocks, alerts) and update docs.json color values. Co-Authored-By: Claude Opus 4.6 <noreply@anthropic.com>	2026-03-24 21:25:06 -07:00
Nathan Flurry	f353e39fc6	Merge pull request #273 from Crunchyman-ralph/fix/update-install-script-to-0.4.x fix: update install script URL from 0.3.x to 0.4.x	2026-03-19 12:45:00 -07:00
Ralph Khreish	3525dcc315	fix: update install script URL from 0.3.x to 0.4.x The E2B and Vercel providers install sandbox-agent 0.3.x inside sandboxes while the SDK client speaks 0.4.0 ACP protocol, causing AcpRpcError -32603. Fixes #272	2026-03-19 17:45:16 +01:00
Nathan Flurry	7b23e519c2	fix(foundry): add Bun idleTimeout safety net and subscription retry with backoff Bun.serve() defaults to a 10s idle timeout that can kill long-running requests. Actor RPCs go through the gateway tunnel with a 1s SSE ping, so this likely never fires, but set idleTimeout to 255 as a safety net. Subscription topics (app, org, session, task) previously had no retry mechanism. If the initial connection or a mid-session error occurred, the subscription stayed in error state permanently. Add exponential backoff retry (1s base, 30s max) that cleans up the old connection before each attempt and stops when disposed or no listeners remain. Co-Authored-By: Claude Opus 4.6 (1M context) <noreply@anthropic.com>	2026-03-17 18:35:36 -07:00
Nathan Flurry	bea3b58199	fix(foundry): use $HOME instead of hardcoded /home/sandbox for sandbox repo paths E2B sandboxes run as `user` (home: /home/user), not `sandbox`, so `mkdir -p /home/sandbox` fails with "Permission denied". Replace all hardcoded `/home/sandbox` paths with `$HOME` resolved at shell runtime inside the sandbox, and dynamically resolve the repo CWD via the sandbox actor so it works across providers (E2B, local Docker, Daytona). Co-Authored-By: Claude Opus 4.6 (1M context) <noreply@anthropic.com>	2026-03-17 17:33:53 -07:00
Nathan Flurry	524f40ec02	feat(providers): simplify modal to use published base image The `-full` base image already includes sandbox-agent and all agents pre-installed. Remove redundant apt-get, install script, and install-agent dockerfile commands from the Modal provider. Also allow overriding the default image via SANDBOX_AGENT_IMAGE env var across all providers for testing with different published versions. Co-Authored-By: Claude Opus 4.6 <noreply@anthropic.com>	2026-03-17 16:54:20 -07:00
Nathan Flurry	4e76038a0d	feat(providers): add base image support and improve forward compatibility Add support for configuring base images across all compute providers: - E2B: Accept optional `template` parameter to select custom templates - Modal: Accept optional `image` parameter (string or Image object) for base images - ComputeSDK: Expand `create` override to accept full CreateSandboxOptions payload (image, templateId, etc.) - Daytona: Improve type safety for `image` option Improve forward compatibility by making all `create` overrides accept full Partial SDK types, allowing any new provider fields to flow through without code changes. Fix Modal provider bug where `encryptedPorts` was hardcoded and would clobber user-provided values; now merges additional ports instead. Update docs and examples to demonstrate base image configuration for E2B, Modal, and ComputeSDK. Add comprehensive provider lifecycle tests for Modal and ComputeSDK, including template and image passthrough verification. Co-Authored-By: Claude Haiku 4.5 <noreply@anthropic.com>	2026-03-17 15:25:21 -07:00
Nathan Flurry	ffb9f1082b	fix(foundry): fix runner version	2026-03-17 14:33:13 -07:00