feat: add raw session args/opts for agent passthrough

2026-04-15 09:01:17 +00:00 · 2026-02-05 11:32:39 -08:00 · 2026-02-05 11:32:39 -08:00 · 2f26f76d9b
commit 2f26f76d9b
parent 375d73e4cb
14 changed files with 365 additions and 37 deletions
--- a/docs/openapi.json
+++ b/docs/openapi.json
@ -669,7 +669,9 @@
          "mcpTools",
          "streamingDeltas",
          "itemStarted",
-          "sharedProcess"
+          "sharedProcess",
          "rawSessionArgs",
          "rawSessionOptions"
        ],
        "properties": {
          "commandExecution": {
@ -702,6 +704,14 @@
          "questions": {
            "type": "boolean"
          },
          "rawSessionArgs": {
            "type": "boolean",
            "description": "Whether this agent supports raw CLI arguments passed at session creation"
          },
          "rawSessionOptions": {
            "type": "boolean",
            "description": "Whether this agent supports raw options passed at session creation"
          },
          "reasoning": {
            "type": "boolean"
          },
@ -1074,6 +1084,20 @@
          "variant": {
            "type": "string",
            "nullable": true
          },
          "rawSessionArgs": {
            "type": "array",
            "items": {
              "type": "string"
            },
            "nullable": true,
            "description": "Raw CLI arguments to pass to the agent (for CLI-based agents like Claude, OpenCode, Amp)"
          },
          "rawSessionOptions": {
            "type": "object",
            "additionalProperties": true,
            "nullable": true,
            "description": "Raw options to pass to the agent (for long-running server agents like Codex)"
          }
        }
      },
--- a/docs/sdks/typescript.mdx
+++ b/docs/sdks/typescript.mdx
@ -62,6 +62,26 @@ await client.createSession("demo-session", {
 await client.postMessage("demo-session", { message: "Hello" });
 ```
 ### Raw session arguments
 Pass low-level arguments directly to agents at session creation:
 ```ts
 // CLI args for Claude, OpenCode, Amp (not Codex)
 await client.createSession("my-session", {
  agent: "claude",
  rawSessionArgs: ["--max-turns", "5"],
 });
 // Options passed through agent's native protocol (long-running servers only)
 await client.createSession("my-session", {
  agent: "codex",
  rawSessionOptions: { sandbox: "workspace-write" },
 });
 ```
 Check `capabilities.rawSessionArgs` and `capabilities.rawSessionOptions` to see what each agent supports.
 List agents and inspect feature coverage (available on `capabilities`):
 ```ts
--- a/docs/session-transcript-schema.mdx
+++ b/docs/session-transcript-schema.mdx
@ -29,6 +29,8 @@ This table shows which agent feature coverage appears in the universal event str
 | File Changes       |   -    |   ✓   |      -       |      -       |
 | MCP Tools          |   -    |   ✓   |      -       |      -       |
 | Streaming Deltas   |   ✓    |   ✓   |      ✓       |      -       |
 | Raw Session Args   |   ✓    |       |      ✓       |      ✓       |
 | Raw Session Options|   ✓    |   ✓   |      ✓       |      ✓       |
 Agents: [Claude Code](https://docs.anthropic.com/en/docs/agents-and-tools/claude-code/overview) · [Codex](https://github.com/openai/codex) · [OpenCode](https://github.com/opencode-ai/opencode) · [Amp](https://ampcode.com)
@ -76,6 +78,12 @@ Agents: [Claude Code](https://docs.anthropic.com/en/docs/agents-and-tools/claude
  <Accordion title="Streaming Deltas">
    Native streaming of content deltas. When not supported, the daemon emits a single synthetic delta before `item.completed`.
  </Accordion>
  <Accordion title="Raw Session Args">
    Pass raw CLI arguments directly to the agent at session creation via `rawSessionArgs`. Only supported for CLI-based agents (Claude, OpenCode, Amp). Codex uses JSON-RPC, so CLI args are not applicable.
  </Accordion>
  <Accordion title="Raw Session Options">
    Pass raw options to the agent at session creation via `rawSessionOptions`. For long-running server agents, options are passed through the agent's native protocol. For Codex, options are merged into the `thread/start` config.
  </Accordion>
 </AccordionGroup>
 Want support for another agent? [Open an issue](https://github.com/rivet-dev/sandbox-agent/issues/new) to request it.
--- a/research/agents/amp.md
+++ b/research/agents/amp.md
@ -25,16 +25,32 @@ amp --print --output-format stream-json --dangerously-skip-permissions "prompt"
 amp --continue SESSION_ID "follow up"
 ```
-### Key CLI Flags
+### Custom Args (CLI Flags)
-| Flag | Description |
+#### Core Flags
-|------|-------------|
+
-| `--print` | Output mode (non-interactive) |
+| Flag | Type | Description |
-| `--output-format stream-json` | JSONL streaming output |
+|------|------|-------------|
-| `--dangerously-skip-permissions` | Skip permission prompts |
+| `--print` | bool | Output mode (non-interactive) |
-| `--continue SESSION_ID` | Resume existing session |
+| `--execute` | bool | Alternative output mode (some versions) |
-| `--model MODEL` | Specify model |
+| `--output-format stream-json` | string | JSONL streaming output |
-| `--toolbox TOOLBOX` | Toolbox configuration |
+| `--model MODEL` | string | Specify model to use |
 | `--continue SESSION_ID` | string | Resume existing session |
 #### Permission Flags
 | Flag | Type | Description |
 |------|------|-------------|
 | `--dangerously-skip-permissions` | bool | Skip all permission prompts |
 #### Configuration Flags
 | Flag | Type | Description |
 |------|------|-------------|
 | `--toolbox NAME` | string | Toolbox configuration to use |
 | `--mcp-config FILE` | path | Path to MCP configuration file |
 **Note:** Amp CLI flags vary by version. The daemon uses flag detection (`amp --help`) to determine which flags are supported before invocation.
 ## Credential Discovery
--- a/research/agents/claude.md
+++ b/research/agents/claude.md
@ -71,17 +71,42 @@ claude \
  "PROMPT"
 ```
-### Arguments
+### Core Arguments
 | Flag | Description |
 |------|-------------|
-| `--print` | Output mode |
+| `--print` | Output mode (non-interactive) |
 | `--output-format stream-json` | Newline-delimited JSON streaming |
 | `--verbose` | Verbose output |
 | `--dangerously-skip-permissions` | Skip permission prompts |
 | `--resume SESSION_ID` | Resume existing session |
 | `--model MODEL_ID` | Specify model (e.g., `claude-sonnet-4-20250514`) |
-| `--permission-mode plan` | Plan mode (read-only exploration) |
+| `--permission-mode MODE` | Permission mode (`plan`, `acceptEdits`) |
 ### Custom Args (Session Configuration)
 These flags can be passed to customize agent behavior at session start:
 | Flag | Type | Description |
 |------|------|-------------|
 | `--max-turns N` | int | Maximum number of agent turns before stopping |
 | `--system-prompt TEXT` | string | Custom system prompt (replaces default) |
 | `--append-system-prompt TEXT` | string | Text to append to the system prompt |
 | `--allowed-tools TOOLS` | string (comma-sep) | Comma-separated list of allowed tools |
 | `--disallowed-tools TOOLS` | string (comma-sep) | Comma-separated list of disallowed tools |
 | `--mcp-server NAME` | string | Add an MCP server by name |
 | `--timeout-secs N` | int | Timeout in seconds (overrides default 300s) |
 | `--profile NAME` | string | Use a specific configuration profile |
 ### Streaming Input Mode Flags
 When using `--input-format stream-json` for streaming input:
 | Flag | Description |
 |------|-------------|
 | `--input-format stream-json` | Accept streaming JSON input via stdin |
 | `--permission-prompt-tool stdio` | Handle permission prompts via stdio |
 | `--include-partial-messages` | Include partial message events in output |
 ### Environment Variables
--- a/research/agents/codex.md
+++ b/research/agents/codex.md
@ -41,17 +41,54 @@ codex exec --dangerously-bypass-approvals-and-sandbox "prompt"
 codex exec resume --last  # Resume previous session
 ```
-### Key CLI Flags
+### Custom Args (CLI Flags)
-| Flag | Description |
+
-|------|-------------|
+#### Core Flags
-| `--json` | Print events to stdout as JSONL |
+
-| `-m, --model MODEL` | Model to use |
+| Flag | Type | Description |
-| `-s, --sandbox MODE` | `read-only`, `workspace-write`, `danger-full-access` |
+|------|------|-------------|
-| `--full-auto` | Auto-approve with workspace-write sandbox |
+| `-m, --model MODEL` | string | Model to use (e.g., `o3`, `gpt-4o`) |
-| `--dangerously-bypass-approvals-and-sandbox` | Skip all prompts (dangerous) |
+| `--json` | bool | Print events to stdout as JSONL |
-| `-C, --cd DIR` | Working directory |
+| `-C, --cd DIR` | path | Working directory for the agent |
-| `-o, --output-last-message FILE` | Write final response to file |
+| `-o, --output-last-message FILE` | path | Write final response to file |
-| `--output-schema FILE` | JSON Schema for structured output |
+
 #### Permission & Sandbox Flags
 | Flag | Type | Values | Description |
 |------|------|--------|-------------|
 | `-s, --sandbox MODE` | enum | `read-only`, `workspace-write`, `danger-full-access` | Sandbox policy for shell commands |
 | `-a, --ask-for-approval POLICY` | enum | `untrusted`, `on-failure`, `on-request`, `never` | When to require human approval |
 | `--full-auto` | bool | - | Convenience alias: `-a on-request --sandbox workspace-write` |
 | `--dangerously-bypass-approvals-and-sandbox` | bool | - | Skip all prompts and sandboxing (DANGEROUS) |
 #### Configuration Overrides
 | Flag | Type | Description |
 |------|------|-------------|
 | `-c, --config key=value` | string | Override config values (parsed as TOML) |
 | `-p, --profile NAME` | string | Use a configuration profile from config.toml |
 | `--enable FEATURE` | string | Enable a feature flag (repeatable) |
 | `--disable FEATURE` | string | Disable a feature flag (repeatable) |
 Config override examples:
 ```bash
 codex -c model="o3"
 codex -c 'sandbox_permissions=["disk-full-read-access"]'
 codex -c shell_environment_policy.inherit=all
 ```
 #### Additional Capabilities
 | Flag | Type | Description |
 |------|------|-------------|
 | `-i, --image FILE` | path[] | Attach image(s) to the initial prompt (repeatable) |
 | `--add-dir DIR` | path[] | Additional directories that should be writable (repeatable) |
 | `--search` | bool | Enable live web search via `web_search` tool |
 | `--output-schema FILE` | path | JSON Schema file for structured output |
 | `--skip-git-repo-check` | bool | Allow running outside a Git repository |
 | `--oss` | bool | Use local open source model provider (LM Studio/Ollama) |
 | `--local-provider PROVIDER` | enum | `lmstudio`, `ollama`, `ollama-chat` |
 | `--color COLOR` | enum | `always`, `never`, `auto` |
 ### Session Management
 ```bash
@ -140,6 +177,41 @@ Codex App Server uses JSON-RPC 2.0 over JSONL/stdin/stdout (no port required).
 - `thread/start` → starts a new thread
 - `turn/start` → sends user input for a thread
 ### Custom Args (JSON-RPC Parameters)
 #### `thread/start` Parameters
 | Field | Type | Description |
 |-------|------|-------------|
 | `approval_policy` | enum | `Never`, `Untrusted` - when to ask for approval |
 | `sandbox` | enum | `ReadOnly`, `DangerFullAccess` - sandbox mode |
 | `model` | string | Model to use for this thread |
 | `cwd` | string | Working directory |
 #### `turn/start` Parameters
 | Field | Type | Description |
 |-------|------|-------------|
 | `thread_id` | string | Thread ID from `thread/start` response |
 | `input` | array | User input (e.g., `[{ "type": "text", "text": "..." }]`) |
 | `approval_policy` | enum | Override approval policy for this turn |
 | `sandbox_policy` | enum | Override sandbox policy for this turn |
 | `model` | string | Override model for this turn |
 | `cwd` | string | Override working directory |
 | `effort` | string | Reasoning effort level |
 | `output_schema` | object | JSON Schema for structured output |
 | `summary` | string | Summary context for the turn |
 | `collaboration_mode` | string | Collaboration mode (if supported) |
 #### App Server CLI Flags
 | Flag | Description |
 |------|-------------|
 | `-c, --config key=value` | Override config (same as interactive mode) |
 | `--enable FEATURE` | Enable feature flag |
 | `--disable FEATURE` | Disable feature flag |
 | `--analytics-default-enabled` | Enable analytics by default (for first-party use) |
 ### Event Notifications (examples)
 ```json
--- a/research/agents/opencode.md
+++ b/research/agents/opencode.md
@ -34,18 +34,40 @@ opencode run -s SESSION_ID "prompt"   # Continue specific session
 opencode run -f file1.ts -f file2.ts "review these files"
 ```
-### Key CLI Flags
+### Custom Args (CLI Flags)
-| Flag | Description |
+
-|------|-------------|
+#### Core Flags
-| `--format json` | Output raw JSON events (for parsing) |
+
-| `-m, --model PROVIDER/MODEL` | Model in format `provider/model` |
+| Flag | Type | Description |
-| `--agent AGENT` | Agent to use (`build`, `plan`) |
+|------|------|-------------|
-| `-c, --continue` | Continue last session |
+| `-m, --model PROVIDER/MODEL` | string | Model in format `provider/model` (e.g., `anthropic/claude-sonnet-4-20250514`) |
-| `-s, --session ID` | Continue specific session |
+| `--agent AGENT` | string | Agent to use (`build`, `plan`, or custom agent ID) |
-| `-f, --file FILE` | Attach file(s) to message |
+| `--format FORMAT` | enum | `default` (formatted) or `json` (raw JSON events) |
-| `--attach URL` | Attach to running server |
+| `--variant VARIANT` | string | Reasoning effort level (e.g., `high`, `max`, `minimal`) |
-| `--port PORT` | Local server port |
+
-| `--variant VARIANT` | Reasoning effort (e.g., `high`, `max`) |
+#### Session Flags
 | Flag | Type | Description |
 |------|------|-------------|
 | `-c, --continue` | bool | Continue the last session |
 | `-s, --session ID` | string | Continue a specific session by ID |
 | `--title TEXT` | string | Title for the session (uses truncated prompt if omitted) |
 | `--share` | bool | Share the session publicly |
 #### Input/Output Flags
 | Flag | Type | Description |
 |------|------|-------------|
 | `-f, --file FILE` | path[] | Attach file(s) to message (repeatable) |
 | `--attach URL` | string | Attach to a running OpenCode server (e.g., `http://localhost:4096`) |
 | `--port PORT` | int | Port for the local server (random if not specified) |
 #### Debugging Flags
 | Flag | Type | Values | Description |
 |------|------|--------|-------------|
 | `--log-level LEVEL` | enum | `DEBUG`, `INFO`, `WARN`, `ERROR` | Log verbosity level |
 | `--print-logs` | bool | - | Print logs to stderr |
 ### Headless Server Mode
 ```bash
--- a/sdks/typescript/src/generated/openapi.ts
+++ b/sdks/typescript/src/generated/openapi.ts
@ -64,6 +64,10 @@ export interface components {
      permissions: boolean;
      planMode: boolean;
      questions: boolean;
      /** @description Whether this agent supports raw CLI arguments passed at session creation */
      rawSessionArgs: boolean;
      /** @description Whether this agent supports raw options passed at session creation */
      rawSessionOptions: boolean;
      reasoning: boolean;
      sessionLifecycle: boolean;
      /** @description Whether this agent uses a shared long-running server process (vs per-turn subprocess) */
@ -156,6 +160,12 @@ export interface components {
      model?: string | null;
      permissionMode?: string | null;
      variant?: string | null;
      /** @description Raw CLI arguments to pass to the agent (for CLI-based agents like Claude, OpenCode, Amp) */
      rawSessionArgs?: string[] | null;
      /** @description Raw options to pass to the agent (for long-running server agents like Codex) */
      rawSessionOptions?: {
        [key: string]: unknown;
      } | null;
    };
    CreateSessionResponse: {
      error?: components["schemas"]["AgentError"] | null;
--- a/server/packages/agent-management/src/agents.rs
+++ b/server/packages/agent-management/src/agents.rs
@ -237,6 +237,10 @@ impl AgentManager {
                    }
                    _ => {}
                }
                // Apply raw CLI args
                for arg in &options.raw_args {
                    command.arg(arg);
                }
                if options.streaming_input {
                    command
                        .arg("--input-format")
@ -268,6 +272,10 @@ impl AgentManager {
                if let Some(session_id) = options.session_id.as_deref() {
                    command.arg("-s").arg(session_id);
                }
                // Apply raw CLI args
                for arg in &options.raw_args {
                    command.arg(arg);
                }
                command.arg(&options.prompt);
            }
            AgentId::Amp => {
@ -583,6 +591,10 @@ impl AgentManager {
                    }
                    _ => {}
                }
                // Apply raw CLI args
                for arg in &options.raw_args {
                    command.arg(arg);
                }
                if options.streaming_input {
                    command
                        .arg("--input-format")
@ -614,6 +626,10 @@ impl AgentManager {
                if let Some(session_id) = options.session_id.as_deref() {
                    command.arg("-s").arg(session_id);
                }
                // Apply raw CLI args
                for arg in &options.raw_args {
                    command.arg(arg);
                }
                command.arg(&options.prompt);
            }
            AgentId::Amp => {
@ -682,6 +698,8 @@ pub struct SpawnOptions {
    pub env: HashMap<String, String>,
    /// Use stream-json input via stdin (Claude only).
    pub streaming_input: bool,
    /// Raw CLI arguments to pass to the agent (for CLI-based agents).
    pub raw_args: Vec<String>,
 }
 impl SpawnOptions {
@ -696,6 +714,7 @@ impl SpawnOptions {
            working_dir: None,
            env: HashMap::new(),
            streaming_input: false,
            raw_args: Vec::new(),
        }
    }
 }
@ -1054,7 +1073,12 @@ fn spawn_amp(
    if let Some(session_id) = options.session_id.as_deref() {
        command.arg("--continue").arg(session_id);
    }
-    command.args(&args).arg(&options.prompt);
+    command.args(&args);
    // Apply raw CLI args
    for arg in &options.raw_args {
        command.arg(arg);
    }
    command.arg(&options.prompt);
    for (key, value) in &options.env {
        command.env(key, value);
    }
@ -1095,6 +1119,10 @@ fn build_amp_command(path: &Path, working_dir: &Path, options: &SpawnOptions) ->
    if flags.dangerously_skip_permissions && options.permission_mode.as_deref() == Some("bypass") {
        command.arg("--dangerously-skip-permissions");
    }
    // Apply raw CLI args
    for arg in &options.raw_args {
        command.arg(arg);
    }
    command.arg(&options.prompt);
    for (key, value) in &options.env {
        command.env(key, value);
@ -1157,6 +1185,10 @@ fn spawn_amp_fallback(
        if !args.is_empty() {
            command.args(&args);
        }
        // Apply raw CLI args
        for arg in &options.raw_args {
            command.arg(arg);
        }
        command.arg(&options.prompt);
        for (key, value) in &options.env {
            command.env(key, value);
@ -1175,6 +1207,10 @@ fn spawn_amp_fallback(
    if let Some(session_id) = options.session_id.as_deref() {
        command.arg("--continue").arg(session_id);
    }
    // Apply raw CLI args
    for arg in &options.raw_args {
        command.arg(arg);
    }
    command.arg(&options.prompt);
    for (key, value) in &options.env {
        command.env(key, value);
--- a/server/packages/sandbox-agent/src/main.rs
+++ b/server/packages/sandbox-agent/src/main.rs
@ -591,6 +591,8 @@ fn run_sessions(command: &SessionsCommand, cli: &Cli) -> Result<(), CliError> {
                model: args.model.clone(),
                variant: args.variant.clone(),
                agent_version: args.agent_version.clone(),
                raw_session_args: None,
                raw_session_options: None,
            };
            let path = format!("{API_PREFIX}/sessions/{}", args.session_id);
            let response = ctx.post(&path, &body)?;
--- a/server/packages/sandbox-agent/src/opencode_compat.rs
+++ b/server/packages/sandbox-agent/src/opencode_compat.rs
@ -379,6 +379,8 @@ async fn ensure_backing_session(
        model: None,
        variant: None,
        agent_version: None,
        raw_session_args: None,
        raw_session_options: None,
    };
    match state
        .inner
--- a/server/packages/sandbox-agent/src/router.rs
+++ b/server/packages/sandbox-agent/src/router.rs
@ -323,6 +323,8 @@ struct SessionState {
    model: Option<String>,
    variant: Option<String>,
    native_session_id: Option<String>,
    raw_session_args: Option<Vec<String>>,
    raw_session_options: Option<serde_json::Value>,
    ended: bool,
    ended_exit_code: Option<i32>,
    ended_message: Option<String>,
@ -381,6 +383,8 @@ impl SessionState {
            model: request.model.clone(),
            variant: request.variant.clone(),
            native_session_id: None,
            raw_session_args: request.raw_session_args.clone(),
            raw_session_options: request.raw_session_options.clone(),
            ended: false,
            ended_exit_code: None,
            ended_message: None,
@ -1614,6 +1618,8 @@ impl SessionManager {
                model: session.model.clone(),
                variant: session.variant.clone(),
                native_session_id: None,
                raw_session_args: session.raw_session_args.clone(),
                raw_session_options: session.raw_session_options.clone(),
            };
            let thread_id = self.create_codex_thread(&session_id, &snapshot).await?;
            session.native_session_id = Some(thread_id);
@ -3079,6 +3085,15 @@ impl SessionManager {
        params.sandbox = codex_sandbox_mode(Some(&session.permission_mode));
        params.model = session.model.clone();
        // Merge raw_session_options into the config field if provided
        if let Some(serde_json::Value::Object(raw_options)) = &session.raw_session_options {
            let mut config = params.config.take().unwrap_or_default();
            for (key, value) in raw_options {
                config.insert(key.clone(), value.clone());
            }
            params.config = Some(config);
        }
        let request = codex_schema::ClientRequest::ThreadStart {
            id: codex_schema::RequestId::from(id),
            params,
@ -3488,6 +3503,10 @@ pub struct AgentCapabilities {
    pub item_started: bool,
    /// Whether this agent uses a shared long-running server process (vs per-turn subprocess)
    pub shared_process: bool,
    /// Whether this agent supports raw CLI arguments passed at session creation
    pub raw_session_args: bool,
    /// Whether this agent supports raw options passed at session creation (long-running server agents)
    pub raw_session_options: bool,
 }
 /// Status of a shared server process for an agent
@ -3575,6 +3594,12 @@ pub struct CreateSessionRequest {
    pub variant: Option<String>,
    #[serde(default, skip_serializing_if = "Option::is_none")]
    pub agent_version: Option<String>,
    /// Raw CLI arguments to pass to the agent (for CLI-based agents like Claude, OpenCode, Amp)
    #[serde(default, skip_serializing_if = "Option::is_none")]
    pub raw_session_args: Option<Vec<String>>,
    /// Raw options to pass to the agent (for long-running server agents like Codex)
    #[serde(default, skip_serializing_if = "Option::is_none")]
    pub raw_session_options: Option<serde_json::Value>,
 }
 #[derive(Debug, Clone, Serialize, Deserialize, ToSchema, JsonSchema)]
@ -4120,6 +4145,8 @@ fn agent_capabilities_for(agent: AgentId) -> AgentCapabilities {
            streaming_deltas: true,
            item_started: false,
            shared_process: false, // per-turn subprocess with --resume
            raw_session_args: true,
            raw_session_options: false,
        },
        AgentId::Codex => AgentCapabilities {
            plan_mode: true,
@ -4140,6 +4167,8 @@ fn agent_capabilities_for(agent: AgentId) -> AgentCapabilities {
            streaming_deltas: true,
            item_started: true,
            shared_process: true, // shared app-server via JSON-RPC
            raw_session_args: false,
            raw_session_options: true,
        },
        AgentId::Opencode => AgentCapabilities {
            plan_mode: false,
@ -4160,6 +4189,8 @@ fn agent_capabilities_for(agent: AgentId) -> AgentCapabilities {
            streaming_deltas: true,
            item_started: true,
            shared_process: true, // shared HTTP server
            raw_session_args: true,
            raw_session_options: false,
        },
        AgentId::Amp => AgentCapabilities {
            plan_mode: false,
@ -4180,6 +4211,8 @@ fn agent_capabilities_for(agent: AgentId) -> AgentCapabilities {
            streaming_deltas: false,
            item_started: false,
            shared_process: false, // per-turn subprocess with --continue
            raw_session_args: true,
            raw_session_options: false,
        },
        AgentId::Mock => AgentCapabilities {
            plan_mode: true,
@ -4200,6 +4233,8 @@ fn agent_capabilities_for(agent: AgentId) -> AgentCapabilities {
            streaming_deltas: true,
            item_started: true,
            shared_process: false, // in-memory mock (no subprocess)
            raw_session_args: false,
            raw_session_options: false,
        },
    }
 }
@ -4434,6 +4469,7 @@ fn build_spawn_options(
            None
        }
    });
    options.raw_args = session.raw_session_args.clone().unwrap_or_default();
    if let Some(anthropic) = credentials.anthropic {
        options
            .env
@ -6461,6 +6497,8 @@ struct SessionSnapshot {
    model: Option<String>,
    variant: Option<String>,
    native_session_id: Option<String>,
    raw_session_args: Option<Vec<String>>,
    raw_session_options: Option<serde_json::Value>,
 }
 impl From<&SessionState> for SessionSnapshot {
@ -6473,6 +6511,8 @@ impl From<&SessionState> for SessionSnapshot {
            model: session.model.clone(),
            variant: session.variant.clone(),
            native_session_id: session.native_session_id.clone(),
            raw_session_args: session.raw_session_args.clone(),
            raw_session_options: session.raw_session_options.clone(),
        }
    }
 }
--- a/server/packages/sandbox-agent/tests/agent-management/mod.rs
+++ b/server/packages/sandbox-agent/tests/agent-management/mod.rs
@ -1 +1,2 @@
 mod agents;
 mod raw_session_args;
--- a/server/packages/sandbox-agent/tests/agent-management/raw_session_args.rs
+++ b/server/packages/sandbox-agent/tests/agent-management/raw_session_args.rs
@ -0,0 +1,50 @@
 use sandbox_agent_agent_management::agents::{AgentId, AgentManager, InstallOptions, SpawnOptions};
 /// Tests that raw_args are passed to CLI-based agents.
 /// We use `--version` as a raw arg which causes agents to print version info and exit.
 #[test]
 fn test_raw_args_version_flag() -> Result<(), Box<dyn std::error::Error>> {
    let temp_dir = tempfile::tempdir()?;
    let manager = AgentManager::new(temp_dir.path().join("bin"))?;
    // Test Claude with --version
    manager.install(AgentId::Claude, InstallOptions::default())?;
    let mut spawn = SpawnOptions::new("test");
    spawn.raw_args = vec!["--version".to_string()];
    let result = manager.spawn(AgentId::Claude, spawn)?;
    let output = format!("{}{}", result.stdout, result.stderr);
    assert!(
        output.to_lowercase().contains("version")
            || output.contains("claude")
            || result.status.code() == Some(0),
        "Claude --version failed: {output}"
    );
    // Test OpenCode with --version
    manager.install(AgentId::Opencode, InstallOptions::default())?;
    let mut spawn = SpawnOptions::new("test");
    spawn.raw_args = vec!["--version".to_string()];
    let result = manager.spawn(AgentId::Opencode, spawn)?;
    let output = format!("{}{}", result.stdout, result.stderr);
    assert!(
        output.to_lowercase().contains("version")
            || output.contains("opencode")
            || result.status.code() == Some(0),
        "OpenCode --version failed: {output}"
    );
    // Test Amp with --version
    manager.install(AgentId::Amp, InstallOptions::default())?;
    let mut spawn = SpawnOptions::new("test");
    spawn.raw_args = vec!["--version".to_string()];
    let result = manager.spawn(AgentId::Amp, spawn)?;
    let output = format!("{}{}", result.stdout, result.stderr);
    assert!(
        output.to_lowercase().contains("version")
            || output.contains("amp")
            || result.status.code() == Some(0),
        "Amp --version failed: {output}"
    );
    Ok(())
 }
`@ -1 +1,2 @@`
	`mod agents;`	`mod agents;`
		`mod raw_session_args;`