feat: add raw session args/opts for agent passthrough

This commit is contained in:
Nathan Flurry 2026-02-05 11:32:39 -08:00
parent 375d73e4cb
commit 2f26f76d9b
14 changed files with 365 additions and 37 deletions

View file

@ -669,7 +669,9 @@
"mcpTools", "mcpTools",
"streamingDeltas", "streamingDeltas",
"itemStarted", "itemStarted",
"sharedProcess" "sharedProcess",
"rawSessionArgs",
"rawSessionOptions"
], ],
"properties": { "properties": {
"commandExecution": { "commandExecution": {
@ -702,6 +704,14 @@
"questions": { "questions": {
"type": "boolean" "type": "boolean"
}, },
"rawSessionArgs": {
"type": "boolean",
"description": "Whether this agent supports raw CLI arguments passed at session creation"
},
"rawSessionOptions": {
"type": "boolean",
"description": "Whether this agent supports raw options passed at session creation"
},
"reasoning": { "reasoning": {
"type": "boolean" "type": "boolean"
}, },
@ -1074,6 +1084,20 @@
"variant": { "variant": {
"type": "string", "type": "string",
"nullable": true "nullable": true
},
"rawSessionArgs": {
"type": "array",
"items": {
"type": "string"
},
"nullable": true,
"description": "Raw CLI arguments to pass to the agent (for CLI-based agents like Claude, OpenCode, Amp)"
},
"rawSessionOptions": {
"type": "object",
"additionalProperties": true,
"nullable": true,
"description": "Raw options to pass to the agent (for long-running server agents like Codex)"
} }
} }
}, },

View file

@ -62,6 +62,26 @@ await client.createSession("demo-session", {
await client.postMessage("demo-session", { message: "Hello" }); await client.postMessage("demo-session", { message: "Hello" });
``` ```
### Raw session arguments
Pass low-level arguments directly to agents at session creation:
```ts
// CLI args for Claude, OpenCode, Amp (not Codex)
await client.createSession("my-session", {
agent: "claude",
rawSessionArgs: ["--max-turns", "5"],
});
// Options passed through agent's native protocol (long-running servers only)
await client.createSession("my-session", {
agent: "codex",
rawSessionOptions: { sandbox: "workspace-write" },
});
```
Check `capabilities.rawSessionArgs` and `capabilities.rawSessionOptions` to see what each agent supports.
List agents and inspect feature coverage (available on `capabilities`): List agents and inspect feature coverage (available on `capabilities`):
```ts ```ts

View file

@ -29,6 +29,8 @@ This table shows which agent feature coverage appears in the universal event str
| File Changes | - | ✓ | - | - | | File Changes | - | ✓ | - | - |
| MCP Tools | - | ✓ | - | - | | MCP Tools | - | ✓ | - | - |
| Streaming Deltas | ✓ | ✓ | ✓ | - | | Streaming Deltas | ✓ | ✓ | ✓ | - |
| Raw Session Args | ✓ | - | ✓ | ✓ |
| Raw Session Options | - | ✓ | - | - |
Agents: [Claude Code](https://docs.anthropic.com/en/docs/agents-and-tools/claude-code/overview) · [Codex](https://github.com/openai/codex) · [OpenCode](https://github.com/opencode-ai/opencode) · [Amp](https://ampcode.com) Agents: [Claude Code](https://docs.anthropic.com/en/docs/agents-and-tools/claude-code/overview) · [Codex](https://github.com/openai/codex) · [OpenCode](https://github.com/opencode-ai/opencode) · [Amp](https://ampcode.com)
@ -76,6 +78,12 @@ Agents: [Claude Code](https://docs.anthropic.com/en/docs/agents-and-tools/claude
<Accordion title="Streaming Deltas"> <Accordion title="Streaming Deltas">
Native streaming of content deltas. When not supported, the daemon emits a single synthetic delta before `item.completed`. Native streaming of content deltas. When not supported, the daemon emits a single synthetic delta before `item.completed`.
</Accordion> </Accordion>
<Accordion title="Raw Session Args">
Pass raw CLI arguments directly to the agent at session creation via `rawSessionArgs`. Only supported for CLI-based agents (Claude, OpenCode, Amp). Codex uses JSON-RPC, so CLI args are not applicable.
</Accordion>
<Accordion title="Raw Session Options">
Pass raw options to the agent at session creation via `rawSessionOptions`. For long-running server agents, options are passed through the agent's native protocol. For Codex, options are merged into the `thread/start` config.
</Accordion>
</AccordionGroup> </AccordionGroup>
Want support for another agent? [Open an issue](https://github.com/rivet-dev/sandbox-agent/issues/new) to request it. Want support for another agent? [Open an issue](https://github.com/rivet-dev/sandbox-agent/issues/new) to request it.

View file

@ -25,16 +25,32 @@ amp --print --output-format stream-json --dangerously-skip-permissions "prompt"
amp --continue SESSION_ID "follow up" amp --continue SESSION_ID "follow up"
``` ```
### Key CLI Flags ### Custom Args (CLI Flags)
| Flag | Description | #### Core Flags
|------|-------------|
| `--print` | Output mode (non-interactive) | | Flag | Type | Description |
| `--output-format stream-json` | JSONL streaming output | |------|------|-------------|
| `--dangerously-skip-permissions` | Skip permission prompts | | `--print` | bool | Output mode (non-interactive) |
| `--continue SESSION_ID` | Resume existing session | | `--execute` | bool | Alternative output mode (some versions) |
| `--model MODEL` | Specify model | | `--output-format stream-json` | string | JSONL streaming output |
| `--toolbox TOOLBOX` | Toolbox configuration | | `--model MODEL` | string | Specify model to use |
| `--continue SESSION_ID` | string | Resume existing session |
#### Permission Flags
| Flag | Type | Description |
|------|------|-------------|
| `--dangerously-skip-permissions` | bool | Skip all permission prompts |
#### Configuration Flags
| Flag | Type | Description |
|------|------|-------------|
| `--toolbox NAME` | string | Toolbox configuration to use |
| `--mcp-config FILE` | path | Path to MCP configuration file |
**Note:** Amp CLI flags vary by version. The daemon uses flag detection (`amp --help`) to determine which flags are supported before invocation.
## Credential Discovery ## Credential Discovery

View file

@ -71,17 +71,42 @@ claude \
"PROMPT" "PROMPT"
``` ```
### Arguments ### Core Arguments
| Flag | Description | | Flag | Description |
|------|-------------| |------|-------------|
| `--print` | Output mode | | `--print` | Output mode (non-interactive) |
| `--output-format stream-json` | Newline-delimited JSON streaming | | `--output-format stream-json` | Newline-delimited JSON streaming |
| `--verbose` | Verbose output | | `--verbose` | Verbose output |
| `--dangerously-skip-permissions` | Skip permission prompts | | `--dangerously-skip-permissions` | Skip permission prompts |
| `--resume SESSION_ID` | Resume existing session | | `--resume SESSION_ID` | Resume existing session |
| `--model MODEL_ID` | Specify model (e.g., `claude-sonnet-4-20250514`) | | `--model MODEL_ID` | Specify model (e.g., `claude-sonnet-4-20250514`) |
| `--permission-mode plan` | Plan mode (read-only exploration) | | `--permission-mode MODE` | Permission mode (`plan`, `acceptEdits`) |
### Custom Args (Session Configuration)
These flags can be passed to customize agent behavior at session start:
| Flag | Type | Description |
|------|------|-------------|
| `--max-turns N` | int | Maximum number of agent turns before stopping |
| `--system-prompt TEXT` | string | Custom system prompt (replaces default) |
| `--append-system-prompt TEXT` | string | Text to append to the system prompt |
| `--allowed-tools TOOLS` | string (comma-sep) | Comma-separated list of allowed tools |
| `--disallowed-tools TOOLS` | string (comma-sep) | Comma-separated list of disallowed tools |
| `--mcp-server NAME` | string | Add an MCP server by name |
| `--timeout-secs N` | int | Timeout in seconds (overrides default 300s) |
| `--profile NAME` | string | Use a specific configuration profile |
### Streaming Input Mode Flags
When using `--input-format stream-json` for streaming input:
| Flag | Description |
|------|-------------|
| `--input-format stream-json` | Accept streaming JSON input via stdin |
| `--permission-prompt-tool stdio` | Handle permission prompts via stdio |
| `--include-partial-messages` | Include partial message events in output |
### Environment Variables ### Environment Variables

View file

@ -41,17 +41,54 @@ codex exec --dangerously-bypass-approvals-and-sandbox "prompt"
codex exec resume --last # Resume previous session codex exec resume --last # Resume previous session
``` ```
### Key CLI Flags ### Custom Args (CLI Flags)
| Flag | Description |
|------|-------------| #### Core Flags
| `--json` | Print events to stdout as JSONL |
| `-m, --model MODEL` | Model to use | | Flag | Type | Description |
| `-s, --sandbox MODE` | `read-only`, `workspace-write`, `danger-full-access` | |------|------|-------------|
| `--full-auto` | Auto-approve with workspace-write sandbox | | `-m, --model MODEL` | string | Model to use (e.g., `o3`, `gpt-4o`) |
| `--dangerously-bypass-approvals-and-sandbox` | Skip all prompts (dangerous) | | `--json` | bool | Print events to stdout as JSONL |
| `-C, --cd DIR` | Working directory | | `-C, --cd DIR` | path | Working directory for the agent |
| `-o, --output-last-message FILE` | Write final response to file | | `-o, --output-last-message FILE` | path | Write final response to file |
| `--output-schema FILE` | JSON Schema for structured output |
#### Permission & Sandbox Flags
| Flag | Type | Values | Description |
|------|------|--------|-------------|
| `-s, --sandbox MODE` | enum | `read-only`, `workspace-write`, `danger-full-access` | Sandbox policy for shell commands |
| `-a, --ask-for-approval POLICY` | enum | `untrusted`, `on-failure`, `on-request`, `never` | When to require human approval |
| `--full-auto` | bool | - | Convenience alias: `-a on-request --sandbox workspace-write` |
| `--dangerously-bypass-approvals-and-sandbox` | bool | - | Skip all prompts and sandboxing (DANGEROUS) |
#### Configuration Overrides
| Flag | Type | Description |
|------|------|-------------|
| `-c, --config key=value` | string | Override config values (parsed as TOML) |
| `-p, --profile NAME` | string | Use a configuration profile from config.toml |
| `--enable FEATURE` | string | Enable a feature flag (repeatable) |
| `--disable FEATURE` | string | Disable a feature flag (repeatable) |
Config override examples:
```bash
codex -c model="o3"
codex -c 'sandbox_permissions=["disk-full-read-access"]'
codex -c shell_environment_policy.inherit=all
```
#### Additional Capabilities
| Flag | Type | Description |
|------|------|-------------|
| `-i, --image FILE` | path[] | Attach image(s) to the initial prompt (repeatable) |
| `--add-dir DIR` | path[] | Additional directories that should be writable (repeatable) |
| `--search` | bool | Enable live web search via `web_search` tool |
| `--output-schema FILE` | path | JSON Schema file for structured output |
| `--skip-git-repo-check` | bool | Allow running outside a Git repository |
| `--oss` | bool | Use local open source model provider (LM Studio/Ollama) |
| `--local-provider PROVIDER` | enum | `lmstudio`, `ollama`, `ollama-chat` |
| `--color COLOR` | enum | `always`, `never`, `auto` |
### Session Management ### Session Management
```bash ```bash
@ -140,6 +177,41 @@ Codex App Server uses JSON-RPC 2.0 over JSONL/stdin/stdout (no port required).
- `thread/start` → starts a new thread - `thread/start` → starts a new thread
- `turn/start` → sends user input for a thread - `turn/start` → sends user input for a thread
### Custom Args (JSON-RPC Parameters)
#### `thread/start` Parameters
| Field | Type | Description |
|-------|------|-------------|
| `approval_policy` | enum | `Never`, `Untrusted` - when to ask for approval |
| `sandbox` | enum | `ReadOnly`, `DangerFullAccess` - sandbox mode |
| `model` | string | Model to use for this thread |
| `cwd` | string | Working directory |
#### `turn/start` Parameters
| Field | Type | Description |
|-------|------|-------------|
| `thread_id` | string | Thread ID from `thread/start` response |
| `input` | array | User input (e.g., `[{ "type": "text", "text": "..." }]`) |
| `approval_policy` | enum | Override approval policy for this turn |
| `sandbox_policy` | enum | Override sandbox policy for this turn |
| `model` | string | Override model for this turn |
| `cwd` | string | Override working directory |
| `effort` | string | Reasoning effort level |
| `output_schema` | object | JSON Schema for structured output |
| `summary` | string | Summary context for the turn |
| `collaboration_mode` | string | Collaboration mode (if supported) |
#### App Server CLI Flags
| Flag | Description |
|------|-------------|
| `-c, --config key=value` | Override config (same as interactive mode) |
| `--enable FEATURE` | Enable feature flag |
| `--disable FEATURE` | Disable feature flag |
| `--analytics-default-enabled` | Enable analytics by default (for first-party use) |
### Event Notifications (examples) ### Event Notifications (examples)
```json ```json

View file

@ -34,18 +34,40 @@ opencode run -s SESSION_ID "prompt" # Continue specific session
opencode run -f file1.ts -f file2.ts "review these files" opencode run -f file1.ts -f file2.ts "review these files"
``` ```
### Key CLI Flags ### Custom Args (CLI Flags)
| Flag | Description |
|------|-------------| #### Core Flags
| `--format json` | Output raw JSON events (for parsing) |
| `-m, --model PROVIDER/MODEL` | Model in format `provider/model` | | Flag | Type | Description |
| `--agent AGENT` | Agent to use (`build`, `plan`) | |------|------|-------------|
| `-c, --continue` | Continue last session | | `-m, --model PROVIDER/MODEL` | string | Model in format `provider/model` (e.g., `anthropic/claude-sonnet-4-20250514`) |
| `-s, --session ID` | Continue specific session | | `--agent AGENT` | string | Agent to use (`build`, `plan`, or custom agent ID) |
| `-f, --file FILE` | Attach file(s) to message | | `--format FORMAT` | enum | `default` (formatted) or `json` (raw JSON events) |
| `--attach URL` | Attach to running server | | `--variant VARIANT` | string | Reasoning effort level (e.g., `high`, `max`, `minimal`) |
| `--port PORT` | Local server port |
| `--variant VARIANT` | Reasoning effort (e.g., `high`, `max`) | #### Session Flags
| Flag | Type | Description |
|------|------|-------------|
| `-c, --continue` | bool | Continue the last session |
| `-s, --session ID` | string | Continue a specific session by ID |
| `--title TEXT` | string | Title for the session (uses truncated prompt if omitted) |
| `--share` | bool | Share the session publicly |
#### Input/Output Flags
| Flag | Type | Description |
|------|------|-------------|
| `-f, --file FILE` | path[] | Attach file(s) to message (repeatable) |
| `--attach URL` | string | Attach to a running OpenCode server (e.g., `http://localhost:4096`) |
| `--port PORT` | int | Port for the local server (random if not specified) |
#### Debugging Flags
| Flag | Type | Values | Description |
|------|------|--------|-------------|
| `--log-level LEVEL` | enum | `DEBUG`, `INFO`, `WARN`, `ERROR` | Log verbosity level |
| `--print-logs` | bool | - | Print logs to stderr |
### Headless Server Mode ### Headless Server Mode
```bash ```bash

View file

@ -64,6 +64,10 @@ export interface components {
permissions: boolean; permissions: boolean;
planMode: boolean; planMode: boolean;
questions: boolean; questions: boolean;
/** @description Whether this agent supports raw CLI arguments passed at session creation */
rawSessionArgs: boolean;
/** @description Whether this agent supports raw options passed at session creation */
rawSessionOptions: boolean;
reasoning: boolean; reasoning: boolean;
sessionLifecycle: boolean; sessionLifecycle: boolean;
/** @description Whether this agent uses a shared long-running server process (vs per-turn subprocess) */ /** @description Whether this agent uses a shared long-running server process (vs per-turn subprocess) */
@ -156,6 +160,12 @@ export interface components {
model?: string | null; model?: string | null;
permissionMode?: string | null; permissionMode?: string | null;
variant?: string | null; variant?: string | null;
/** @description Raw CLI arguments to pass to the agent (for CLI-based agents like Claude, OpenCode, Amp) */
rawSessionArgs?: string[] | null;
/** @description Raw options to pass to the agent (for long-running server agents like Codex) */
rawSessionOptions?: {
[key: string]: unknown;
} | null;
}; };
CreateSessionResponse: { CreateSessionResponse: {
error?: components["schemas"]["AgentError"] | null; error?: components["schemas"]["AgentError"] | null;

View file

@ -237,6 +237,10 @@ impl AgentManager {
} }
_ => {} _ => {}
} }
// Apply raw CLI args
for arg in &options.raw_args {
command.arg(arg);
}
if options.streaming_input { if options.streaming_input {
command command
.arg("--input-format") .arg("--input-format")
@ -268,6 +272,10 @@ impl AgentManager {
if let Some(session_id) = options.session_id.as_deref() { if let Some(session_id) = options.session_id.as_deref() {
command.arg("-s").arg(session_id); command.arg("-s").arg(session_id);
} }
// Apply raw CLI args
for arg in &options.raw_args {
command.arg(arg);
}
command.arg(&options.prompt); command.arg(&options.prompt);
} }
AgentId::Amp => { AgentId::Amp => {
@ -583,6 +591,10 @@ impl AgentManager {
} }
_ => {} _ => {}
} }
// Apply raw CLI args
for arg in &options.raw_args {
command.arg(arg);
}
if options.streaming_input { if options.streaming_input {
command command
.arg("--input-format") .arg("--input-format")
@ -614,6 +626,10 @@ impl AgentManager {
if let Some(session_id) = options.session_id.as_deref() { if let Some(session_id) = options.session_id.as_deref() {
command.arg("-s").arg(session_id); command.arg("-s").arg(session_id);
} }
// Apply raw CLI args
for arg in &options.raw_args {
command.arg(arg);
}
command.arg(&options.prompt); command.arg(&options.prompt);
} }
AgentId::Amp => { AgentId::Amp => {
@ -682,6 +698,8 @@ pub struct SpawnOptions {
pub env: HashMap<String, String>, pub env: HashMap<String, String>,
/// Use stream-json input via stdin (Claude only). /// Use stream-json input via stdin (Claude only).
pub streaming_input: bool, pub streaming_input: bool,
/// Raw CLI arguments to pass to the agent (for CLI-based agents).
pub raw_args: Vec<String>,
} }
impl SpawnOptions { impl SpawnOptions {
@ -696,6 +714,7 @@ impl SpawnOptions {
working_dir: None, working_dir: None,
env: HashMap::new(), env: HashMap::new(),
streaming_input: false, streaming_input: false,
raw_args: Vec::new(),
} }
} }
} }
@ -1054,7 +1073,12 @@ fn spawn_amp(
if let Some(session_id) = options.session_id.as_deref() { if let Some(session_id) = options.session_id.as_deref() {
command.arg("--continue").arg(session_id); command.arg("--continue").arg(session_id);
} }
command.args(&args).arg(&options.prompt); command.args(&args);
// Apply raw CLI args
for arg in &options.raw_args {
command.arg(arg);
}
command.arg(&options.prompt);
for (key, value) in &options.env { for (key, value) in &options.env {
command.env(key, value); command.env(key, value);
} }
@ -1095,6 +1119,10 @@ fn build_amp_command(path: &Path, working_dir: &Path, options: &SpawnOptions) ->
if flags.dangerously_skip_permissions && options.permission_mode.as_deref() == Some("bypass") { if flags.dangerously_skip_permissions && options.permission_mode.as_deref() == Some("bypass") {
command.arg("--dangerously-skip-permissions"); command.arg("--dangerously-skip-permissions");
} }
// Apply raw CLI args
for arg in &options.raw_args {
command.arg(arg);
}
command.arg(&options.prompt); command.arg(&options.prompt);
for (key, value) in &options.env { for (key, value) in &options.env {
command.env(key, value); command.env(key, value);
@ -1157,6 +1185,10 @@ fn spawn_amp_fallback(
if !args.is_empty() { if !args.is_empty() {
command.args(&args); command.args(&args);
} }
// Apply raw CLI args
for arg in &options.raw_args {
command.arg(arg);
}
command.arg(&options.prompt); command.arg(&options.prompt);
for (key, value) in &options.env { for (key, value) in &options.env {
command.env(key, value); command.env(key, value);
@ -1175,6 +1207,10 @@ fn spawn_amp_fallback(
if let Some(session_id) = options.session_id.as_deref() { if let Some(session_id) = options.session_id.as_deref() {
command.arg("--continue").arg(session_id); command.arg("--continue").arg(session_id);
} }
// Apply raw CLI args
for arg in &options.raw_args {
command.arg(arg);
}
command.arg(&options.prompt); command.arg(&options.prompt);
for (key, value) in &options.env { for (key, value) in &options.env {
command.env(key, value); command.env(key, value);

View file

@ -591,6 +591,8 @@ fn run_sessions(command: &SessionsCommand, cli: &Cli) -> Result<(), CliError> {
model: args.model.clone(), model: args.model.clone(),
variant: args.variant.clone(), variant: args.variant.clone(),
agent_version: args.agent_version.clone(), agent_version: args.agent_version.clone(),
raw_session_args: None,
raw_session_options: None,
}; };
let path = format!("{API_PREFIX}/sessions/{}", args.session_id); let path = format!("{API_PREFIX}/sessions/{}", args.session_id);
let response = ctx.post(&path, &body)?; let response = ctx.post(&path, &body)?;

View file

@ -379,6 +379,8 @@ async fn ensure_backing_session(
model: None, model: None,
variant: None, variant: None,
agent_version: None, agent_version: None,
raw_session_args: None,
raw_session_options: None,
}; };
match state match state
.inner .inner

View file

@ -323,6 +323,8 @@ struct SessionState {
model: Option<String>, model: Option<String>,
variant: Option<String>, variant: Option<String>,
native_session_id: Option<String>, native_session_id: Option<String>,
raw_session_args: Option<Vec<String>>,
raw_session_options: Option<serde_json::Value>,
ended: bool, ended: bool,
ended_exit_code: Option<i32>, ended_exit_code: Option<i32>,
ended_message: Option<String>, ended_message: Option<String>,
@ -381,6 +383,8 @@ impl SessionState {
model: request.model.clone(), model: request.model.clone(),
variant: request.variant.clone(), variant: request.variant.clone(),
native_session_id: None, native_session_id: None,
raw_session_args: request.raw_session_args.clone(),
raw_session_options: request.raw_session_options.clone(),
ended: false, ended: false,
ended_exit_code: None, ended_exit_code: None,
ended_message: None, ended_message: None,
@ -1614,6 +1618,8 @@ impl SessionManager {
model: session.model.clone(), model: session.model.clone(),
variant: session.variant.clone(), variant: session.variant.clone(),
native_session_id: None, native_session_id: None,
raw_session_args: session.raw_session_args.clone(),
raw_session_options: session.raw_session_options.clone(),
}; };
let thread_id = self.create_codex_thread(&session_id, &snapshot).await?; let thread_id = self.create_codex_thread(&session_id, &snapshot).await?;
session.native_session_id = Some(thread_id); session.native_session_id = Some(thread_id);
@ -3079,6 +3085,15 @@ impl SessionManager {
params.sandbox = codex_sandbox_mode(Some(&session.permission_mode)); params.sandbox = codex_sandbox_mode(Some(&session.permission_mode));
params.model = session.model.clone(); params.model = session.model.clone();
// Merge raw_session_options into the config field if provided
if let Some(serde_json::Value::Object(raw_options)) = &session.raw_session_options {
let mut config = params.config.take().unwrap_or_default();
for (key, value) in raw_options {
config.insert(key.clone(), value.clone());
}
params.config = Some(config);
}
let request = codex_schema::ClientRequest::ThreadStart { let request = codex_schema::ClientRequest::ThreadStart {
id: codex_schema::RequestId::from(id), id: codex_schema::RequestId::from(id),
params, params,
@ -3488,6 +3503,10 @@ pub struct AgentCapabilities {
pub item_started: bool, pub item_started: bool,
/// Whether this agent uses a shared long-running server process (vs per-turn subprocess) /// Whether this agent uses a shared long-running server process (vs per-turn subprocess)
pub shared_process: bool, pub shared_process: bool,
/// Whether this agent supports raw CLI arguments passed at session creation
pub raw_session_args: bool,
/// Whether this agent supports raw options passed at session creation (long-running server agents)
pub raw_session_options: bool,
} }
/// Status of a shared server process for an agent /// Status of a shared server process for an agent
@ -3575,6 +3594,12 @@ pub struct CreateSessionRequest {
pub variant: Option<String>, pub variant: Option<String>,
#[serde(default, skip_serializing_if = "Option::is_none")] #[serde(default, skip_serializing_if = "Option::is_none")]
pub agent_version: Option<String>, pub agent_version: Option<String>,
/// Raw CLI arguments to pass to the agent (for CLI-based agents like Claude, OpenCode, Amp)
#[serde(default, skip_serializing_if = "Option::is_none")]
pub raw_session_args: Option<Vec<String>>,
/// Raw options to pass to the agent (for long-running server agents like Codex)
#[serde(default, skip_serializing_if = "Option::is_none")]
pub raw_session_options: Option<serde_json::Value>,
} }
#[derive(Debug, Clone, Serialize, Deserialize, ToSchema, JsonSchema)] #[derive(Debug, Clone, Serialize, Deserialize, ToSchema, JsonSchema)]
@ -4120,6 +4145,8 @@ fn agent_capabilities_for(agent: AgentId) -> AgentCapabilities {
streaming_deltas: true, streaming_deltas: true,
item_started: false, item_started: false,
shared_process: false, // per-turn subprocess with --resume shared_process: false, // per-turn subprocess with --resume
raw_session_args: true,
raw_session_options: false,
}, },
AgentId::Codex => AgentCapabilities { AgentId::Codex => AgentCapabilities {
plan_mode: true, plan_mode: true,
@ -4140,6 +4167,8 @@ fn agent_capabilities_for(agent: AgentId) -> AgentCapabilities {
streaming_deltas: true, streaming_deltas: true,
item_started: true, item_started: true,
shared_process: true, // shared app-server via JSON-RPC shared_process: true, // shared app-server via JSON-RPC
raw_session_args: false,
raw_session_options: true,
}, },
AgentId::Opencode => AgentCapabilities { AgentId::Opencode => AgentCapabilities {
plan_mode: false, plan_mode: false,
@ -4160,6 +4189,8 @@ fn agent_capabilities_for(agent: AgentId) -> AgentCapabilities {
streaming_deltas: true, streaming_deltas: true,
item_started: true, item_started: true,
shared_process: true, // shared HTTP server shared_process: true, // shared HTTP server
raw_session_args: true,
raw_session_options: false,
}, },
AgentId::Amp => AgentCapabilities { AgentId::Amp => AgentCapabilities {
plan_mode: false, plan_mode: false,
@ -4180,6 +4211,8 @@ fn agent_capabilities_for(agent: AgentId) -> AgentCapabilities {
streaming_deltas: false, streaming_deltas: false,
item_started: false, item_started: false,
shared_process: false, // per-turn subprocess with --continue shared_process: false, // per-turn subprocess with --continue
raw_session_args: true,
raw_session_options: false,
}, },
AgentId::Mock => AgentCapabilities { AgentId::Mock => AgentCapabilities {
plan_mode: true, plan_mode: true,
@ -4200,6 +4233,8 @@ fn agent_capabilities_for(agent: AgentId) -> AgentCapabilities {
streaming_deltas: true, streaming_deltas: true,
item_started: true, item_started: true,
shared_process: false, // in-memory mock (no subprocess) shared_process: false, // in-memory mock (no subprocess)
raw_session_args: false,
raw_session_options: false,
}, },
} }
} }
@ -4434,6 +4469,7 @@ fn build_spawn_options(
None None
} }
}); });
options.raw_args = session.raw_session_args.clone().unwrap_or_default();
if let Some(anthropic) = credentials.anthropic { if let Some(anthropic) = credentials.anthropic {
options options
.env .env
@ -6461,6 +6497,8 @@ struct SessionSnapshot {
model: Option<String>, model: Option<String>,
variant: Option<String>, variant: Option<String>,
native_session_id: Option<String>, native_session_id: Option<String>,
raw_session_args: Option<Vec<String>>,
raw_session_options: Option<serde_json::Value>,
} }
impl From<&SessionState> for SessionSnapshot { impl From<&SessionState> for SessionSnapshot {
@ -6473,6 +6511,8 @@ impl From<&SessionState> for SessionSnapshot {
model: session.model.clone(), model: session.model.clone(),
variant: session.variant.clone(), variant: session.variant.clone(),
native_session_id: session.native_session_id.clone(), native_session_id: session.native_session_id.clone(),
raw_session_args: session.raw_session_args.clone(),
raw_session_options: session.raw_session_options.clone(),
} }
} }
} }

View file

@ -1 +1,2 @@
mod agents; mod agents;
mod raw_session_args;

View file

@ -0,0 +1,50 @@
use sandbox_agent_agent_management::agents::{AgentId, AgentManager, InstallOptions, SpawnOptions};
/// Verifies that `SpawnOptions::raw_args` are forwarded to the CLI-based agents
/// (Claude, OpenCode, Amp).
///
/// An `AgentManager` is created over a `bin` path inside a temporary directory. Each agent is
/// installed and then spawned with `--version` as its only raw argument (which is expected to
/// make the agent report its version and exit). An agent passes when the combined
/// stdout/stderr mentions "version" (case-insensitive), contains the agent's lowercase name,
/// or the process exits with status code 0.
#[test]
fn test_raw_args_version_flag() -> Result<(), Box<dyn std::error::Error>> {
    // Installs `$agent`, spawns it with `--version` as a raw arg, and asserts on the outcome.
    // A macro is used so the agent expression is written out at each use site and `?` still
    // propagates errors out of the enclosing test function.
    macro_rules! check_version_flag {
        ($manager:expr, $agent:expr, $label:expr, $needle:expr) => {{
            $manager.install($agent, InstallOptions::default())?;

            let mut spawn_options = SpawnOptions::new("test");
            spawn_options.raw_args = vec!["--version".to_string()];

            let outcome = $manager.spawn($agent, spawn_options)?;
            let combined = format!("{}{}", outcome.stdout, outcome.stderr);
            let mentions_version = combined.to_lowercase().contains("version");
            assert!(
                mentions_version
                    || combined.contains($needle)
                    || outcome.status.code() == Some(0),
                "{} --version failed: {}",
                $label,
                combined
            );
        }};
    }

    let scratch = tempfile::tempdir()?;
    let manager = AgentManager::new(scratch.path().join("bin"))?;

    // Same order as before: Claude, then OpenCode, then Amp.
    check_version_flag!(manager, AgentId::Claude, "Claude", "claude");
    check_version_flag!(manager, AgentId::Opencode, "OpenCode", "opencode");
    check_version_flag!(manager, AgentId::Amp, "Amp", "amp");

    Ok(())
}