llmx-rs/core/src/unified_exec/mod.rs

//! Unified Exec: interactive PTY execution orchestrated with approvals + sandboxing.
//!
//! Responsibilities
//! - Manages interactive PTY sessions (create, reuse, buffer output with caps).
//! - Uses the shared ToolOrchestrator to handle approval, sandbox selection, and
//!   retry semantics in a single, descriptive flow.
//! - Spawns the PTY from a sandbox‑transformed `ExecEnv`; on sandbox denial,
//!   retries without sandbox when policy allows (no re‑prompt thanks to caching).
//! - Uses the shared `is_likely_sandbox_denied` heuristic to keep denial messages
//!   consistent with other exec paths.
//!
//! Flow at a glance (open session)
//! 1) Build a small request `{ command, cwd }`.
//! 2) Orchestrator: approval (bypass/cache/prompt) → select sandbox → run.
//! 3) Runtime: transform `CommandSpec` → `ExecEnv` → spawn PTY.
//! 4) If denial, orchestrator retries with `SandboxType::None`.
//! 5) Session is returned with streaming output + metadata.
//!
//! This keeps policy logic and user interaction centralized while the PTY/session
//! concerns remain isolated here. The implementation is split between:
//! - `session.rs`: PTY session lifecycle + output buffering.
//! - `session_manager.rs`: orchestration (approvals, sandboxing, reuse) and request handling.

use std::collections::HashMap;
use std::path::PathBuf;
use std::sync::Arc;
use std::sync::atomic::AtomicI32;
use std::time::Duration;

use rand::Rng;
use rand::rng;
use tokio::sync::Mutex;

use crate::codex::Session;
use crate::codex::TurnContext;

mod errors;
mod session;
mod session_manager;

pub(crate) use errors::UnifiedExecError;
pub(crate) use session::UnifiedExecSession;

/// Yield time (ms) used by `clamp_yield_time` when the caller supplies none.
pub(crate) const DEFAULT_YIELD_TIME_MS: u64 = 10_000;
/// Lower bound (ms) that `clamp_yield_time` enforces on caller-supplied values.
pub(crate) const MIN_YIELD_TIME_MS: u64 = 250;
/// Upper bound (ms) that `clamp_yield_time` enforces on caller-supplied values.
pub(crate) const MAX_YIELD_TIME_MS: u64 = 30_000;
/// Token budget used by `resolve_max_tokens` when the caller supplies none.
pub(crate) const DEFAULT_MAX_OUTPUT_TOKENS: usize = 10_000;
/// Cap on buffered session output; the `push_chunk` test below expects the
/// buffer's `total_bytes` to stay at this value once it is exceeded.
pub(crate) const UNIFIED_EXEC_OUTPUT_MAX_BYTES: usize = 1024 * 1024; // 1 MiB

/// Per-call context handed to the session manager together with an exec
/// request: the owning session, the current turn, and the tool call id.
pub(crate) struct UnifiedExecContext {
    /// Shared handle to the session issuing the request.
    pub session: Arc<Session>,
    /// Shared handle to the turn context the request belongs to.
    pub turn: Arc<TurnContext>,
    /// Identifier of the tool call that triggered this execution.
    pub call_id: String,
}

impl UnifiedExecContext {
    pub fn new(session: Arc<Session>, turn: Arc<TurnContext>, call_id: String) -> Self {
        Self {
            session,
            turn,
            call_id,
        }
    }
}

/// Borrowed parameters for starting a command through unified exec.
#[derive(Debug)]
pub(crate) struct ExecCommandRequest<'a> {
    /// Command line to execute.
    pub command: &'a str,
    /// Shell used to run `command` (the tests pass `/bin/bash`).
    pub shell: &'a str,
    /// NOTE(review): presumably selects a login shell — confirm in `session_manager.rs`.
    pub login: bool,
    /// Requested yield time in milliseconds; `None` leaves the choice to the
    /// callee (see `clamp_yield_time` for the default and bounds).
    pub yield_time_ms: Option<u64>,
    /// Requested output token budget; `None` leaves the choice to the callee
    /// (see `resolve_max_tokens` for the default).
    pub max_output_tokens: Option<usize>,
    /// Optional working directory for the command.
    pub workdir: Option<PathBuf>,
}

/// Borrowed parameters for sending input to an already-open session.
#[derive(Debug)]
pub(crate) struct WriteStdinRequest<'a> {
    /// Id of the target session, as returned in `UnifiedExecResponse::session_id`.
    pub session_id: i32,
    /// Text to write; the tests pass an empty string to poll for pending output.
    pub input: &'a str,
    /// Requested yield time in milliseconds; `None` leaves the choice to the
    /// callee (see `clamp_yield_time` for the default and bounds).
    pub yield_time_ms: Option<u64>,
    /// Requested output token budget; `None` leaves the choice to the callee
    /// (see `resolve_max_tokens` for the default).
    pub max_output_tokens: Option<usize>,
}

/// Result of an `exec_command` or `write_stdin` call.
#[derive(Debug, Clone, PartialEq)]
pub(crate) struct UnifiedExecResponse {
    /// Call id associated with this response's events.
    pub event_call_id: String,
    /// Identifier for this chunk of output (see `generate_chunk_id`).
    pub chunk_id: String,
    /// Wall-clock duration reported for the call.
    pub wall_time: Duration,
    /// Output text returned to the caller.
    pub output: String,
    /// `Some(id)` when a session stays open for further `write_stdin` calls;
    /// `None` when the command completed and no session was retained.
    pub session_id: Option<i32>,
    /// Exit code of the process, when one is available.
    pub exit_code: Option<i32>,
    /// NOTE(review): presumably the pre-truncation token count from
    /// `truncate_output_to_tokens` (`None` when nothing was truncated) — confirm
    /// in `session_manager.rs`.
    pub original_token_count: Option<usize>,
}

/// Registry of open unified-exec sessions, keyed by session id.
///
/// The request-handling methods live in `session_manager.rs`.
#[derive(Default)]
pub(crate) struct UnifiedExecSessionManager {
    /// Counter from which new session ids are drawn.
    next_session_id: AtomicI32,
    /// Currently tracked sessions; the tests expect completed sessions to be
    /// absent from this map.
    sessions: Mutex<HashMap<i32, SessionEntry>>,
}

/// Bookkeeping stored per open session in `UnifiedExecSessionManager::sessions`.
struct SessionEntry {
    /// The PTY-backed session itself.
    session: session::UnifiedExecSession,
    /// Session that opened this entry.
    session_ref: Arc<Session>,
    /// Turn context in which this entry was opened.
    turn_ref: Arc<TurnContext>,
    /// Tool call id that opened this entry.
    call_id: String,
    /// Command the session was started with.
    command: String,
    /// Working directory the command was started in.
    cwd: PathBuf,
    /// Instant recorded when the session was started.
    started_at: tokio::time::Instant,
}

/// Normalizes a caller-supplied yield time (milliseconds).
///
/// A missing value resolves to `DEFAULT_YIELD_TIME_MS`; a supplied value is
/// pinned into the inclusive range `MIN_YIELD_TIME_MS..=MAX_YIELD_TIME_MS`.
pub(crate) fn clamp_yield_time(yield_time_ms: Option<u64>) -> u64 {
    yield_time_ms.map_or(DEFAULT_YIELD_TIME_MS, |requested| {
        requested.clamp(MIN_YIELD_TIME_MS, MAX_YIELD_TIME_MS)
    })
}

/// Picks the effective output token budget.
///
/// A supplied value is returned untouched (including `0`); a missing value
/// resolves to `DEFAULT_MAX_OUTPUT_TOKENS`.
pub(crate) fn resolve_max_tokens(max_tokens: Option<usize>) -> usize {
    let Some(limit) = max_tokens else {
        return DEFAULT_MAX_OUTPUT_TOKENS;
    };
    limit
}

/// Produces a random chunk identifier: six lowercase hexadecimal digits.
///
/// Each digit is drawn independently from the generator returned by `rng()`.
pub(crate) fn generate_chunk_id() -> String {
    const CHUNK_ID_DIGITS: usize = 6;

    let mut source = rng();
    let mut chunk_id = String::with_capacity(CHUNK_ID_DIGITS);
    for _ in 0..CHUNK_ID_DIGITS {
        // A value in 0..16 formats to exactly one hex digit.
        let nibble = source.random_range(0..16);
        chunk_id.push_str(&format!("{nibble:x}"));
    }
    chunk_id
}

/// Truncates `output` in the middle so that at most `max_tokens` tokens of the
/// original text remain.
///
/// A "token" is approximated here as one Unicode scalar value (`char`); no
/// model tokenizer is involved.
///
/// Returns `(text, original_token_count)`:
/// - Output that fits within `max_tokens` is returned unchanged, paired with
///   `None`.
/// - Otherwise the first and last `max_tokens / 2` tokens are kept and joined
///   by a `…N tokens truncated…` marker, where `N` is the number of tokens
///   dropped; `Some(total)` carries the token count of the original output.
/// - When the budget is too small to keep a token on each side (`max_tokens`
///   of 0 or 1) only the marker is returned and `N` is the full token count,
///   since nothing from the original output is retained.
///
/// The marker itself is not counted against `max_tokens`.
pub(crate) fn truncate_output_to_tokens(
    output: &str,
    max_tokens: usize,
) -> (String, Option<usize>) {
    let total_tokens = output.chars().count();

    // A zero budget always yields the marker, even for empty output.
    if max_tokens == 0 {
        return (format!("…{total_tokens} tokens truncated…"), Some(total_tokens));
    }

    if total_tokens <= max_tokens {
        return (output.to_string(), None);
    }

    let half = max_tokens / 2;
    if half == 0 {
        // max_tokens == 1: no token can be kept on either side, so every token
        // is dropped and the marker must report the full count.
        return (format!("…{total_tokens} tokens truncated…"), Some(total_tokens));
    }

    // total_tokens > max_tokens >= 2 * half, so both offsets exist and the
    // head and tail slices cannot overlap. Offsets come from `char_indices`,
    // which guarantees they fall on UTF-8 character boundaries.
    let head_end = output
        .char_indices()
        .nth(half)
        .map_or(output.len(), |(offset, _)| offset);
    let tail_start = output
        .char_indices()
        .nth_back(half - 1)
        .map_or(0, |(offset, _)| offset);

    let truncated = total_tokens - half * 2;
    let marker = format!("…{truncated} tokens truncated…");

    let mut truncated_output =
        String::with_capacity(head_end + marker.len() + (output.len() - tail_start));
    truncated_output.push_str(&output[..head_end]);
    truncated_output.push_str(&marker);
    truncated_output.push_str(&output[tail_start..]);
    (truncated_output, Some(total_tokens))
}

// Integration-style tests for unified exec. They spawn real shells through the
// session manager, so the module is compiled on Unix only.
#[cfg(test)]
#[cfg(unix)]
mod tests {
    use super::*;
    use crate::codex::Session;
    use crate::codex::TurnContext;
    use crate::codex::make_session_and_context;
    use crate::protocol::AskForApproval;
    use crate::protocol::SandboxPolicy;
    use crate::unified_exec::ExecCommandRequest;
    use crate::unified_exec::WriteStdinRequest;
    use core_test_support::skip_if_sandbox;
    use std::sync::Arc;
    use tokio::time::Duration;

    use super::session::OutputBufferState;

    /// Builds a session/turn pair with approvals disabled and full access, so
    /// the tests never wait on an approval prompt or a sandbox.
    fn test_session_and_turn() -> (Arc<Session>, Arc<TurnContext>) {
        let (session, mut turn) = make_session_and_context();
        turn.approval_policy = AskForApproval::Never;
        turn.sandbox_policy = SandboxPolicy::DangerFullAccess;
        (Arc::new(session), Arc::new(turn))
    }

    /// Runs `cmd` through the session's unified exec manager using a
    /// `/bin/bash` login shell, the default token budget and no working
    /// directory override.
    async fn exec_command(
        session: &Arc<Session>,
        turn: &Arc<TurnContext>,
        cmd: &str,
        yield_time_ms: Option<u64>,
    ) -> Result<UnifiedExecResponse, UnifiedExecError> {
        let context =
            UnifiedExecContext::new(Arc::clone(session), Arc::clone(turn), "call".to_string());

        session
            .services
            .unified_exec_manager
            .exec_command(
                ExecCommandRequest {
                    command: cmd,
                    shell: "/bin/bash",
                    login: true,
                    yield_time_ms,
                    max_output_tokens: None,
                    workdir: None,
                },
                &context,
            )
            .await
    }

    /// Sends `input` to the open session `session_id` with the default token
    /// budget. An empty `input` is used by the tests to poll for output.
    async fn write_stdin(
        session: &Arc<Session>,
        session_id: i32,
        input: &str,
        yield_time_ms: Option<u64>,
    ) -> Result<UnifiedExecResponse, UnifiedExecError> {
        session
            .services
            .unified_exec_manager
            .write_stdin(WriteStdinRequest {
                session_id,
                input,
                yield_time_ms,
                max_output_tokens: None,
            })
            .await
    }

    /// Filling the buffer to its cap and then pushing two more single-byte
    /// chunks must keep all three chunks, hold the total at the cap, and trim
    /// exactly two bytes from the first chunk.
    #[test]
    fn push_chunk_trims_only_excess_bytes() {
        let mut buffer = OutputBufferState::default();
        buffer.push_chunk(vec![b'a'; UNIFIED_EXEC_OUTPUT_MAX_BYTES]);
        buffer.push_chunk(vec![b'b']);
        buffer.push_chunk(vec![b'c']);

        assert_eq!(buffer.total_bytes, UNIFIED_EXEC_OUTPUT_MAX_BYTES);
        let snapshot = buffer.snapshot();
        assert_eq!(snapshot.len(), 3);
        assert_eq!(
            snapshot.first().unwrap().len(),
            UNIFIED_EXEC_OUTPUT_MAX_BYTES - 2
        );
        assert_eq!(snapshot.get(2).unwrap(), &vec![b'c']);
        assert_eq!(snapshot.get(1).unwrap(), &vec![b'b']);
    }

    /// A variable exported in one `write_stdin` call must still be visible in
    /// a later call on the same session.
    #[tokio::test(flavor = "multi_thread", worker_threads = 2)]
    async fn unified_exec_persists_across_requests() -> anyhow::Result<()> {
        skip_if_sandbox!(Ok(()));

        let (session, turn) = test_session_and_turn();

        // An interactive shell does not exit on its own, so a session id is expected.
        let open_shell = exec_command(&session, &turn, "bash -i", Some(2_500)).await?;
        let session_id = open_shell.session_id.expect("expected session_id");

        write_stdin(
            &session,
            session_id,
            "export CODEX_INTERACTIVE_SHELL_VAR=codex\n",
            Some(2_500),
        )
        .await?;

        let out_2 = write_stdin(
            &session,
            session_id,
            "echo $CODEX_INTERACTIVE_SHELL_VAR\n",
            Some(2_500),
        )
        .await?;
        assert!(
            out_2.output.contains("codex"),
            "expected environment variable output"
        );

        Ok(())
    }

    /// State set in one open session must not leak into a separate short-lived
    /// command, and must remain available in the original session afterwards.
    #[tokio::test(flavor = "multi_thread", worker_threads = 2)]
    async fn multi_unified_exec_sessions() -> anyhow::Result<()> {
        skip_if_sandbox!(Ok(()));

        let (session, turn) = test_session_and_turn();

        let shell_a = exec_command(&session, &turn, "bash -i", Some(2_500)).await?;
        let session_a = shell_a.session_id.expect("expected session id");

        write_stdin(
            &session,
            session_a,
            "export CODEX_INTERACTIVE_SHELL_VAR=codex\n",
            Some(2_500),
        )
        .await?;

        // A second exec_command starts its own shell rather than reusing session_a.
        let out_2 = exec_command(
            &session,
            &turn,
            "echo $CODEX_INTERACTIVE_SHELL_VAR",
            Some(2_500),
        )
        .await?;
        assert!(
            out_2.session_id.is_none(),
            "short command should not retain a session"
        );
        assert!(
            !out_2.output.contains("codex"),
            "short command should run in a fresh shell"
        );

        let out_3 = write_stdin(
            &session,
            session_a,
            "echo $CODEX_INTERACTIVE_SHELL_VAR\n",
            Some(2_500),
        )
        .await?;
        assert!(
            out_3.output.contains("codex"),
            "session should preserve state"
        );

        Ok(())
    }

    /// A call that yields before the command finishes returns incomplete
    /// output; a later poll on the same session retrieves the rest.
    #[tokio::test]
    async fn unified_exec_timeouts() -> anyhow::Result<()> {
        skip_if_sandbox!(Ok(()));

        let (session, turn) = test_session_and_turn();

        let open_shell = exec_command(&session, &turn, "bash -i", Some(2_500)).await?;
        let session_id = open_shell.session_id.expect("expected session id");

        write_stdin(
            &session,
            session_id,
            "export CODEX_INTERACTIVE_SHELL_VAR=codex\n",
            Some(2_500),
        )
        .await?;

        // The requested yield time is far shorter than the 5 s sleep, so the
        // echo cannot have run by the time this call returns.
        let out_2 = write_stdin(
            &session,
            session_id,
            "sleep 5 && echo $CODEX_INTERACTIVE_SHELL_VAR\n",
            Some(10),
        )
        .await?;
        assert!(
            !out_2.output.contains("codex"),
            "timeout too short should yield incomplete output"
        );

        // Wait longer than the 5 s sleep so the echo has completed.
        tokio::time::sleep(Duration::from_secs(7)).await;

        // Empty input: poll the session for buffered output only.
        let out_3 = write_stdin(&session, session_id, "", Some(100)).await?;

        assert!(
            out_3.output.contains("codex"),
            "subsequent poll should retrieve output"
        );

        Ok(())
    }

    /// A yield time above `MAX_YIELD_TIME_MS` must still let a quick command
    /// complete without retaining a session.
    #[tokio::test]
    #[ignore] // Ignored until we have a better way to test this.
    async fn requests_with_large_timeout_are_capped() -> anyhow::Result<()> {
        let (session, turn) = test_session_and_turn();

        let result = exec_command(&session, &turn, "echo codex", Some(120_000)).await?;

        assert!(result.session_id.is_none());
        assert!(result.output.contains("codex"));

        Ok(())
    }

    /// A command that finishes within the yield window must return no session
    /// id and leave the manager's session map empty.
    #[tokio::test]
    #[ignore] // Ignored until we have a better way to test this.
    async fn completed_commands_do_not_persist_sessions() -> anyhow::Result<()> {
        let (session, turn) = test_session_and_turn();
        let result = exec_command(&session, &turn, "echo codex", Some(2_500)).await?;

        assert!(
            result.session_id.is_none(),
            "completed command should not retain session"
        );
        assert!(result.output.contains("codex"));

        assert!(
            session
                .services
                .unified_exec_manager
                .sessions
                .lock()
                .await
                .is_empty()
        );

        Ok(())
    }

    /// After the shell exits, writing to its session id must fail with
    /// `UnknownSessionId` and the id must be gone from the session map.
    #[tokio::test(flavor = "multi_thread", worker_threads = 2)]
    async fn reusing_completed_session_returns_unknown_session() -> anyhow::Result<()> {
        skip_if_sandbox!(Ok(()));

        let (session, turn) = test_session_and_turn();

        let open_shell = exec_command(&session, &turn, "bash -i", Some(2_500)).await?;
        let session_id = open_shell.session_id.expect("expected session id");

        write_stdin(&session, session_id, "exit\n", Some(2_500)).await?;

        // Short pause before probing the session that was just told to exit.
        tokio::time::sleep(Duration::from_millis(200)).await;

        let err = write_stdin(&session, session_id, "", Some(100))
            .await
            .expect_err("expected unknown session error");

        match err {
            UnifiedExecError::UnknownSessionId { session_id: err_id } => {
                assert_eq!(err_id, session_id);
            }
            other => panic!("expected UnknownSessionId, got {other:?}"),
        }

        assert!(
            !session
                .services
                .unified_exec_manager
                .sessions
                .lock()
                .await
                .contains_key(&session_id)
        );

        Ok(())
    }
}
-												chore: rework tools execution workflow (#5278)

Re-work the tool execution flow. Read `orchestrator.rs` to understand
the structure
											
										
										
											2025-10-20 20:57:37 +01:00
+								//! Unified Exec: interactive PTY execution orchestrated with approvals + sandboxing.
 								//!
 								//! Responsibilities
 								//! - Manages interactive PTY sessions (create, reuse, buffer output with caps).
 								//! - Uses the shared ToolOrchestrator to handle approval, sandbox selection, and
 								//!   retry semantics in a single, descriptive flow.
 								//! - Spawns the PTY from a sandbox‑transformed `ExecEnv`; on sandbox denial,
 								//!   retries without sandbox when policy allows (no re‑prompt thanks to caching).
 								//! - Uses the shared `is_likely_sandbox_denied` heuristic to keep denial messages
 								//!   consistent with other exec paths.
 								//!
 								//! Flow at a glance (open session)
 								//! 1) Build a small request `{ command, cwd }`.
 								//! 2) Orchestrator: approval (bypass/cache/prompt) → select sandbox → run.
 								//! 3) Runtime: transform `CommandSpec` → `ExecEnv` → spawn PTY.
 								//! 4) If denial, orchestrator retries with `SandboxType::None`.
 								//! 5) Session is returned with streaming output + metadata.
 								//!
 								//! This keeps policy logic and user interaction centralized while the PTY/session
 								//! concerns remain isolated here. The implementation is split between:
 								//! - `session.rs`: PTY session lifecycle + output buffering.
 								//! - `session_manager.rs`: orchestration (approvals, sandboxing, reuse) and request handling.
-												Unified execution (#3288)

## Unified PTY-Based Exec Tool

Note: this requires the following flag to be set in the config:
`use_experimental_unified_exec_tool=true`

- Adds a PTY-backed interactive exec feature (“unified_exec”) with
session reuse via
  session_id, bounded output (128 KiB), and timeout clamping (≤ 60 s).
- Protocol: introduces ResponseItem::UnifiedExec { session_id,
arguments, timeout_ms }.
- Tools: exposes unified_exec as a function tool (Responses API);
excluded from Chat
  Completions payload while still supported in tool lists.
- Path handling: resolves commands via PATH (or explicit paths), with
UTF‑8/newline‑aware
  truncation (truncate_middle).
- Tests: cover command parsing, path resolution, session
persistence/cleanup, multi‑session
  isolation, timeouts, and truncation behavior.
											
										
										
											2025-09-10 17:38:11 -07:00
+								use std::collections::HashMap;
-												feat: end events on unified exec (#5551)


											
										
										
											2025-10-23 18:51:34 +01:00
+								use std::path::PathBuf;
 								use std::sync::Arc;
-												Unified execution (#3288)

## Unified PTY-Based Exec Tool

Note: this requires to have this flag in the config:
`use_experimental_unified_exec_tool=true`

- Adds a PTY-backed interactive exec feature (“unified_exec”) with
session reuse via
  session_id, bounded output (128 KiB), and timeout clamping (≤ 60 s).
- Protocol: introduces ResponseItem::UnifiedExec { session_id,
arguments, timeout_ms }.
- Tools: exposes unified_exec as a function tool (Responses API);
excluded from Chat
  Completions payload while still supported in tool lists.
- Path handling: resolves commands via PATH (or explicit paths), with
UTF‑8/newline‑aware
  truncation (truncate_middle).
- Tests: cover command parsing, path resolution, session
persistence/cleanup, multi‑session
  isolation, timeouts, and truncation behavior.
											
										
										
											2025-09-10 17:38:11 -07:00
+								use std::sync::atomic::AtomicI32;
-												chore: align unified_exec (#5442)

Align `unified_exec` with b implementation
											
										
										
											2025-10-22 11:50:18 +01:00
+								use std::time::Duration;
-												chore: rework tools execution workflow (#5278)

Re-work the tool execution flow. Read `orchestrator.rs` to understand
the structure
											
										
										
											2025-10-20 20:57:37 +01:00
-												chore: align unified_exec (#5442)

Align `unified_exec` with b implementation
											
										
										
											2025-10-22 11:50:18 +01:00
+								use rand::Rng;
 								use rand::rng;
-												Unified execution (#3288)

## Unified PTY-Based Exec Tool

Note: this requires to have this flag in the config:
`use_experimental_unified_exec_tool=true`

- Adds a PTY-backed interactive exec feature (“unified_exec”) with
session reuse via
  session_id, bounded output (128 KiB), and timeout clamping (≤ 60 s).
- Protocol: introduces ResponseItem::UnifiedExec { session_id,
arguments, timeout_ms }.
- Tools: exposes unified_exec as a function tool (Responses API);
excluded from Chat
  Completions payload while still supported in tool lists.
- Path handling: resolves commands via PATH (or explicit paths), with
UTF‑8/newline‑aware
  truncation (truncate_middle).
- Tests: cover command parsing, path resolution, session
persistence/cleanup, multi‑session
  isolation, timeouts, and truncation behavior.
											
										
										
											2025-09-10 17:38:11 -07:00
+								use tokio::sync::Mutex;
-												chore: rework tools execution workflow (#5278)

Re-work the tool execution flow. Read `orchestrator.rs` to understand
the structure
											
										
										
											2025-10-20 20:57:37 +01:00
+								use crate::codex::Session;
 								use crate::codex::TurnContext;
-												Unified execution (#3288)

## Unified PTY-Based Exec Tool

Note: this requires to have this flag in the config:
`use_experimental_unified_exec_tool=true`

- Adds a PTY-backed interactive exec feature (“unified_exec”) with
session reuse via
  session_id, bounded output (128 KiB), and timeout clamping (≤ 60 s).
- Protocol: introduces ResponseItem::UnifiedExec { session_id,
arguments, timeout_ms }.
- Tools: exposes unified_exec as a function tool (Responses API);
excluded from Chat
  Completions payload while still supported in tool lists.
- Path handling: resolves commands via PATH (or explicit paths), with
UTF‑8/newline‑aware
  truncation (truncate_middle).
- Tests: cover command parsing, path resolution, session
persistence/cleanup, multi‑session
  isolation, timeouts, and truncation behavior.
											
										
										
											2025-09-10 17:38:11 -07:00
 								mod errors;
-												chore: rework tools execution workflow (#5278)

Re-work the tool execution flow. Read `orchestrator.rs` to understand
the structure
											
										
										
											2025-10-20 20:57:37 +01:00
+								mod session;
 								mod session_manager;
-												Unified execution (#3288)

## Unified PTY-Based Exec Tool

Note: this requires to have this flag in the config:
`use_experimental_unified_exec_tool=true`

- Adds a PTY-backed interactive exec feature (“unified_exec”) with
session reuse via
  session_id, bounded output (128 KiB), and timeout clamping (≤ 60 s).
- Protocol: introduces ResponseItem::UnifiedExec { session_id,
arguments, timeout_ms }.
- Tools: exposes unified_exec as a function tool (Responses API);
excluded from Chat
  Completions payload while still supported in tool lists.
- Path handling: resolves commands via PATH (or explicit paths), with
UTF‑8/newline‑aware
  truncation (truncate_middle).
- Tests: cover command parsing, path resolution, session
persistence/cleanup, multi‑session
  isolation, timeouts, and truncation behavior.
											
										
										
											2025-09-10 17:38:11 -07:00
 								pub(crate) use errors::UnifiedExecError;
-												chore: rework tools execution workflow (#5278)

Re-work the tool execution flow. Read `orchestrator.rs` to understand
the structure
											
										
										
											2025-10-20 20:57:37 +01:00
+								pub(crate) use session::UnifiedExecSession;
-												Unified execution (#3288)

## Unified PTY-Based Exec Tool

Note: this requires to have this flag in the config:
`use_experimental_unified_exec_tool=true`

- Adds a PTY-backed interactive exec feature (“unified_exec”) with
session reuse via
  session_id, bounded output (128 KiB), and timeout clamping (≤ 60 s).
- Protocol: introduces ResponseItem::UnifiedExec { session_id,
arguments, timeout_ms }.
- Tools: exposes unified_exec as a function tool (Responses API);
excluded from Chat
  Completions payload while still supported in tool lists.
- Path handling: resolves commands via PATH (or explicit paths), with
UTF‑8/newline‑aware
  truncation (truncate_middle).
- Tests: cover command parsing, path resolution, session
persistence/cleanup, multi‑session
  isolation, timeouts, and truncation behavior.
											
										
										
											2025-09-10 17:38:11 -07:00
-												chore: align unified_exec (#5442)

Align `unified_exec` with b implementation
											
										
										
											2025-10-22 11:50:18 +01:00
+								pub(crate) const DEFAULT_YIELD_TIME_MS: u64 = 10_000;
 								pub(crate) const MIN_YIELD_TIME_MS: u64 = 250;
 								pub(crate) const MAX_YIELD_TIME_MS: u64 = 30_000;
 								pub(crate) const DEFAULT_MAX_OUTPUT_TOKENS: usize = 10_000;
 								pub(crate) const UNIFIED_EXEC_OUTPUT_MAX_BYTES: usize = 1024 * 1024; // 1 MiB
-												Unified execution (#3288)

## Unified PTY-Based Exec Tool

Note: this requires to have this flag in the config:
`use_experimental_unified_exec_tool=true`

- Adds a PTY-backed interactive exec feature (“unified_exec”) with
session reuse via
  session_id, bounded output (128 KiB), and timeout clamping (≤ 60 s).
- Protocol: introduces ResponseItem::UnifiedExec { session_id,
arguments, timeout_ms }.
- Tools: exposes unified_exec as a function tool (Responses API);
excluded from Chat
  Completions payload while still supported in tool lists.
- Path handling: resolves commands via PATH (or explicit paths), with
UTF‑8/newline‑aware
  truncation (truncate_middle).
- Tests: cover command parsing, path resolution, session
persistence/cleanup, multi‑session
  isolation, timeouts, and truncation behavior.
											
										
										
											2025-09-10 17:38:11 -07:00
-												feat: end events on unified exec (#5551)


											
										
										
											2025-10-23 18:51:34 +01:00
+								pub(crate) struct UnifiedExecContext {
 								    pub session: Arc<Session>,
 								    pub turn: Arc<TurnContext>,
 								    pub call_id: String,
 								}
 								impl UnifiedExecContext {
 								    pub fn new(session: Arc<Session>, turn: Arc<TurnContext>, call_id: String) -> Self {
 								        Self {
 								            session,
 								            turn,
 								            call_id,
 								        }
 								    }
-												chore: rework tools execution workflow (#5278)

Re-work the tool execution flow. Read `orchestrator.rs` to understand
the structure
											
										
										
											2025-10-20 20:57:37 +01:00
+								}
-												Unified execution (#3288)

## Unified PTY-Based Exec Tool

Note: this requires to have this flag in the config:
`use_experimental_unified_exec_tool=true`

- Adds a PTY-backed interactive exec feature (“unified_exec”) with
session reuse via
  session_id, bounded output (128 KiB), and timeout clamping (≤ 60 s).
- Protocol: introduces ResponseItem::UnifiedExec { session_id,
arguments, timeout_ms }.
- Tools: exposes unified_exec as a function tool (Responses API);
excluded from Chat
  Completions payload while still supported in tool lists.
- Path handling: resolves commands via PATH (or explicit paths), with
UTF‑8/newline‑aware
  truncation (truncate_middle).
- Tests: cover command parsing, path resolution, session
persistence/cleanup, multi‑session
  isolation, timeouts, and truncation behavior.
											
										
										
											2025-09-10 17:38:11 -07:00
+								#[derive(Debug)]
-												chore: align unified_exec (#5442)

Align `unified_exec` with b implementation
											
										
										
											2025-10-22 11:50:18 +01:00
+								pub(crate) struct ExecCommandRequest<'a> {
 								    pub command: &'a str,
 								    pub shell: &'a str,
 								    pub login: bool,
 								    pub yield_time_ms: Option<u64>,
 								    pub max_output_tokens: Option<usize>,
-												feat: add workdir to unified_exec (#6466)


											
										
										
											2025-11-10 19:53:36 +00:00
+								    pub workdir: Option<PathBuf>,
-												chore: align unified_exec (#5442)

Align `unified_exec` with b implementation
											
										
										
											2025-10-22 11:50:18 +01:00
+								}
 								#[derive(Debug)]
 								pub(crate) struct WriteStdinRequest<'a> {
 								    pub session_id: i32,
 								    pub input: &'a str,
 								    pub yield_time_ms: Option<u64>,
 								    pub max_output_tokens: Option<usize>,
-												Unified execution (#3288)

## Unified PTY-Based Exec Tool

Note: this requires to have this flag in the config:
`use_experimental_unified_exec_tool=true`

- Adds a PTY-backed interactive exec feature (“unified_exec”) with
session reuse via
  session_id, bounded output (128 KiB), and timeout clamping (≤ 60 s).
- Protocol: introduces ResponseItem::UnifiedExec { session_id,
arguments, timeout_ms }.
- Tools: exposes unified_exec as a function tool (Responses API);
excluded from Chat
  Completions payload while still supported in tool lists.
- Path handling: resolves commands via PATH (or explicit paths), with
UTF‑8/newline‑aware
  truncation (truncate_middle).
- Tests: cover command parsing, path resolution, session
persistence/cleanup, multi‑session
  isolation, timeouts, and truncation behavior.
											
										
										
											2025-09-10 17:38:11 -07:00
+								}
 								#[derive(Debug, Clone, PartialEq)]
-												chore: align unified_exec (#5442)

Align `unified_exec` with b implementation
											
										
										
											2025-10-22 11:50:18 +01:00
+								pub(crate) struct UnifiedExecResponse {
-												feat: end events on unified exec (#5551)


											
										
										
											2025-10-23 18:51:34 +01:00
+								    pub event_call_id: String,
-												chore: align unified_exec (#5442)

Align `unified_exec` with b implementation
											
										
										
											2025-10-22 11:50:18 +01:00
+								    pub chunk_id: String,
 								    pub wall_time: Duration,
-												Unified execution (#3288)

## Unified PTY-Based Exec Tool

Note: this requires to have this flag in the config:
`use_experimental_unified_exec_tool=true`

- Adds a PTY-backed interactive exec feature (“unified_exec”) with
session reuse via
  session_id, bounded output (128 KiB), and timeout clamping (≤ 60 s).
- Protocol: introduces ResponseItem::UnifiedExec { session_id,
arguments, timeout_ms }.
- Tools: exposes unified_exec as a function tool (Responses API);
excluded from Chat
  Completions payload while still supported in tool lists.
- Path handling: resolves commands via PATH (or explicit paths), with
UTF‑8/newline‑aware
  truncation (truncate_middle).
- Tests: cover command parsing, path resolution, session
persistence/cleanup, multi‑session
  isolation, timeouts, and truncation behavior.
											
										
										
											2025-09-10 17:38:11 -07:00
+								    pub output: String,
-												chore: align unified_exec (#5442)

Align `unified_exec` with b implementation
											
										
										
											2025-10-22 11:50:18 +01:00
+								    pub session_id: Option<i32>,
 								    pub exit_code: Option<i32>,
 								    pub original_token_count: Option<usize>,
-												Unified execution (#3288)

## Unified PTY-Based Exec Tool

Note: this requires to have this flag in the config:
`use_experimental_unified_exec_tool=true`

- Adds a PTY-backed interactive exec feature (“unified_exec”) with
session reuse via
  session_id, bounded output (128 KiB), and timeout clamping (≤ 60 s).
- Protocol: introduces ResponseItem::UnifiedExec { session_id,
arguments, timeout_ms }.
- Tools: exposes unified_exec as a function tool (Responses API);
excluded from Chat
  Completions payload while still supported in tool lists.
- Path handling: resolves commands via PATH (or explicit paths), with
UTF‑8/newline‑aware
  truncation (truncate_middle).
- Tests: cover command parsing, path resolution, session
persistence/cleanup, multi‑session
  isolation, timeouts, and truncation behavior.
											
										
										
											2025-09-10 17:38:11 -07:00
+								}
-												feat: end events on unified exec (#5551)


											
										
										
											2025-10-23 18:51:34 +01:00
+								#[derive(Default)]
-												Unified execution (#3288)

## Unified PTY-Based Exec Tool

Note: this requires to have this flag in the config:
`use_experimental_unified_exec_tool=true`

- Adds a PTY-backed interactive exec feature (“unified_exec”) with
session reuse via
  session_id, bounded output (128 KiB), and timeout clamping (≤ 60 s).
- Protocol: introduces ResponseItem::UnifiedExec { session_id,
arguments, timeout_ms }.
- Tools: exposes unified_exec as a function tool (Responses API);
excluded from Chat
  Completions payload while still supported in tool lists.
- Path handling: resolves commands via PATH (or explicit paths), with
UTF‑8/newline‑aware
  truncation (truncate_middle).
- Tests: cover command parsing, path resolution, session
persistence/cleanup, multi‑session
  isolation, timeouts, and truncation behavior.
											
										
										
											2025-09-10 17:38:11 -07:00
+								pub(crate) struct UnifiedExecSessionManager {
 								    next_session_id: AtomicI32,
-												feat: end events on unified exec (#5551)


											
										
										
											2025-10-23 18:51:34 +01:00
+								    sessions: Mutex<HashMap<i32, SessionEntry>>,
 								}
 								struct SessionEntry {
 								    session: session::UnifiedExecSession,
 								    session_ref: Arc<Session>,
 								    turn_ref: Arc<TurnContext>,
 								    call_id: String,
 								    command: String,
 								    cwd: PathBuf,
 								    started_at: tokio::time::Instant,
-												Unified execution (#3288)

## Unified PTY-Based Exec Tool

Note: this requires to have this flag in the config:
`use_experimental_unified_exec_tool=true`

- Adds a PTY-backed interactive exec feature (“unified_exec”) with
session reuse via
  session_id, bounded output (128 KiB), and timeout clamping (≤ 60 s).
- Protocol: introduces ResponseItem::UnifiedExec { session_id,
arguments, timeout_ms }.
- Tools: exposes unified_exec as a function tool (Responses API);
excluded from Chat
  Completions payload while still supported in tool lists.
- Path handling: resolves commands via PATH (or explicit paths), with
UTF‑8/newline‑aware
  truncation (truncate_middle).
- Tests: cover command parsing, path resolution, session
persistence/cleanup, multi‑session
  isolation, timeouts, and truncation behavior.
											
										
										
											2025-09-10 17:38:11 -07:00
+								}
-												chore: align unified_exec (#5442)

Align `unified_exec` with b implementation
											
										
										
											2025-10-22 11:50:18 +01:00
+								pub(crate) fn clamp_yield_time(yield_time_ms: Option<u64>) -> u64 {
 								    match yield_time_ms {
 								        Some(value) => value.clamp(MIN_YIELD_TIME_MS, MAX_YIELD_TIME_MS),
 								        None => DEFAULT_YIELD_TIME_MS,
 								    }
 								}
 								/// Picks the output token budget for a request.
 								///
 								/// Returns the caller-supplied `max_tokens` unchanged when present, and
 								/// `DEFAULT_MAX_OUTPUT_TOKENS` otherwise.
 								pub(crate) fn resolve_max_tokens(max_tokens: Option<usize>) -> usize {
 								    let Some(requested) = max_tokens else {
 								        return DEFAULT_MAX_OUTPUT_TOKENS;
 								    };
 								    requested
 								}
 								/// Builds a random identifier made of six lowercase hexadecimal digits.
 								///
 								/// Each digit is drawn independently from `0..16` using the generator
 								/// returned by `rng()`.
 								pub(crate) fn generate_chunk_id() -> String {
 								    let mut generator = rng();
 								    let mut chunk_id = String::new();
 								    for _ in 0..6 {
 								        let nibble = generator.random_range(0..16);
 								        chunk_id.push_str(&format!("{nibble:x}"));
 								    }
 								    chunk_id
 								}
 								/// Shortens `output` by cutting out its middle so that roughly `max_tokens`
 								/// "tokens" remain, where a token is approximated as one `char`.
 								///
 								/// Returns the (possibly shortened) text together with the original token
 								/// count when truncation happened, or `None` when `output` was returned
 								/// unchanged.
 								///
 								/// - If `output` already fits within `max_tokens` (including an empty `output`
 								///   with a budget of `0`), it is returned as-is with `None`.
 								/// - If the budget is too small to keep any text (`max_tokens` of `0` or `1`),
 								///   only the marker is returned and it reports every token as truncated.
 								/// - Otherwise the first and last `max_tokens / 2` chars are kept and a
 								///   `…N tokens truncated…` marker, with `N` the number of removed chars, is
 								///   placed between them. The marker itself is not counted against the budget.
 								pub(crate) fn truncate_output_to_tokens(
 								    output: &str,
 								    max_tokens: usize,
 								) -> (String, Option<usize>) {
 								    let total_tokens = output.chars().count();
 								    if total_tokens <= max_tokens {
 								        return (output.to_string(), None);
 								    }

 								    let half = max_tokens / 2;
 								    if half == 0 {
 								        // No head or tail can be kept, so the whole output is dropped and the
 								        // marker must account for all of it.
 								        let message = format!("…{total_tokens} tokens truncated…");
 								        return (message, Some(total_tokens));
 								    }

 								    // `total_tokens > max_tokens >= half * 2`, so this cannot underflow.
 								    let truncated = total_tokens - half * 2;

 								    // Byte offsets of the cut points, always on char boundaries.
 								    let head_end = output
 								        .char_indices()
 								        .nth(half)
 								        .map_or(output.len(), |(idx, _)| idx);
 								    let tail_start = output
 								        .char_indices()
 								        .rev()
 								        .nth(half - 1)
 								        .map_or(0, |(idx, _)| idx);

 								    let marker = format!("…{truncated} tokens truncated…");
 								    let mut truncated_output =
 								        String::with_capacity(head_end + marker.len() + (output.len() - tail_start));
 								    truncated_output.push_str(&output[..head_end]);
 								    truncated_output.push_str(&marker);
 								    truncated_output.push_str(&output[tail_start..]);
 								    (truncated_output, Some(total_tokens))
 								}
-												chore: rework tools execution workflow (#5278)

Re-work the tool execution flow. Read `orchestrator.rs` to understand
the structure
											
										
										
											2025-10-20 20:57:37 +01:00
+								#[cfg(test)]
 								#[cfg(unix)]
 								mod tests {
 								    use super::*;
 								    use crate::codex::Session;
 								    use crate::codex::TurnContext;
 								    use crate::codex::make_session_and_context;
 								    use crate::protocol::AskForApproval;
 								    use crate::protocol::SandboxPolicy;
-												chore: align unified_exec (#5442)

Align `unified_exec` with b implementation
											
										
										
											2025-10-22 11:50:18 +01:00
+								    use crate::unified_exec::ExecCommandRequest;
 								    use crate::unified_exec::WriteStdinRequest;
-												chore: rework tools execution workflow (#5278)

Re-work the tool execution flow. Read `orchestrator.rs` to understand
the structure
											
										
										
											2025-10-20 20:57:37 +01:00
+								    use core_test_support::skip_if_sandbox;
 								    use std::sync::Arc;
 								    use tokio::time::Duration;
-												Unified execution (#3288)

## Unified PTY-Based Exec Tool

Note: this requires setting the following flag in the config:
`use_experimental_unified_exec_tool=true`

- Adds a PTY-backed interactive exec feature (“unified_exec”) with
session reuse via
  session_id, bounded output (128 KiB), and timeout clamping (≤ 60 s).
- Protocol: introduces ResponseItem::UnifiedExec { session_id,
arguments, timeout_ms }.
- Tools: exposes unified_exec as a function tool (Responses API);
excluded from Chat
  Completions payload while still supported in tool lists.
- Path handling: resolves commands via PATH (or explicit paths), with
UTF‑8/newline‑aware
  truncation (truncate_middle).
- Tests: cover command parsing, path resolution, session
persistence/cleanup, multi‑session
  isolation, timeouts, and truncation behavior.
											
										
										
											2025-09-10 17:38:11 -07:00
-												chore: rework tools execution workflow (#5278)

Re-work the tool execution flow. Read `orchestrator.rs` to understand
the structure
											
										
										
											2025-10-20 20:57:37 +01:00
+								    use super::session::OutputBufferState;
-												Unified execution (#3288)

## Unified PTY-Based Exec Tool

Note: this requires setting the following flag in the config:
`use_experimental_unified_exec_tool=true`

- Adds a PTY-backed interactive exec feature (“unified_exec”) with
session reuse via
  session_id, bounded output (128 KiB), and timeout clamping (≤ 60 s).
- Protocol: introduces ResponseItem::UnifiedExec { session_id,
arguments, timeout_ms }.
- Tools: exposes unified_exec as a function tool (Responses API);
excluded from Chat
  Completions payload while still supported in tool lists.
- Path handling: resolves commands via PATH (or explicit paths), with
UTF‑8/newline‑aware
  truncation (truncate_middle).
- Tests: cover command parsing, path resolution, session
persistence/cleanup, multi‑session
  isolation, timeouts, and truncation behavior.
											
										
										
											2025-09-10 17:38:11 -07:00
-												chore: rework tools execution workflow (#5278)

Re-work the tool execution flow. Read `orchestrator.rs` to understand
the structure
											
										
										
											2025-10-20 20:57:37 +01:00
+								    fn test_session_and_turn() -> (Arc<Session>, Arc<TurnContext>) {
 								        let (session, mut turn) = make_session_and_context();
 								        turn.approval_policy = AskForApproval::Never;
 								        turn.sandbox_policy = SandboxPolicy::DangerFullAccess;
 								        (Arc::new(session), Arc::new(turn))
-												Unified execution (#3288)

## Unified PTY-Based Exec Tool

Note: this requires setting the following flag in the config:
`use_experimental_unified_exec_tool=true`

- Adds a PTY-backed interactive exec feature (“unified_exec”) with
session reuse via
  session_id, bounded output (128 KiB), and timeout clamping (≤ 60 s).
- Protocol: introduces ResponseItem::UnifiedExec { session_id,
arguments, timeout_ms }.
- Tools: exposes unified_exec as a function tool (Responses API);
excluded from Chat
  Completions payload while still supported in tool lists.
- Path handling: resolves commands via PATH (or explicit paths), with
UTF‑8/newline‑aware
  truncation (truncate_middle).
- Tests: cover command parsing, path resolution, session
persistence/cleanup, multi‑session
  isolation, timeouts, and truncation behavior.
											
										
										
											2025-09-10 17:38:11 -07:00
+								    }
-												chore: align unified_exec (#5442)

Align `unified_exec` with b implementation
											
										
										
											2025-10-22 11:50:18 +01:00
+								    async fn exec_command(
-												chore: rework tools execution workflow (#5278)

Re-work the tool execution flow. Read `orchestrator.rs` to understand
the structure
											
										
										
											2025-10-20 20:57:37 +01:00
+								        session: &Arc<Session>,
 								        turn: &Arc<TurnContext>,
-												chore: align unified_exec (#5442)

Align `unified_exec` with b implementation
											
										
										
											2025-10-22 11:50:18 +01:00
+								        cmd: &str,
 								        yield_time_ms: Option<u64>,
 								    ) -> Result<UnifiedExecResponse, UnifiedExecError> {
-												feat: end events on unified exec (#5551)


											
										
										
											2025-10-23 18:51:34 +01:00
+								        let context =
 								            UnifiedExecContext::new(Arc::clone(session), Arc::clone(turn), "call".to_string());
-												Unified execution (#3288)

## Unified PTY-Based Exec Tool

Note: this requires setting the following flag in the config:
`use_experimental_unified_exec_tool=true`

- Adds a PTY-backed interactive exec feature (“unified_exec”) with
session reuse via
  session_id, bounded output (128 KiB), and timeout clamping (≤ 60 s).
- Protocol: introduces ResponseItem::UnifiedExec { session_id,
arguments, timeout_ms }.
- Tools: exposes unified_exec as a function tool (Responses API);
excluded from Chat
  Completions payload while still supported in tool lists.
- Path handling: resolves commands via PATH (or explicit paths), with
UTF‑8/newline‑aware
  truncation (truncate_middle).
- Tests: cover command parsing, path resolution, session
persistence/cleanup, multi‑session
  isolation, timeouts, and truncation behavior.
											
										
										
											2025-09-10 17:38:11 -07:00
-												chore: rework tools execution workflow (#5278)

Re-work the tool execution flow. Read `orchestrator.rs` to understand
the structure
											
										
										
											2025-10-20 20:57:37 +01:00
+								        session
 								            .services
 								            .unified_exec_manager
-												chore: align unified_exec (#5442)

Align `unified_exec` with b implementation
											
										
										
											2025-10-22 11:50:18 +01:00
+								            .exec_command(
 								                ExecCommandRequest {
 								                    command: cmd,
 								                    shell: "/bin/bash",
 								                    login: true,
 								                    yield_time_ms,
 								                    max_output_tokens: None,
-												feat: add workdir to unified_exec (#6466)


											
										
										
											2025-11-10 19:53:36 +00:00
+								                    workdir: None,
-												chore: rework tools execution workflow (#5278)

Re-work the tool execution flow. Read `orchestrator.rs` to understand
the structure
											
										
										
											2025-10-20 20:57:37 +01:00
+								                },
-												chore: align unified_exec (#5442)

Align `unified_exec` with b implementation
											
										
										
											2025-10-22 11:50:18 +01:00
+								                &context,
-												chore: rework tools execution workflow (#5278)

Re-work the tool execution flow. Read `orchestrator.rs` to understand
the structure
											
										
										
											2025-10-20 20:57:37 +01:00
+								            )
 								            .await
-												Unified execution (#3288)

## Unified PTY-Based Exec Tool

Note: this requires setting the following flag in the config:
`use_experimental_unified_exec_tool=true`

- Adds a PTY-backed interactive exec feature (“unified_exec”) with
session reuse via
  session_id, bounded output (128 KiB), and timeout clamping (≤ 60 s).
- Protocol: introduces ResponseItem::UnifiedExec { session_id,
arguments, timeout_ms }.
- Tools: exposes unified_exec as a function tool (Responses API);
excluded from Chat
  Completions payload while still supported in tool lists.
- Path handling: resolves commands via PATH (or explicit paths), with
UTF‑8/newline‑aware
  truncation (truncate_middle).
- Tests: cover command parsing, path resolution, session
persistence/cleanup, multi‑session
  isolation, timeouts, and truncation behavior.
											
										
										
											2025-09-10 17:38:11 -07:00
+								    }
-												chore: align unified_exec (#5442)

Align `unified_exec` with b implementation
											
										
										
											2025-10-22 11:50:18 +01:00
+								    async fn write_stdin(
 								        session: &Arc<Session>,
 								        session_id: i32,
 								        input: &str,
 								        yield_time_ms: Option<u64>,
 								    ) -> Result<UnifiedExecResponse, UnifiedExecError> {
 								        session
 								            .services
 								            .unified_exec_manager
 								            .write_stdin(WriteStdinRequest {
 								                session_id,
 								                input,
 								                yield_time_ms,
 								                max_output_tokens: None,
 								            })
 								            .await
 								    }
-												Unified execution (#3288)

## Unified PTY-Based Exec Tool

Note: this requires setting the following flag in the config:
`use_experimental_unified_exec_tool=true`

- Adds a PTY-backed interactive exec feature (“unified_exec”) with
session reuse via
  session_id, bounded output (128 KiB), and timeout clamping (≤ 60 s).
- Protocol: introduces ResponseItem::UnifiedExec { session_id,
arguments, timeout_ms }.
- Tools: exposes unified_exec as a function tool (Responses API);
excluded from Chat
  Completions payload while still supported in tool lists.
- Path handling: resolves commands via PATH (or explicit paths), with
UTF‑8/newline‑aware
  truncation (truncate_middle).
- Tests: cover command parsing, path resolution, session
persistence/cleanup, multi‑session
  isolation, timeouts, and truncation behavior.
											
										
										
											2025-09-10 17:38:11 -07:00
+								    #[test]
 								    fn push_chunk_trims_only_excess_bytes() {
 								        let mut buffer = OutputBufferState::default();
 								        buffer.push_chunk(vec![b'a'; UNIFIED_EXEC_OUTPUT_MAX_BYTES]);
 								        buffer.push_chunk(vec![b'b']);
 								        buffer.push_chunk(vec![b'c']);
 								        assert_eq!(buffer.total_bytes, UNIFIED_EXEC_OUTPUT_MAX_BYTES);
-												chore: rework tools execution workflow (#5278)

Re-work the tool execution flow. Read `orchestrator.rs` to understand
the structure
											
										
										
											2025-10-20 20:57:37 +01:00
+								        let snapshot = buffer.snapshot();
 								        assert_eq!(snapshot.len(), 3);
-												Unified execution (#3288)

## Unified PTY-Based Exec Tool

Note: this requires setting the following flag in the config:
`use_experimental_unified_exec_tool=true`

- Adds a PTY-backed interactive exec feature (“unified_exec”) with
session reuse via
  session_id, bounded output (128 KiB), and timeout clamping (≤ 60 s).
- Protocol: introduces ResponseItem::UnifiedExec { session_id,
arguments, timeout_ms }.
- Tools: exposes unified_exec as a function tool (Responses API);
excluded from Chat
  Completions payload while still supported in tool lists.
- Path handling: resolves commands via PATH (or explicit paths), with
UTF‑8/newline‑aware
  truncation (truncate_middle).
- Tests: cover command parsing, path resolution, session
persistence/cleanup, multi‑session
  isolation, timeouts, and truncation behavior.
											
										
										
											2025-09-10 17:38:11 -07:00
+								        assert_eq!(
-												chore: rework tools execution workflow (#5278)

Re-work the tool execution flow. Read `orchestrator.rs` to understand
the structure
											
										
										
											2025-10-20 20:57:37 +01:00
+								            snapshot.first().unwrap().len(),
-												Unified execution (#3288)

## Unified PTY-Based Exec Tool

Note: this requires setting the following flag in the config:
`use_experimental_unified_exec_tool=true`

- Adds a PTY-backed interactive exec feature (“unified_exec”) with
session reuse via
  session_id, bounded output (128 KiB), and timeout clamping (≤ 60 s).
- Protocol: introduces ResponseItem::UnifiedExec { session_id,
arguments, timeout_ms }.
- Tools: exposes unified_exec as a function tool (Responses API);
excluded from Chat
  Completions payload while still supported in tool lists.
- Path handling: resolves commands via PATH (or explicit paths), with
UTF‑8/newline‑aware
  truncation (truncate_middle).
- Tests: cover command parsing, path resolution, session
persistence/cleanup, multi‑session
  isolation, timeouts, and truncation behavior.
											
										
										
											2025-09-10 17:38:11 -07:00
+								            UNIFIED_EXEC_OUTPUT_MAX_BYTES - 2
 								        );
-												chore: rework tools execution workflow (#5278)

Re-work the tool execution flow. Read `orchestrator.rs` to understand
the structure
											
										
										
											2025-10-20 20:57:37 +01:00
+								        assert_eq!(snapshot.get(2).unwrap(), &vec![b'c']);
 								        assert_eq!(snapshot.get(1).unwrap(), &vec![b'b']);
-												Unified execution (#3288)

## Unified PTY-Based Exec Tool

Note: this requires setting the following flag in the config:
`use_experimental_unified_exec_tool=true`

- Adds a PTY-backed interactive exec feature (“unified_exec”) with
session reuse via
  session_id, bounded output (128 KiB), and timeout clamping (≤ 60 s).
- Protocol: introduces ResponseItem::UnifiedExec { session_id,
arguments, timeout_ms }.
- Tools: exposes unified_exec as a function tool (Responses API);
excluded from Chat
  Completions payload while still supported in tool lists.
- Path handling: resolves commands via PATH (or explicit paths), with
UTF‑8/newline‑aware
  truncation (truncate_middle).
- Tests: cover command parsing, path resolution, session
persistence/cleanup, multi‑session
  isolation, timeouts, and truncation behavior.
											
										
										
											2025-09-10 17:38:11 -07:00
+								    }
 								    #[tokio::test(flavor = "multi_thread", worker_threads = 2)]
-												chore: rework tools execution workflow (#5278)

Re-work the tool execution flow. Read `orchestrator.rs` to understand
the structure
											
										
										
											2025-10-20 20:57:37 +01:00
+								    async fn unified_exec_persists_across_requests() -> anyhow::Result<()> {
-												make tests pass cleanly in sandbox (#4067)

This changes the reqwest client used in tests to be sandbox-friendly,
and skips a bunch of other tests that don't work inside the
sandbox/without network.
											
										
										
											2025-09-25 13:11:14 -07:00
+								        skip_if_sandbox!(Ok(()));
-												chore: rework tools execution workflow (#5278)

Re-work the tool execution flow. Read `orchestrator.rs` to understand
the structure
											
										
										
											2025-10-20 20:57:37 +01:00
+								        let (session, turn) = test_session_and_turn();
-												Unified execution (#3288)

## Unified PTY-Based Exec Tool

Note: this requires setting the following flag in the config:
`use_experimental_unified_exec_tool=true`

- Adds a PTY-backed interactive exec feature (“unified_exec”) with
session reuse via
  session_id, bounded output (128 KiB), and timeout clamping (≤ 60 s).
- Protocol: introduces ResponseItem::UnifiedExec { session_id,
arguments, timeout_ms }.
- Tools: exposes unified_exec as a function tool (Responses API);
excluded from Chat
  Completions payload while still supported in tool lists.
- Path handling: resolves commands via PATH (or explicit paths), with
UTF‑8/newline‑aware
  truncation (truncate_middle).
- Tests: cover command parsing, path resolution, session
persistence/cleanup, multi‑session
  isolation, timeouts, and truncation behavior.
											
										
										
											2025-09-10 17:38:11 -07:00
-												chore: align unified_exec (#5442)

Align `unified_exec` with b implementation
											
										
										
											2025-10-22 11:50:18 +01:00
+								        let open_shell = exec_command(&session, &turn, "bash -i", Some(2_500)).await?;
-												Unified execution (#3288)

## Unified PTY-Based Exec Tool

Note: this requires setting the following flag in the config:
`use_experimental_unified_exec_tool=true`

- Adds a PTY-backed interactive exec feature (“unified_exec”) with
session reuse via
  session_id, bounded output (128 KiB), and timeout clamping (≤ 60 s).
- Protocol: introduces ResponseItem::UnifiedExec { session_id,
arguments, timeout_ms }.
- Tools: exposes unified_exec as a function tool (Responses API);
excluded from Chat
  Completions payload while still supported in tool lists.
- Path handling: resolves commands via PATH (or explicit paths), with
UTF‑8/newline‑aware
  truncation (truncate_middle).
- Tests: cover command parsing, path resolution, session
persistence/cleanup, multi‑session
  isolation, timeouts, and truncation behavior.
											
										
										
											2025-09-10 17:38:11 -07:00
+								        let session_id = open_shell.session_id.expect("expected session_id");
-												chore: align unified_exec (#5442)

Align `unified_exec` with b implementation
											
										
										
											2025-10-22 11:50:18 +01:00
+								        write_stdin(
-												chore: rework tools execution workflow (#5278)

Re-work the tool execution flow. Read `orchestrator.rs` to understand
the structure
											
										
										
											2025-10-20 20:57:37 +01:00
+								            &session,
-												chore: align unified_exec (#5442)

Align `unified_exec` with b implementation
											
										
										
											2025-10-22 11:50:18 +01:00
+								            session_id,
 								            "export CODEX_INTERACTIVE_SHELL_VAR=codex\n",
-												chore: rework tools execution workflow (#5278)

Re-work the tool execution flow. Read `orchestrator.rs` to understand
the structure
											
										
										
											2025-10-20 20:57:37 +01:00
+								            Some(2_500),
 								        )
 								        .await?;
-												chore: align unified_exec (#5442)

Align `unified_exec` with b implementation
											
										
										
											2025-10-22 11:50:18 +01:00
+								        let out_2 = write_stdin(
-												chore: rework tools execution workflow (#5278)

Re-work the tool execution flow. Read `orchestrator.rs` to understand
the structure
											
										
										
											2025-10-20 20:57:37 +01:00
+								            &session,
-												chore: align unified_exec (#5442)

Align `unified_exec` with b implementation
											
										
										
											2025-10-22 11:50:18 +01:00
+								            session_id,
 								            "echo $CODEX_INTERACTIVE_SHELL_VAR\n",
-												chore: rework tools execution workflow (#5278)

Re-work the tool execution flow. Read `orchestrator.rs` to understand
the structure
											
										
										
											2025-10-20 20:57:37 +01:00
+								            Some(2_500),
 								        )
 								        .await?;
-												chore: align unified_exec (#5442)

Align `unified_exec` with b implementation
											
										
										
											2025-10-22 11:50:18 +01:00
+								        assert!(
 								            out_2.output.contains("codex"),
 								            "expected environment variable output"
 								        );
-												Unified execution (#3288)

## Unified PTY-Based Exec Tool

Note: this requires setting the following flag in the config:
`use_experimental_unified_exec_tool=true`

- Adds a PTY-backed interactive exec feature (“unified_exec”) with
session reuse via
  session_id, bounded output (128 KiB), and timeout clamping (≤ 60 s).
- Protocol: introduces ResponseItem::UnifiedExec { session_id,
arguments, timeout_ms }.
- Tools: exposes unified_exec as a function tool (Responses API);
excluded from Chat
  Completions payload while still supported in tool lists.
- Path handling: resolves commands via PATH (or explicit paths), with
UTF‑8/newline‑aware
  truncation (truncate_middle).
- Tests: cover command parsing, path resolution, session
persistence/cleanup, multi‑session
  isolation, timeouts, and truncation behavior.
											
										
										
											2025-09-10 17:38:11 -07:00
 								        Ok(())
 								    }
 								    #[tokio::test(flavor = "multi_thread", worker_threads = 2)]
-												chore: rework tools execution workflow (#5278)

Re-work the tool execution flow. Read `orchestrator.rs` to understand
the structure
											
										
										
											2025-10-20 20:57:37 +01:00
+								    async fn multi_unified_exec_sessions() -> anyhow::Result<()> {
-												make tests pass cleanly in sandbox (#4067)

This changes the reqwest client used in tests to be sandbox-friendly,
and skips a bunch of other tests that don't work inside the
sandbox/without network.
											
										
										
											2025-09-25 13:11:14 -07:00
+								        skip_if_sandbox!(Ok(()));
-												chore: rework tools execution workflow (#5278)

Re-work the tool execution flow. Read `orchestrator.rs` to understand
the structure
											
										
										
											2025-10-20 20:57:37 +01:00
+								        let (session, turn) = test_session_and_turn();
-												Unified execution (#3288)

## Unified PTY-Based Exec Tool

Note: this requires to have this flag in the config:
`use_experimental_unified_exec_tool=true`

- Adds a PTY-backed interactive exec feature (“unified_exec”) with
session reuse via
  session_id, bounded output (128 KiB), and timeout clamping (≤ 60 s).
- Protocol: introduces ResponseItem::UnifiedExec { session_id,
arguments, timeout_ms }.
- Tools: exposes unified_exec as a function tool (Responses API);
excluded from Chat
  Completions payload while still supported in tool lists.
- Path handling: resolves commands via PATH (or explicit paths), with
UTF‑8/newline‑aware
  truncation (truncate_middle).
- Tests: cover command parsing, path resolution, session
persistence/cleanup, multi‑session
  isolation, timeouts, and truncation behavior.
											
										
										
											2025-09-10 17:38:11 -07:00
-												chore: align unified_exec (#5442)

Align `unified_exec` with b implementation
											
										
										
											2025-10-22 11:50:18 +01:00
+								        let shell_a = exec_command(&session, &turn, "bash -i", Some(2_500)).await?;
-												Unified execution (#3288)

## Unified PTY-Based Exec Tool

Note: this requires to have this flag in the config:
`use_experimental_unified_exec_tool=true`

- Adds a PTY-backed interactive exec feature (“unified_exec”) with
session reuse via
  session_id, bounded output (128 KiB), and timeout clamping (≤ 60 s).
- Protocol: introduces ResponseItem::UnifiedExec { session_id,
arguments, timeout_ms }.
- Tools: exposes unified_exec as a function tool (Responses API);
excluded from Chat
  Completions payload while still supported in tool lists.
- Path handling: resolves commands via PATH (or explicit paths), with
UTF‑8/newline‑aware
  truncation (truncate_middle).
- Tests: cover command parsing, path resolution, session
persistence/cleanup, multi‑session
  isolation, timeouts, and truncation behavior.
											
										
										
											2025-09-10 17:38:11 -07:00
+								        let session_a = shell_a.session_id.expect("expected session id");
-												chore: align unified_exec (#5442)

Align `unified_exec` with b implementation
											
										
										
											2025-10-22 11:50:18 +01:00
+								        write_stdin(
-												chore: rework tools execution workflow (#5278)

Re-work the tool execution flow. Read `orchestrator.rs` to understand
the structure
											
										
										
											2025-10-20 20:57:37 +01:00
+								            &session,
-												chore: align unified_exec (#5442)

Align `unified_exec` with b implementation
											
										
										
											2025-10-22 11:50:18 +01:00
+								            session_a,
 								            "export CODEX_INTERACTIVE_SHELL_VAR=codex\n",
-												chore: rework tools execution workflow (#5278)

Re-work the tool execution flow. Read `orchestrator.rs` to understand
the structure
											
										
										
											2025-10-20 20:57:37 +01:00
+								            Some(2_500),
 								        )
 								        .await?;
-												chore: align unified_exec (#5442)

Align `unified_exec` with b implementation
											
										
										
											2025-10-22 11:50:18 +01:00
+								        let out_2 = exec_command(
-												chore: rework tools execution workflow (#5278)

Re-work the tool execution flow. Read `orchestrator.rs` to understand
the structure
											
										
										
											2025-10-20 20:57:37 +01:00
+								            &session,
 								            &turn,
-												chore: align unified_exec (#5442)

Align `unified_exec` with b implementation
											
										
										
											2025-10-22 11:50:18 +01:00
+								            "echo $CODEX_INTERACTIVE_SHELL_VAR",
-												chore: rework tools execution workflow (#5278)

Re-work the tool execution flow. Read `orchestrator.rs` to understand
the structure
											
										
										
											2025-10-20 20:57:37 +01:00
+								            Some(2_500),
 								        )
 								        .await?;
-												chore: align unified_exec (#5442)

Align `unified_exec` with b implementation
											
										
										
											2025-10-22 11:50:18 +01:00
+								        assert!(
 								            out_2.session_id.is_none(),
 								            "short command should not retain a session"
 								        );
 								        assert!(
 								            !out_2.output.contains("codex"),
 								            "short command should run in a fresh shell"
 								        );
-												Unified execution (#3288)

## Unified PTY-Based Exec Tool

Note: this requires to have this flag in the config:
`use_experimental_unified_exec_tool=true`

- Adds a PTY-backed interactive exec feature (“unified_exec”) with
session reuse via
  session_id, bounded output (128 KiB), and timeout clamping (≤ 60 s).
- Protocol: introduces ResponseItem::UnifiedExec { session_id,
arguments, timeout_ms }.
- Tools: exposes unified_exec as a function tool (Responses API);
excluded from Chat
  Completions payload while still supported in tool lists.
- Path handling: resolves commands via PATH (or explicit paths), with
UTF‑8/newline‑aware
  truncation (truncate_middle).
- Tests: cover command parsing, path resolution, session
persistence/cleanup, multi‑session
  isolation, timeouts, and truncation behavior.
											
										
										
											2025-09-10 17:38:11 -07:00
-												chore: align unified_exec (#5442)

Align `unified_exec` with b implementation
											
										
										
											2025-10-22 11:50:18 +01:00
+								        let out_3 = write_stdin(
-												chore: rework tools execution workflow (#5278)

Re-work the tool execution flow. Read `orchestrator.rs` to understand
the structure
											
										
										
											2025-10-20 20:57:37 +01:00
+								            &session,
-												chore: align unified_exec (#5442)

Align `unified_exec` with b implementation
											
										
										
											2025-10-22 11:50:18 +01:00
+								            session_a,
 								            "echo $CODEX_INTERACTIVE_SHELL_VAR\n",
-												chore: rework tools execution workflow (#5278)

Re-work the tool execution flow. Read `orchestrator.rs` to understand
the structure
											
										
										
											2025-10-20 20:57:37 +01:00
+								            Some(2_500),
 								        )
 								        .await?;
-												chore: align unified_exec (#5442)

Align `unified_exec` with b implementation
											
										
										
											2025-10-22 11:50:18 +01:00
+								        assert!(
 								            out_3.output.contains("codex"),
 								            "session should preserve state"
 								        );
-												Unified execution (#3288)

## Unified PTY-Based Exec Tool

Note: this requires setting the following flag in the config:
`use_experimental_unified_exec_tool=true`

- Adds a PTY-backed interactive exec feature (“unified_exec”) with
session reuse via
  session_id, bounded output (128 KiB), and timeout clamping (≤ 60 s).
- Protocol: introduces ResponseItem::UnifiedExec { session_id,
arguments, timeout_ms }.
- Tools: exposes unified_exec as a function tool (Responses API);
excluded from Chat
  Completions payload while still supported in tool lists.
- Path handling: resolves commands via PATH (or explicit paths), with
UTF‑8/newline‑aware
  truncation (truncate_middle).
- Tests: cover command parsing, path resolution, session
persistence/cleanup, multi‑session
  isolation, timeouts, and truncation behavior.
											
										
										
											2025-09-10 17:38:11 -07:00
 								        Ok(())
 								    }
 								    #[tokio::test]
-												chore: rework tools execution workflow (#5278)

Re-work the tool execution flow. Read `orchestrator.rs` to understand
the structure
											
										
										
											2025-10-20 20:57:37 +01:00
+								    async fn unified_exec_timeouts() -> anyhow::Result<()> {
-												make tests pass cleanly in sandbox (#4067)

This changes the reqwest client used in tests to be sandbox-friendly,
and skips a bunch of other tests that don't work inside the
sandbox/without network.
											
										
										
											2025-09-25 13:11:14 -07:00
+								        skip_if_sandbox!(Ok(()));
-												chore: rework tools execution workflow (#5278)

Re-work the tool execution flow. Read `orchestrator.rs` to understand
the structure
											
										
										
											2025-10-20 20:57:37 +01:00
+								        let (session, turn) = test_session_and_turn();
-												Unified execution (#3288)

## Unified PTY-Based Exec Tool

Note: this requires to have this flag in the config:
`use_experimental_unified_exec_tool=true`

- Adds a PTY-backed interactive exec feature (“unified_exec”) with
session reuse via
  session_id, bounded output (128 KiB), and timeout clamping (≤ 60 s).
- Protocol: introduces ResponseItem::UnifiedExec { session_id,
arguments, timeout_ms }.
- Tools: exposes unified_exec as a function tool (Responses API);
excluded from Chat
  Completions payload while still supported in tool lists.
- Path handling: resolves commands via PATH (or explicit paths), with
UTF‑8/newline‑aware
  truncation (truncate_middle).
- Tests: cover command parsing, path resolution, session
persistence/cleanup, multi‑session
  isolation, timeouts, and truncation behavior.
											
										
										
											2025-09-10 17:38:11 -07:00
-												chore: align unified_exec (#5442)

Align `unified_exec` with b implementation
											
										
										
											2025-10-22 11:50:18 +01:00
+								        let open_shell = exec_command(&session, &turn, "bash -i", Some(2_500)).await?;
-												Unified execution (#3288)

## Unified PTY-Based Exec Tool

Note: this requires to have this flag in the config:
`use_experimental_unified_exec_tool=true`

- Adds a PTY-backed interactive exec feature (“unified_exec”) with
session reuse via
  session_id, bounded output (128 KiB), and timeout clamping (≤ 60 s).
- Protocol: introduces ResponseItem::UnifiedExec { session_id,
arguments, timeout_ms }.
- Tools: exposes unified_exec as a function tool (Responses API);
excluded from Chat
  Completions payload while still supported in tool lists.
- Path handling: resolves commands via PATH (or explicit paths), with
UTF‑8/newline‑aware
  truncation (truncate_middle).
- Tests: cover command parsing, path resolution, session
persistence/cleanup, multi‑session
  isolation, timeouts, and truncation behavior.
											
										
										
											2025-09-10 17:38:11 -07:00
+								        let session_id = open_shell.session_id.expect("expected session id");
-												chore: align unified_exec (#5442)

Align `unified_exec` with b implementation
											
										
										
											2025-10-22 11:50:18 +01:00
+								        write_stdin(
-												chore: rework tools execution workflow (#5278)

Re-work the tool execution flow. Read `orchestrator.rs` to understand
the structure
											
										
										
											2025-10-20 20:57:37 +01:00
+								            &session,
-												chore: align unified_exec (#5442)

Align `unified_exec` with b implementation
											
										
										
											2025-10-22 11:50:18 +01:00
+								            session_id,
 								            "export CODEX_INTERACTIVE_SHELL_VAR=codex\n",
-												chore: rework tools execution workflow (#5278)

Re-work the tool execution flow. Read `orchestrator.rs` to understand
the structure
											
										
										
											2025-10-20 20:57:37 +01:00
+								            Some(2_500),
 								        )
 								        .await?;
-												chore: align unified_exec (#5442)

Align `unified_exec` with b implementation
											
										
										
											2025-10-22 11:50:18 +01:00
+								        let out_2 = write_stdin(
-												chore: rework tools execution workflow (#5278)

Re-work the tool execution flow. Read `orchestrator.rs` to understand
the structure
											
										
										
											2025-10-20 20:57:37 +01:00
+								            &session,
-												chore: align unified_exec (#5442)

Align `unified_exec` with b implementation
											
										
										
											2025-10-22 11:50:18 +01:00
+								            session_id,
 								            "sleep 5 && echo $CODEX_INTERACTIVE_SHELL_VAR\n",
-												chore: rework tools execution workflow (#5278)

Re-work the tool execution flow. Read `orchestrator.rs` to understand
the structure
											
										
										
											2025-10-20 20:57:37 +01:00
+								            Some(10),
 								        )
 								        .await?;
-												chore: align unified_exec (#5442)

Align `unified_exec` with b implementation
											
										
										
											2025-10-22 11:50:18 +01:00
+								        assert!(
 								            !out_2.output.contains("codex"),
 								            "timeout too short should yield incomplete output"
 								        );
-												Unified execution (#3288)

## Unified PTY-Based Exec Tool

Note: this requires to have this flag in the config:
`use_experimental_unified_exec_tool=true`

- Adds a PTY-backed interactive exec feature (“unified_exec”) with
session reuse via
  session_id, bounded output (128 KiB), and timeout clamping (≤ 60 s).
- Protocol: introduces ResponseItem::UnifiedExec { session_id,
arguments, timeout_ms }.
- Tools: exposes unified_exec as a function tool (Responses API);
excluded from Chat
  Completions payload while still supported in tool lists.
- Path handling: resolves commands via PATH (or explicit paths), with
UTF‑8/newline‑aware
  truncation (truncate_middle).
- Tests: cover command parsing, path resolution, session
persistence/cleanup, multi‑session
  isolation, timeouts, and truncation behavior.
											
										
										
											2025-09-10 17:38:11 -07:00
 								        tokio::time::sleep(Duration::from_secs(7)).await;
-												chore: align unified_exec (#5442)

Align `unified_exec` with b implementation
											
										
										
											2025-10-22 11:50:18 +01:00
+								        let out_3 = write_stdin(&session, session_id, "", Some(100)).await?;
-												Unified execution (#3288)

## Unified PTY-Based Exec Tool

Note: this requires to have this flag in the config:
`use_experimental_unified_exec_tool=true`

- Adds a PTY-backed interactive exec feature (“unified_exec”) with
session reuse via
  session_id, bounded output (128 KiB), and timeout clamping (≤ 60 s).
- Protocol: introduces ResponseItem::UnifiedExec { session_id,
arguments, timeout_ms }.
- Tools: exposes unified_exec as a function tool (Responses API);
excluded from Chat
  Completions payload while still supported in tool lists.
- Path handling: resolves commands via PATH (or explicit paths), with
UTF‑8/newline‑aware
  truncation (truncate_middle).
- Tests: cover command parsing, path resolution, session
persistence/cleanup, multi‑session
  isolation, timeouts, and truncation behavior.
											
										
										
											2025-09-10 17:38:11 -07:00
-												chore: align unified_exec (#5442)

Align `unified_exec` with b implementation
											
										
										
											2025-10-22 11:50:18 +01:00
+								        assert!(
 								            out_3.output.contains("codex"),
 								            "subsequent poll should retrieve output"
 								        );
-												Unified execution (#3288)

## Unified PTY-Based Exec Tool

Note: this requires to have this flag in the config:
`use_experimental_unified_exec_tool=true`

- Adds a PTY-backed interactive exec feature (“unified_exec”) with
session reuse via
  session_id, bounded output (128 KiB), and timeout clamping (≤ 60 s).
- Protocol: introduces ResponseItem::UnifiedExec { session_id,
arguments, timeout_ms }.
- Tools: exposes unified_exec as a function tool (Responses API);
excluded from Chat
  Completions payload while still supported in tool lists.
- Path handling: resolves commands via PATH (or explicit paths), with
UTF‑8/newline‑aware
  truncation (truncate_middle).
- Tests: cover command parsing, path resolution, session
persistence/cleanup, multi‑session
  isolation, timeouts, and truncation behavior.
											
										
										
											2025-09-10 17:38:11 -07:00
 								        Ok(())
 								    }
 								    #[tokio::test]
-												bug: Ignore tests for now (#3777)

Ignore flaky / long tests for now
											
										
										
											2025-09-18 10:43:45 +01:00
+								    #[ignore] // Ignored while we have a better way to test this.
-												chore: rework tools execution workflow (#5278)

Re-work the tool execution flow. Read `orchestrator.rs` to understand
the structure
											
										
										
											2025-10-20 20:57:37 +01:00
+								    async fn requests_with_large_timeout_are_capped() -> anyhow::Result<()> {
 								        let (session, turn) = test_session_and_turn();
-												chore: align unified_exec (#5442)

Align `unified_exec` with b implementation
											
										
										
											2025-10-22 11:50:18 +01:00
+								        let result = exec_command(&session, &turn, "echo codex", Some(120_000)).await?;
-												Unified execution (#3288)

## Unified PTY-Based Exec Tool

Note: this requires to have this flag in the config:
`use_experimental_unified_exec_tool=true`

- Adds a PTY-backed interactive exec feature (“unified_exec”) with
session reuse via
  session_id, bounded output (128 KiB), and timeout clamping (≤ 60 s).
- Protocol: introduces ResponseItem::UnifiedExec { session_id,
arguments, timeout_ms }.
- Tools: exposes unified_exec as a function tool (Responses API);
excluded from Chat
  Completions payload while still supported in tool lists.
- Path handling: resolves commands via PATH (or explicit paths), with
UTF‑8/newline‑aware
  truncation (truncate_middle).
- Tests: cover command parsing, path resolution, session
persistence/cleanup, multi‑session
  isolation, timeouts, and truncation behavior.
											
										
										
											2025-09-10 17:38:11 -07:00
-												chore: align unified_exec (#5442)

Align `unified_exec` with b implementation
											
										
										
											2025-10-22 11:50:18 +01:00
+								        assert!(result.session_id.is_none());
-												Unified execution (#3288)

## Unified PTY-Based Exec Tool

Note: this requires to have this flag in the config:
`use_experimental_unified_exec_tool=true`

- Adds a PTY-backed interactive exec feature (“unified_exec”) with
session reuse via
  session_id, bounded output (128 KiB), and timeout clamping (≤ 60 s).
- Protocol: introduces ResponseItem::UnifiedExec { session_id,
arguments, timeout_ms }.
- Tools: exposes unified_exec as a function tool (Responses API);
excluded from Chat
  Completions payload while still supported in tool lists.
- Path handling: resolves commands via PATH (or explicit paths), with
UTF‑8/newline‑aware
  truncation (truncate_middle).
- Tests: cover command parsing, path resolution, session
persistence/cleanup, multi‑session
  isolation, timeouts, and truncation behavior.
											
										
										
											2025-09-10 17:38:11 -07:00
+								        assert!(result.output.contains("codex"));
 								        Ok(())
 								    }
 								    #[tokio::test]
-												bug: Ignore tests for now (#3777)

Ignore flaky / long tests for now
											
										
										
											2025-09-18 10:43:45 +01:00
+								    #[ignore] // Ignored while we have a better way to test this.
-												chore: rework tools execution workflow (#5278)

Re-work the tool execution flow. Read `orchestrator.rs` to understand
the structure
											
										
										
											2025-10-20 20:57:37 +01:00
+								    async fn completed_commands_do_not_persist_sessions() -> anyhow::Result<()> {
 								        let (session, turn) = test_session_and_turn();
-												chore: align unified_exec (#5442)

Align `unified_exec` with b implementation
											
										
										
											2025-10-22 11:50:18 +01:00
+								        let result = exec_command(&session, &turn, "echo codex", Some(2_500)).await?;
-												Unified execution (#3288)

## Unified PTY-Based Exec Tool

Note: this requires to have this flag in the config:
`use_experimental_unified_exec_tool=true`

- Adds a PTY-backed interactive exec feature (“unified_exec”) with
session reuse via
  session_id, bounded output (128 KiB), and timeout clamping (≤ 60 s).
- Protocol: introduces ResponseItem::UnifiedExec { session_id,
arguments, timeout_ms }.
- Tools: exposes unified_exec as a function tool (Responses API);
excluded from Chat
  Completions payload while still supported in tool lists.
- Path handling: resolves commands via PATH (or explicit paths), with
UTF‑8/newline‑aware
  truncation (truncate_middle).
- Tests: cover command parsing, path resolution, session
persistence/cleanup, multi‑session
  isolation, timeouts, and truncation behavior.
											
										
										
											2025-09-10 17:38:11 -07:00
-												chore: align unified_exec (#5442)

Align `unified_exec` with b implementation
											
										
										
											2025-10-22 11:50:18 +01:00
+								        assert!(
 								            result.session_id.is_none(),
 								            "completed command should not retain session"
 								        );
-												Unified execution (#3288)

## Unified PTY-Based Exec Tool

Note: this requires to have this flag in the config:
`use_experimental_unified_exec_tool=true`

- Adds a PTY-backed interactive exec feature (“unified_exec”) with
session reuse via
  session_id, bounded output (128 KiB), and timeout clamping (≤ 60 s).
- Protocol: introduces ResponseItem::UnifiedExec { session_id,
arguments, timeout_ms }.
- Tools: exposes unified_exec as a function tool (Responses API);
excluded from Chat
  Completions payload while still supported in tool lists.
- Path handling: resolves commands via PATH (or explicit paths), with
UTF‑8/newline‑aware
  truncation (truncate_middle).
- Tests: cover command parsing, path resolution, session
persistence/cleanup, multi‑session
  isolation, timeouts, and truncation behavior.
											
										
										
											2025-09-10 17:38:11 -07:00
+								        assert!(result.output.contains("codex"));
-												chore: rework tools execution workflow (#5278)

Re-work the tool execution flow. Read `orchestrator.rs` to understand
the structure
											
										
										
											2025-10-20 20:57:37 +01:00
+								        assert!(
 								            session
 								                .services
 								                .unified_exec_manager
 								                .sessions
 								                .lock()
 								                .await
 								                .is_empty()
 								        );
-												Unified execution (#3288)

## Unified PTY-Based Exec Tool

Note: this requires to have this flag in the config:
`use_experimental_unified_exec_tool=true`

- Adds a PTY-backed interactive exec feature (“unified_exec”) with
session reuse via
  session_id, bounded output (128 KiB), and timeout clamping (≤ 60 s).
- Protocol: introduces ResponseItem::UnifiedExec { session_id,
arguments, timeout_ms }.
- Tools: exposes unified_exec as a function tool (Responses API);
excluded from Chat
  Completions payload while still supported in tool lists.
- Path handling: resolves commands via PATH (or explicit paths), with
UTF‑8/newline‑aware
  truncation (truncate_middle).
- Tests: cover command parsing, path resolution, session
persistence/cleanup, multi‑session
  isolation, timeouts, and truncation behavior.
											
										
										
											2025-09-10 17:38:11 -07:00
 								        Ok(())
 								    }
 								    #[tokio::test(flavor = "multi_thread", worker_threads = 2)]
-												chore: rework tools execution workflow (#5278)

Re-work the tool execution flow. Read `orchestrator.rs` to understand
the structure
											
										
										
											2025-10-20 20:57:37 +01:00
+								    async fn reusing_completed_session_returns_unknown_session() -> anyhow::Result<()> {
-												make tests pass cleanly in sandbox (#4067)

This changes the reqwest client used in tests to be sandbox-friendly,
and skips a bunch of other tests that don't work inside the
sandbox/without network.
											
										
										
											2025-09-25 13:11:14 -07:00
+								        skip_if_sandbox!(Ok(()));
-												chore: rework tools execution workflow (#5278)

Re-work the tool execution flow. Read `orchestrator.rs` to understand
the structure
											
										
										
											2025-10-20 20:57:37 +01:00
+								        let (session, turn) = test_session_and_turn();
-												Unified execution (#3288)

## Unified PTY-Based Exec Tool

Note: this requires to have this flag in the config:
`use_experimental_unified_exec_tool=true`

- Adds a PTY-backed interactive exec feature (“unified_exec”) with
session reuse via
  session_id, bounded output (128 KiB), and timeout clamping (≤ 60 s).
- Protocol: introduces ResponseItem::UnifiedExec { session_id,
arguments, timeout_ms }.
- Tools: exposes unified_exec as a function tool (Responses API);
excluded from Chat
  Completions payload while still supported in tool lists.
- Path handling: resolves commands via PATH (or explicit paths), with
UTF‑8/newline‑aware
  truncation (truncate_middle).
- Tests: cover command parsing, path resolution, session
persistence/cleanup, multi‑session
  isolation, timeouts, and truncation behavior.
											
										
										
											2025-09-10 17:38:11 -07:00
-												chore: align unified_exec (#5442)

Align `unified_exec` with b implementation
											
										
										
											2025-10-22 11:50:18 +01:00
+								        let open_shell = exec_command(&session, &turn, "bash -i", Some(2_500)).await?;
-												Unified execution (#3288)

## Unified PTY-Based Exec Tool

Note: this requires to have this flag in the config:
`use_experimental_unified_exec_tool=true`

- Adds a PTY-backed interactive exec feature (“unified_exec”) with
session reuse via
  session_id, bounded output (128 KiB), and timeout clamping (≤ 60 s).
- Protocol: introduces ResponseItem::UnifiedExec { session_id,
arguments, timeout_ms }.
- Tools: exposes unified_exec as a function tool (Responses API);
excluded from Chat
  Completions payload while still supported in tool lists.
- Path handling: resolves commands via PATH (or explicit paths), with
UTF‑8/newline‑aware
  truncation (truncate_middle).
- Tests: cover command parsing, path resolution, session
persistence/cleanup, multi‑session
  isolation, timeouts, and truncation behavior.
											
										
										
											2025-09-10 17:38:11 -07:00
+								        let session_id = open_shell.session_id.expect("expected session id");
-												chore: align unified_exec (#5442)

Align `unified_exec` with b implementation
											
										
										
											2025-10-22 11:50:18 +01:00
+								        write_stdin(&session, session_id, "exit\n", Some(2_500)).await?;
-												Unified execution (#3288)

## Unified PTY-Based Exec Tool

Note: this requires to have this flag in the config:
`use_experimental_unified_exec_tool=true`

- Adds a PTY-backed interactive exec feature (“unified_exec”) with
session reuse via
  session_id, bounded output (128 KiB), and timeout clamping (≤ 60 s).
- Protocol: introduces ResponseItem::UnifiedExec { session_id,
arguments, timeout_ms }.
- Tools: exposes unified_exec as a function tool (Responses API);
excluded from Chat
  Completions payload while still supported in tool lists.
- Path handling: resolves commands via PATH (or explicit paths), with
UTF‑8/newline‑aware
  truncation (truncate_middle).
- Tests: cover command parsing, path resolution, session
persistence/cleanup, multi‑session
  isolation, timeouts, and truncation behavior.
											
										
										
											2025-09-10 17:38:11 -07:00
 								        tokio::time::sleep(Duration::from_millis(200)).await;
-												chore: align unified_exec (#5442)

Align `unified_exec` with b implementation
											
										
										
											2025-10-22 11:50:18 +01:00
+								        let err = write_stdin(&session, session_id, "", Some(100))
 								            .await
 								            .expect_err("expected unknown session error");
-												Unified execution (#3288)

## Unified PTY-Based Exec Tool

Note: this requires to have this flag in the config:
`use_experimental_unified_exec_tool=true`

- Adds a PTY-backed interactive exec feature (“unified_exec”) with
session reuse via
  session_id, bounded output (128 KiB), and timeout clamping (≤ 60 s).
- Protocol: introduces ResponseItem::UnifiedExec { session_id,
arguments, timeout_ms }.
- Tools: exposes unified_exec as a function tool (Responses API);
excluded from Chat
  Completions payload while still supported in tool lists.
- Path handling: resolves commands via PATH (or explicit paths), with
UTF‑8/newline‑aware
  truncation (truncate_middle).
- Tests: cover command parsing, path resolution, session
persistence/cleanup, multi‑session
  isolation, timeouts, and truncation behavior.
											
										
										
											2025-09-10 17:38:11 -07:00
 								        match err {
 								            UnifiedExecError::UnknownSessionId { session_id: err_id } => {
 								                assert_eq!(err_id, session_id);
 								            }
 								            other => panic!("expected UnknownSessionId, got {other:?}"),
 								        }
-												chore: rework tools execution workflow (#5278)

Re-work the tool execution flow. Read `orchestrator.rs` to understand
the structure
											
										
										
											2025-10-20 20:57:37 +01:00
+								        assert!(
 								            !session
 								                .services
 								                .unified_exec_manager
 								                .sessions
 								                .lock()
 								                .await
 								                .contains_key(&session_id)
 								        );
-												Unified execution (#3288)

## Unified PTY-Based Exec Tool

Note: this requires to have this flag in the config:
`use_experimental_unified_exec_tool=true`

- Adds a PTY-backed interactive exec feature (“unified_exec”) with
session reuse via
  session_id, bounded output (128 KiB), and timeout clamping (≤ 60 s).
- Protocol: introduces ResponseItem::UnifiedExec { session_id,
arguments, timeout_ms }.
- Tools: exposes unified_exec as a function tool (Responses API);
excluded from Chat
  Completions payload while still supported in tool lists.
- Path handling: resolves commands via PATH (or explicit paths), with
UTF‑8/newline‑aware
  truncation (truncate_middle).
- Tests: cover command parsing, path resolution, session
persistence/cleanup, multi‑session
  isolation, timeouts, and truncation behavior.
											
										
										
											2025-09-10 17:38:11 -07:00
 								        Ok(())
 								    }
 								}