[3/3] Merge sequential exec commands (#2110)

This PR merges and dedupes sequential exec cells so they stack neatly on sequential lines rather than separate blocks. This is particularly useful because the model will often sed 200 lines of a file multiple times in a row and this nicely collapses them. https://github.com/user-attachments/assets/04cccda5-e2ba-4a97-a613-4547587aa15c Part 1: https://github.com/openai/codex/pull/2095 Part 2: https://github.com/openai/codex/pull/2097
2025-08-11 12:40:12 -07:00
parent 85e4f564a3
commit 4368f075d0
2 changed files with 315 additions and 33 deletions
--- a/codex-rs/tui/src/chatwidget.rs
+++ b/codex-rs/tui/src/chatwidget.rs
@@ -47,6 +47,7 @@ use crate::bottom_pane::BottomPaneParams;
 use crate::bottom_pane::CancellationEvent;
 use crate::bottom_pane::InputResult;
 use crate::history_cell::CommandOutput;
 use crate::history_cell::ExecCell;
 use crate::history_cell::HistoryCell;
 use crate::history_cell::PatchEventType;
 use crate::live_wrap::RowBuilder;
@@ -467,8 +468,6 @@ impl ChatWidget<'_> {
                cwd,
                parsed_cmd,
            }) => {
                // TODO: merge this into the active exec call.
                self.flush_active_exec_cell();
                self.finalize_active_stream();
                // Ensure the status indicator is visible while the command runs.
                self.bottom_pane
@@ -481,8 +480,19 @@ impl ChatWidget<'_> {
                        parsed_cmd: parsed_cmd.clone(),
                    },
                );
-                self.active_exec_cell =
+                let active_exec_cell = self.active_exec_cell.take();
-                    Some(HistoryCell::new_active_exec_command(command, parsed_cmd));
+                let merge_result = merge_cells(&command, &parsed_cmd, &active_exec_cell);
                self.active_exec_cell = match merge_result {
                    MergeResult::Merge(cell) => Some(cell),
                    MergeResult::Drop => active_exec_cell,
                    MergeResult::NewCell(cell) => {
                        if let Some(active) = active_exec_cell {
                            self.app_event_tx
                                .send(AppEvent::InsertHistory(active.plain_lines()));
                        }
                        Some(cell)
                    }
                }
            }
            EventMsg::ExecCommandEnd(ExecCommandEndEvent {
                call_id,
@@ -493,11 +503,15 @@ impl ChatWidget<'_> {
            }) => {
                // Compute summary before moving stdout into the history cell.
                let cmd = self.running_commands.remove(&call_id);
                let parsed_cmd = match &cmd {
                    Some(RunningCommand { parsed_cmd, .. }) => parsed_cmd.clone(),
                    _ => vec![],
                };
                if let Some(cmd) = cmd {
                    // Preserve any merged parsed commands already present on the
                    // active cell; otherwise, fall back to this command's parsed.
                    let parsed_cmd = match &self.active_exec_cell {
                        Some(HistoryCell::Exec(ExecCell { parsed, .. })) if !parsed.is_empty() => {
                            parsed.clone()
                        }
                        _ => cmd.parsed_cmd.clone(),
                    };
                    // Replace the active running cell with the finalized result,
                    // but keep it as the active cell so it can be merged with
                    // subsequent commands before being committed.
@@ -826,3 +840,240 @@ fn add_token_usage(current_usage: &TokenUsage, new_usage: &TokenUsage) -> TokenU
        total_tokens: current_usage.total_tokens + new_usage.total_tokens,
    }
 }
 enum MergeResult {
    Merge(HistoryCell),
    Drop,
    NewCell(HistoryCell),
 }
 // Determine whether to and how to merge two consecutive exec cells.
 fn merge_cells(
    new_command: &[String],
    new_parsed: &[ParsedCommand],
    active_exec_cell: &Option<HistoryCell>,
 ) -> MergeResult {
    let ExecCell {
        command: _existing_command,
        parsed: existing_parsed,
        output: existing_output,
    } = match active_exec_cell {
        Some(HistoryCell::Exec(cell)) => cell,
        _ => {
            // There is no existing exec cell.
            return MergeResult::NewCell(HistoryCell::new_active_exec_command(
                new_command.to_vec(),
                new_parsed.to_vec(),
            ));
        }
    };
    let existing_last = existing_parsed.last();
    let new_last = new_parsed.last();
    // Drop the first command if it is a read and matches the last command.
    // This is a common pattern the model does and it simplifies the output to dedupe.
    let drop_first = if let (
        Some(ParsedCommand::Read {
            name: existing_name,
            ..
        }),
        Some(ParsedCommand::Read { name: new_name, .. }),
    ) = (existing_last, new_last)
    {
        existing_name == new_name
    } else {
        false
    };
    if drop_first && new_parsed.len() == 1 {
        // There is only one command and it was deduped.
        return MergeResult::Drop;
    }
    let existing_exit_code = existing_output.as_ref().map(|o| o.exit_code);
    if let Some(code) = existing_exit_code {
        if code != 0 {
            // If the previous command failed, don't merge so the user can see stderr.
            // Start a fresh cell for the new command instead of duplicating the old one.
            return MergeResult::NewCell(HistoryCell::new_active_exec_command(
                new_command.to_vec(),
                new_parsed.to_vec(),
            ));
        }
    }
    let mut merged_parsed = existing_parsed.to_vec();
    if drop_first {
        merged_parsed.extend(new_parsed[1..].to_vec());
    } else {
        merged_parsed.extend(new_parsed.to_vec());
    }
    MergeResult::Merge(HistoryCell::new_active_exec_command(
        new_command.to_vec(),
        merged_parsed,
    ))
 }
 #[cfg(test)]
 mod tests {
    use super::*;
    use crate::history_cell::CommandOutput;
    fn read_cmd(name: &str) -> ParsedCommand {
        ParsedCommand::Read {
            cmd: vec!["cat".to_string(), name.to_string()],
            name: name.to_string(),
        }
    }
    fn unknown_cmd(cmd: &str) -> ParsedCommand {
        ParsedCommand::Unknown {
            cmd: cmd.split_whitespace().map(|s| s.to_string()).collect(),
        }
    }
    #[test]
    fn when_no_active_exec_cell_creates_new_cell() {
        let new_command = vec!["echo".to_string(), "hi".to_string()];
        let new_parsed = vec![read_cmd("a")];
        let result = merge_cells(&new_command, &new_parsed, &None);
        match result {
            MergeResult::NewCell(cell) => match cell {
                HistoryCell::Exec(ExecCell {
                    command,
                    parsed,
                    output,
                }) => {
                    assert_eq!(command, new_command);
                    assert_eq!(parsed, new_parsed);
                    assert!(output.is_none());
                }
                _ => panic!("expected Exec cell"),
            },
            _ => panic!("expected NewCell"),
        }
    }
    #[test]
    fn drops_duplicate_trailing_read_when_new_has_only_one_read() {
        // existing last = Read("foo"), new last = Read("foo"), new_parsed.len() == 1
        let active = Some(HistoryCell::new_active_exec_command(
            vec!["bash".into(), "-lc".into(), "cat foo".into()],
            vec![read_cmd("foo")],
        ));
        let new_command = vec!["cat".into(), "foo".into()];
        let new_parsed = vec![read_cmd("foo")];
        let result = merge_cells(&new_command, &new_parsed, &active);
        match result {
            MergeResult::Drop => {}
            _ => panic!("expected Drop"),
        }
    }
    #[test]
    fn does_not_merge_when_previous_command_failed() {
        // existing exit_code != 0 forces starting a fresh cell
        let active = Some(HistoryCell::new_completed_exec_command(
            vec!["bash".into(), "-lc".into(), "cat bar".into()],
            vec![read_cmd("bar")],
            CommandOutput {
                exit_code: 1,
                stdout: String::new(),
                stderr: "err".into(),
            },
        ));
        // Ensure drop_first condition is false (different name)
        let new_command = vec!["cat".into(), "baz".into()];
        let new_parsed = vec![read_cmd("baz")];
        let result = merge_cells(&new_command, &new_parsed, &active);
        match result {
            MergeResult::NewCell(cell) => match cell {
                HistoryCell::Exec(ExecCell {
                    command, parsed, ..
                }) => {
                    assert_eq!(command, new_command);
                    assert_eq!(parsed, new_parsed);
                }
                _ => panic!("expected Exec cell"),
            },
            _ => panic!("expected NewCell"),
        }
    }
    #[test]
    fn merges_with_drop_first_true_when_new_len_gt_one() {
        // existing last Read("file.txt"), new starts with same Read then more
        let active = Some(HistoryCell::new_active_exec_command(
            vec!["cat".into(), "file.txt".into()],
            vec![read_cmd("file.txt")],
        ));
        let new_command = vec!["bash".into(), "-lc".into(), "sed -n 1,20p file.txt".into()];
        // Place the duplicate Read as the LAST element to satisfy drop_first condition
        let leading = unknown_cmd("tail -n 20");
        let new_parsed = vec![leading.clone(), read_cmd("file.txt")];
        let result = merge_cells(&new_command, &new_parsed, &active);
        match result {
            MergeResult::Merge(cell) => match cell {
                HistoryCell::Exec(ExecCell {
                    command, parsed, ..
                }) => {
                    assert_eq!(command, new_command);
                    // Expect existing parsed + new_parsed[1..]
                    assert_eq!(parsed.len(), 2);
                    match (&parsed[0], &parsed[1]) {
                        (
                            ParsedCommand::Read { name, .. },
                            ParsedCommand::Read { name: n2, .. },
                        ) => {
                            assert_eq!(name, "file.txt");
                            assert_eq!(n2, "file.txt");
                        }
                        _ => panic!("unexpected parsed commands"),
                    }
                }
                _ => panic!("expected Exec cell"),
            },
            _ => panic!("expected Merge"),
        }
    }
    #[test]
    fn merges_without_drop_first_when_last_commands_differ() {
        // existing last Read("file1.txt"), new last Read("file2.txt"); should concatenate
        let active = Some(HistoryCell::new_active_exec_command(
            vec!["cat".into(), "file1.txt".into()],
            vec![read_cmd("file1.txt")],
        ));
        let new_command = vec!["bash".into(), "-lc".into(), "cat file2.txt".into()];
        let t2 = read_cmd("file2.txt");
        let extra = unknown_cmd("echo done");
        let new_parsed = vec![t2.clone(), extra.clone()];
        let result = merge_cells(&new_command, &new_parsed, &active);
        match result {
            MergeResult::Merge(cell) => match cell {
                HistoryCell::Exec(ExecCell {
                    command, parsed, ..
                }) => {
                    assert_eq!(command, new_command);
                    assert_eq!(parsed.len(), 3);
                    match (&parsed[0], &parsed[1], &parsed[2]) {
                        (ParsedCommand::Read { name: n1, .. }, p2, p3) => {
                            assert_eq!(n1, "file1.txt");
                            assert_eq!(p2, &t2);
                            assert_eq!(p3, &extra);
                        }
                        _ => panic!("unexpected parsed commands"),
                    }
                }
                _ => panic!("expected Exec cell"),
            },
            _ => panic!("expected Merge"),
        }
    }
 }
--- a/codex-rs/tui/src/history_cell.rs
+++ b/codex-rs/tui/src/history_cell.rs
@@ -38,6 +38,7 @@ use std::path::PathBuf;
 use std::time::Duration;
 use tracing::error;
 #[derive(Clone)]
 pub(crate) struct CommandOutput {
    pub(crate) exit_code: i32,
    pub(crate) stdout: String,
@@ -64,27 +65,37 @@ fn line_to_static(line: &Line) -> Line<'static> {
    }
 }
 pub(crate) struct ExecCell {
    pub(crate) command: Vec<String>,
    pub(crate) parsed: Vec<ParsedCommand>,
    pub(crate) output: Option<CommandOutput>,
 }
 /// Represents an event to display in the conversation history. Returns its
 /// `Vec<Line<'static>>` representation to make it easier to display in a
 /// scrollable list.
 pub(crate) enum HistoryCell {
    /// Welcome message.
-    WelcomeMessage { view: TextBlock },
+    WelcomeMessage {
-
+        view: TextBlock,
    /// Message from the user.
    UserPrompt { view: TextBlock },
    Exec {
        command: Vec<String>,
        parsed: Vec<ParsedCommand>,
        output: Option<CommandOutput>,
    },
    /// Message from the user.
    UserPrompt {
        view: TextBlock,
    },
    Exec(ExecCell),
    /// An MCP tool call that has not finished yet.
-    ActiveMcpToolCall { view: TextBlock },
+    ActiveMcpToolCall {
        view: TextBlock,
    },
    /// Completed MCP tool call where we show the result serialized as JSON.
-    CompletedMcpToolCall { view: TextBlock },
+    CompletedMcpToolCall {
        view: TextBlock,
    },
    /// Completed MCP tool call where the result is an image.
    /// Admittedly, [mcp_types::CallToolResult] can have multiple content types,
@@ -94,37 +105,57 @@ pub(crate) enum HistoryCell {
    // resized version avoids doing the potentially expensive rescale twice
    // because the scroll-view first calls `height()` for layouting and then
    // `render_window()` for painting.
-    CompletedMcpToolCallWithImageOutput { _image: DynamicImage },
+    CompletedMcpToolCallWithImageOutput {
        _image: DynamicImage,
    },
    /// Background event.
-    BackgroundEvent { view: TextBlock },
+    BackgroundEvent {
        view: TextBlock,
    },
    /// Output from the `/diff` command.
-    GitDiffOutput { view: TextBlock },
+    GitDiffOutput {
        view: TextBlock,
    },
    /// Output from the `/status` command.
-    StatusOutput { view: TextBlock },
+    StatusOutput {
        view: TextBlock,
    },
    /// Output from the `/prompts` command.
-    PromptsOutput { view: TextBlock },
+    PromptsOutput {
        view: TextBlock,
    },
    /// Error event from the backend.
-    ErrorEvent { view: TextBlock },
+    ErrorEvent {
        view: TextBlock,
    },
    /// Info describing the newly-initialized session.
-    SessionInfo { view: TextBlock },
+    SessionInfo {
        view: TextBlock,
    },
    /// A pending code patch that is awaiting user approval. Mirrors the
    /// behaviour of `ExecCell` so the user sees *what* patch the
    /// model wants to apply before being prompted to approve or deny it.
-    PendingPatch { view: TextBlock },
+    PendingPatch {
        view: TextBlock,
    },
    /// A human‑friendly rendering of the model's current plan and step
    /// statuses provided via the `update_plan` tool.
-    PlanUpdate { view: TextBlock },
+    PlanUpdate {
        view: TextBlock,
    },
    /// Result of applying a patch (success or failure) with optional output.
-    PatchApplyResult { view: TextBlock },
+    PatchApplyResult {
        view: TextBlock,
    },
 }
 const TOOL_CALL_MAX_LINES: usize = 5;
@@ -172,11 +203,11 @@ impl HistoryCell {
            | HistoryCell::ActiveMcpToolCall { view, .. } => {
                view.lines.iter().map(line_to_static).collect()
            }
-            HistoryCell::Exec {
+            HistoryCell::Exec(ExecCell {
                command,
                parsed,
                output,
-            } => HistoryCell::exec_command_lines(command, parsed, output.as_ref()),
+            }) => HistoryCell::exec_command_lines(command, parsed, output.as_ref()),
            HistoryCell::CompletedMcpToolCallWithImageOutput { .. } => vec![
                Line::from("tool result (image output omitted)"),
                Line::from(""),
@@ -279,11 +310,11 @@ impl HistoryCell {
        parsed: Vec<ParsedCommand>,
        output: Option<CommandOutput>,
    ) -> Self {
-        HistoryCell::Exec {
+        HistoryCell::Exec(ExecCell {
            command,
            parsed,
            output,
-        }
+        })
    }
    fn exec_command_lines(