// codex-cli/tests/agent-cancel-race.test.ts

import { describe, it, expect, vi } from "vitest";
// This test reproduces the real‑world issue where the user cancels the current
// task (Esc Esc) but the model’s response has already started to stream — the
// partial answer still shows up in the UI.

// --- Mocks -----------------------------------------------------------------

/**
 * Fake streaming response used by the mocked OpenAI client.
 *
 * Async-iterating an instance waits about 10 ms and then produces exactly two
 * events: a `response.output_item.done` event carrying an assistant message
 * with the text "hello", followed by a `response.completed` event whose
 * output repeats that message.
 */
class FakeStream {
  // Spy standing in for the abort hook of a real stream's controller.
  public controller = { abort: vi.fn() };

  async *[Symbol.asyncIterator]() {
    // Builds a fresh copy of the assistant "hello" message on every call so
    // the two events below never share an object.
    const buildHelloMessage = () => ({
      type: "message",
      role: "assistant",
      id: "m1",
      content: [{ type: "text", text: "hello" }],
    });

    // Simulated network latency: leaves a window in which the test can call
    // cancel() before anything has been yielded.
    await new Promise((done) => setTimeout(done, 10));

    // The assistant message itself. The behaviour under test is that this
    // must not be emitted once cancel() has been called.
    const itemDoneEvent = {
      type: "response.output_item.done",
      item: buildHelloMessage(),
    } as any;
    yield itemDoneEvent;

    // Final event marking the response as completed.
    const completedEvent = {
      type: "response.completed",
      response: {
        id: "resp1",
        status: "completed",
        output: [buildHelloMessage()],
      },
    } as any;
    yield completedEvent;
  }
}

// Replace the "openai" module with a fake client. Its `responses.create`
// returns a FakeStream on the very first call and an empty stream on every
// later call, so any "hello" message observed by the test can only have come
// from the first (canceled) run.
vi.mock("openai", () => {
  // Stream that completes immediately without producing any events.
  class EmptyStream {
    public controller = { abort: vi.fn() };
    async *[Symbol.asyncIterator]() {
      // empty stream
    }
  }

  // Number of `responses.create` calls so far; shared by all FakeOpenAI
  // instances because it lives in the factory closure.
  let createCalls = 0;

  class FakeOpenAI {
    public responses = {
      create: async () => {
        createCalls += 1;
        if (createCalls === 1) {
          return new FakeStream();
        }
        return new EmptyStream();
      },
    };
  }

  // Exported alongside the default client so the mocked module also provides
  // this named error class.
  class APIConnectionTimeoutError extends Error {}

  return { __esModule: true, default: FakeOpenAI, APIConnectionTimeoutError };
});

// Stand-ins for helper modules that are referenced indirectly.

// approvals: `isSafeCommand` always answers null.
vi.mock("../src/approvals.js", () => {
  const isSafeCommand = () => null;
  return { __esModule: true, isSafeCommand };
});

// format-command: render a command by joining its parts with single spaces.
vi.mock("../src/format-command.js", () => {
  const formatCommandForDisplay = (parts: Array<string>) => {
    return parts.join(" ");
  };
  return { __esModule: true, formatCommandForDisplay };
});

// Module under test. Vitest hoists the `vi.mock` calls in this file above
// static imports, so the mocks are registered before the agent loop module is
// loaded even though this import appears between them in the source.
import { AgentLoop } from "../src/utils/agent/agent-loop.js";

// Stub the logger to avoid file-system side effects during tests: `log` is a
// no-op and logging is reported as disabled.
vi.mock("../src/utils/agent/log.js", () => ({
  __esModule: true,
  log: () => {},
  isLoggingEnabled: () => false,
}));

describe("Agent cancellation race", () => {
  // Regression test for the race in which a message belonging to a canceled
  // request could still be delivered after the user had canceled it.
  it("should not emit messages after cancel() is called", async () => {
    // Resolves after roughly `ms` milliseconds of real time.
    const sleep = (ms: number) =>
      new Promise((resolve) => setTimeout(resolve, ms));

    // Wraps plain text in the user-message input shape handed to `agent.run`.
    const userMessage = (text: string) => [
      {
        type: "message",
        role: "user",
        content: [{ type: "input_text", text }],
      },
    ];

    // Everything the agent reports through `onItem`, in arrival order.
    const emitted: Array<any> = [];

    const agent = new AgentLoop({
      additionalWritableRoots: [],
      model: "any",
      instructions: "",
      config: { model: "any", instructions: "", notify: false },
      approvalPolicy: { mode: "auto" } as any,
      onItem: (entry) => emitted.push(entry),
      onLoading: () => {},
      getCommandConfirmation: async () => ({ review: "yes" }) as any,
      onLastResponseId: () => {},
    });

    // Start the first run without awaiting it so it can be canceled mid-flight.
    agent.run(userMessage("say hello") as any);

    // Cancel after 5 ms - shorter than the 10 ms delay in FakeStream, so the
    // cancel is intended to land before the "hello" event is yielded.
    await sleep(5);
    agent.cancel();

    // Immediately start a second run, mimicking the UI letting the user type
    // something else; this resets the agent state.
    agent.run(userMessage("noop") as any);

    // Leave enough time for any pending stream events to be flushed.
    await sleep(40);

    // No assistant message may have reached `onItem`: the only stream that
    // yields one belongs to the canceled run.
    const assistantMsg = emitted.find((entry) => entry.role === "assistant");
    expect(assistantMsg).toBeUndefined();
  });
});
-												Initial commit

Signed-off-by: Ilan Bigio <ilan@openai.com>

											
										
										
											2025-04-16 12:56:08 -04:00
+								import { describe, it, expect, vi } from "vitest";
 								// This test reproduces the real‑world issue where the user cancels the current
 								// task (Esc Esc) but the model’s response has already started to stream — the
 								// partial answer still shows up in the UI.
 								// --- Mocks -----------------------------------------------------------------
 								class FakeStream {
 								  public controller = { abort: vi.fn() };
 								  async *[Symbol.asyncIterator]() {
-												perf: optimize token streaming with balanced approach (#635)

- Replace setTimeout(10ms) with queueMicrotask for immediate processing
- Add minimal 3ms setTimeout for rendering to maintain readable UX
- Reduces per-token delay while preserving streaming experience
- Add performance test to verify optimization works correctly

---------

Co-authored-by: Claude <noreply@anthropic.com>
Co-authored-by: Thibault Sottiaux <tibo@openai.com>
											
										
										
											2025-04-25 19:49:38 +02:00
+								    // Introduce a delay to simulate network latency and allow for cancel() to be called
 								    await new Promise((resolve) => setTimeout(resolve, 10));
-												Initial commit

Signed-off-by: Ilan Bigio <ilan@openai.com>

											
										
										
											2025-04-16 12:56:08 -04:00
+								    // Mimic an assistant message containing the word "hello".
-												perf: optimize token streaming with balanced approach (#635)

- Replace setTimeout(10ms) with queueMicrotask for immediate processing
- Add minimal 3ms setTimeout for rendering to maintain readable UX
- Reduces per-token delay while preserving streaming experience
- Add performance test to verify optimization works correctly

---------

Co-authored-by: Claude <noreply@anthropic.com>
Co-authored-by: Thibault Sottiaux <tibo@openai.com>
											
										
										
											2025-04-25 19:49:38 +02:00
+								    // Our fix should prevent this from being emitted after cancel() is called
-												Initial commit

Signed-off-by: Ilan Bigio <ilan@openai.com>

											
										
										
											2025-04-16 12:56:08 -04:00
+								    yield {
 								      type: "response.output_item.done",
 								      item: {
 								        type: "message",
 								        role: "assistant",
 								        id: "m1",
 								        content: [{ type: "text", text: "hello" }],
 								      },
 								    } as any;
 								    yield {
 								      type: "response.completed",
 								      response: {
 								        id: "resp1",
 								        status: "completed",
 								        output: [
 								          {
 								            type: "message",
 								            role: "assistant",
 								            id: "m1",
 								            content: [{ type: "text", text: "hello" }],
 								          },
 								        ],
 								      },
 								    } as any;
 								  }
 								}
 								vi.mock("openai", () => {
 								  let callCount = 0;
 								  class FakeOpenAI {
 								    public responses = {
 								      create: async () => {
 								        callCount += 1;
 								        // Only the *first* stream yields "hello" so that any later answer
 								        // clearly comes from the canceled run.
 								        return callCount === 1
 								          ? new FakeStream()
 								          : new (class {
 								              public controller = { abort: vi.fn() };
 								              async *[Symbol.asyncIterator]() {
 								                // empty stream
 								              }
 								            })();
 								      },
 								    };
 								  }
 								  class APIConnectionTimeoutError extends Error {}
 								  return { __esModule: true, default: FakeOpenAI, APIConnectionTimeoutError };
 								});
 								// Stubs for external helpers referenced indirectly.
-												Back out @lib indirection in tsconfig.json (#111)


											
										
										
											2025-04-16 14:16:53 -07:00
+								vi.mock("../src/approvals.js", () => ({
-												Initial commit

Signed-off-by: Ilan Bigio <ilan@openai.com>

											
										
										
											2025-04-16 12:56:08 -04:00
+								  __esModule: true,
 								  isSafeCommand: () => null,
 								}));
-												Back out @lib indirection in tsconfig.json (#111)


											
										
										
											2025-04-16 14:16:53 -07:00
+								vi.mock("../src/format-command.js", () => ({
-												Initial commit

Signed-off-by: Ilan Bigio <ilan@openai.com>

											
										
										
											2025-04-16 12:56:08 -04:00
+								  __esModule: true,
 								  formatCommandForDisplay: (c: Array<string>) => c.join(" "),
 								}));
 								// Stub the logger to avoid file‑system side effects during tests.
 								import { AgentLoop } from "../src/utils/agent/agent-loop.js";
 								vi.mock("../src/utils/agent/log.js", () => ({
 								  __esModule: true,
 								  log: () => {},
 								  isLoggingEnabled: () => false,
 								}));
 								describe("Agent cancellation race", () => {
-												perf: optimize token streaming with balanced approach (#635)

- Replace setTimeout(10ms) with queueMicrotask for immediate processing
- Add minimal 3ms setTimeout for rendering to maintain readable UX
- Reduces per-token delay while preserving streaming experience
- Add performance test to verify optimization works correctly

---------

Co-authored-by: Claude <noreply@anthropic.com>
Co-authored-by: Thibault Sottiaux <tibo@openai.com>
											
										
										
											2025-04-25 19:49:38 +02:00
+								  // This test verifies our fix for the race condition where a cancelled message
 								  // could still appear after the user cancels a request.
 								  it("should not emit messages after cancel() is called", async () => {
-												Initial commit

Signed-off-by: Ilan Bigio <ilan@openai.com>

											
										
										
											2025-04-16 12:56:08 -04:00
+								    const items: Array<any> = [];
 								    const agent = new AgentLoop({
-												add support for -w,--writable-root to add more writable roots for sandbox (#263)

This adds support for a new flag, `-w,--writable-root`, that can be
specified multiple times to _amend_ the list of folders that should be
configured as "writable roots" by the sandbox used in `full-auto` mode.
Values that are passed as relative paths will be resolved to absolute
paths.

Incidentally, this required updating a number of the `agent*.test.ts`
files: it feels like some of the setup logic across those tests could be
consolidated.

In my testing, it seems that this might be slightly out of distribution
for the model, as I had to explicitly tell it to run `apply_patch` and
that it had the permissions to write those files (initially, it just
showed me a diff and told me to apply it myself). Nevertheless, I think
this is a good starting point.
											
										
										
											2025-04-17 15:39:26 -07:00
+								      additionalWritableRoots: [],
-												Initial commit

Signed-off-by: Ilan Bigio <ilan@openai.com>

											
										
										
											2025-04-16 12:56:08 -04:00
+								      model: "any",
 								      instructions: "",
-												feat: add notifications for MacOS using Applescript (#160)

yolo'ed it with codex. Let me know if this looks good to you.

https://github.com/openai/codex/issues/148

tested with:
```
npm run build:dev
```

<img width="377" alt="Screenshot 2025-04-16 at 18 12 01"
src="https://github.com/user-attachments/assets/79aa799b-b0b9-479d-84f1-bfb83d34bfb9"
/>
											
										
										
											2025-04-17 16:19:26 -07:00
+								      config: { model: "any", instructions: "", notify: false },
-												Initial commit

Signed-off-by: Ilan Bigio <ilan@openai.com>

											
										
										
											2025-04-16 12:56:08 -04:00
+								      approvalPolicy: { mode: "auto" } as any,
 								      onItem: (i) => items.push(i),
 								      onLoading: () => {},
-												chore: upgrade prettier to v3 (#644)

## Description

This PR addresses the following improvements:

**Unify Prettier Version**: Currently, the Prettier version used in
`/package.json` and `/codex-cli/package.json` are different. In this PR,
we're updating both to use Prettier v3.

- Prettier v3 introduces improved support for JavaScript and TypeScript.
(e.g. the formatting scenario shown in the image below. This is more
aligned with the TypeScript indentation standard).

<img width="1126" alt="image"
src="https://github.com/user-attachments/assets/6e237eb8-4553-4574-b336-ed9561c55370"
/>

**Add Prettier Auto-Formatting in lint-staged**: We've added a step to
automatically run prettier --write on JavaScript and TypeScript files as
part of the lint-staged process, before the ESLint checks.

- This will help ensure that all committed code is properly formatted
according to the project's Prettier configuration.
											
										
										
											2025-04-25 22:21:50 +08:00
+								      getCommandConfirmation: async () => ({ review: "yes" }) as any,
-												Initial commit

Signed-off-by: Ilan Bigio <ilan@openai.com>

											
										
										
											2025-04-16 12:56:08 -04:00
+								      onLastResponseId: () => {},
 								    });
 								    const input = [
 								      {
 								        type: "message",
 								        role: "user",
 								        content: [{ type: "input_text", text: "say hello" }],
 								      },
 								    ];
 								    agent.run(input as any);
 								    // Cancel after the stream has started.
 								    await new Promise((r) => setTimeout(r, 5));
 								    agent.cancel();
 								    // Immediately issue a new (empty) command to mimic the UI letting the user
 								    // type something else – this resets the agent state.
 								    agent.run([
 								      {
 								        type: "message",
 								        role: "user",
 								        content: [{ type: "input_text", text: "noop" }],
 								      },
 								    ] as any);
 								    // Give everything time to flush.
 								    await new Promise((r) => setTimeout(r, 40));
 								    const assistantMsg = items.find((i) => i.role === "assistant");
-												perf: optimize token streaming with balanced approach (#635)

- Replace setTimeout(10ms) with queueMicrotask for immediate processing
- Add minimal 3ms setTimeout for rendering to maintain readable UX
- Reduces per-token delay while preserving streaming experience
- Add performance test to verify optimization works correctly

---------

Co-authored-by: Claude <noreply@anthropic.com>
Co-authored-by: Thibault Sottiaux <tibo@openai.com>
											
										
										
											2025-04-25 19:49:38 +02:00
+								    // Our fix should prevent the assistant message from being delivered after cancel
 								    // Now that we've fixed it, the test should pass
-												Initial commit

Signed-off-by: Ilan Bigio <ilan@openai.com>

											
										
										
											2025-04-16 12:56:08 -04:00
+								    expect(assistantMsg).toBeUndefined();
 								  });
 								});