// codex-cli/tests/agent-cancel-prev-response.test.ts

import { describe, it, expect, vi } from "vitest";

// Stream that emits a function_call so the agent records a `lastResponseId`.
class StreamWithFunctionCall {
  public controller = { abort: vi.fn() };

  async *[Symbol.asyncIterator]() {
    // First, deliver the function call.
    yield {
      type: "response.output_item.done",
      item: {
        type: "function_call",
        id: "call123",
        name: "shell",
        arguments: JSON.stringify({ cmd: ["echo", "hi"] }),
      },
    } as any;

    // Then conclude the turn.
    yield {
      type: "response.completed",
      response: {
        id: "resp_func_call", // lastResponseId that would normally be stored
        status: "completed",
        output: [
          {
            type: "function_call",
            id: "call123",
            name: "shell",
            arguments: JSON.stringify({ cmd: ["echo", "hi"] }),
          },
        ],
      },
    } as any;
  }
}

vi.mock("openai", () => {
  const invocationBodies: Array<any> = [];
  let callNum = 0;
  class FakeOpenAI {
    public responses = {
      create: async (body: any) => {
        invocationBodies.push(body);
        callNum += 1;
        // First call streams a function_call, second call returns empty stream.
        if (callNum === 1) {
          return new StreamWithFunctionCall();
        }
        // Subsequent calls: empty stream.
        return new (class {
          public controller = { abort: vi.fn() };
          async *[Symbol.asyncIterator]() {
            /* no events */
          }
        })();
      },
    };
  }

  class APIConnectionTimeoutError extends Error {}

  return {
    __esModule: true,
    default: FakeOpenAI,
    APIConnectionTimeoutError,
    _test: {
      getBodies: () => invocationBodies,
    },
  };
});

// Stub helpers not relevant for this test.
vi.mock("../src/approvals.js", () => ({
  __esModule: true,
  alwaysApprovedCommands: new Set<string>(),
  canAutoApprove: () => ({ type: "auto-approve", runInSandbox: false }) as any,
}));

vi.mock("../src/format-command.js", () => ({
  __esModule: true,
  formatCommandForDisplay: (c: Array<string>) => c.join(" "),
}));

vi.mock("../src/utils/agent/log.js", () => ({
  __esModule: true,
  log: () => {},
  isLoggingEnabled: () => false,
}));

// Now import the agent.
import { AgentLoop } from "../src/utils/agent/agent-loop.js";

describe("cancel clears previous_response_id", () => {
  it("second run after cancel should NOT include previous_response_id", async () => {
    const { _test } = (await import("openai")) as any;

    const agent = new AgentLoop({
      model: "any",
      instructions: "",
      approvalPolicy: { mode: "auto" } as any,
      additionalWritableRoots: [],
      onItem: () => {},
      onLoading: () => {},
      getCommandConfirmation: async () => ({ review: "yes" }) as any,
      onLastResponseId: () => {},
      config: { model: "any", instructions: "", notify: false },
    });

    // First run that triggers a function_call, but we will cancel *before* the
    // turn completes so the tool result is never returned.
    agent.run([
      {
        type: "message",
        role: "user",
        content: [{ type: "input_text", text: "do something" }],
      },
    ] as any);
    // Give it a moment to receive the function_call.
    await new Promise((r) => setTimeout(r, 40));

    // Cancel (simulate ESC ESC).
    agent.cancel();

    // Second user input.
    await agent.run([
      {
        type: "message",
        role: "user",
        content: [{ type: "input_text", text: "new command" }],
      },
    ] as any);

    const bodies = _test.getBodies();
    expect(bodies.length).toBeGreaterThanOrEqual(2);

    // The *last* invocation belongs to the second run (after cancellation).
    const found = bodies.some(
      (b: any) =>
        Array.isArray(b.input) &&
        b.input.some(
          (i: any) =>
            i.type === "function_call_output" && i.call_id === "call123",
        ),
    );

    expect(found).toBe(true);
  });
});
Initial commit Signed-off-by: Ilan Bigio <ilan@openai.com> 2025-04-16 12:56:08 -04:00			`import { describe, it, expect, vi } from "vitest";`

			// Stream that emits a function_call so the agent records a `lastResponseId`.
			`class StreamWithFunctionCall {`
			`public controller = { abort: vi.fn() };`

			`async *[Symbol.asyncIterator]() {`
			`// First, deliver the function call.`
			`yield {`
			`type: "response.output_item.done",`
			`item: {`
			`type: "function_call",`
			`id: "call123",`
			`name: "shell",`
			`arguments: JSON.stringify({ cmd: ["echo", "hi"] }),`
			`},`
			`} as any;`

			`// Then conclude the turn.`
			`yield {`
			`type: "response.completed",`
			`response: {`
			`id: "resp_func_call", // lastResponseId that would normally be stored`
			`status: "completed",`
			`output: [`
			`{`
			`type: "function_call",`
			`id: "call123",`
			`name: "shell",`
			`arguments: JSON.stringify({ cmd: ["echo", "hi"] }),`
			`},`
			`],`
			`},`
			`} as any;`
			`}`
			`}`

			`vi.mock("openai", () => {`
			`const invocationBodies: Array<any> = [];`
			`let callNum = 0;`
			`class FakeOpenAI {`
			`public responses = {`
			`create: async (body: any) => {`
			`invocationBodies.push(body);`
			`callNum += 1;`
			`// First call streams a function_call, second call returns empty stream.`
			`if (callNum === 1) {`
			`return new StreamWithFunctionCall();`
			`}`
			`// Subsequent calls: empty stream.`
			`return new (class {`
			`public controller = { abort: vi.fn() };`
			`async *[Symbol.asyncIterator]() {`
			`/* no events */`
			`}`
			`})();`
			`},`
			`};`
			`}`

			`class APIConnectionTimeoutError extends Error {}`

			`return {`
			`__esModule: true,`
			`default: FakeOpenAI,`
			`APIConnectionTimeoutError,`
			`_test: {`
			`getBodies: () => invocationBodies,`
			`},`
			`};`
			`});`

			`// Stub helpers not relevant for this test.`
Back out @lib indirection in tsconfig.json (#111) 2025-04-16 14:16:53 -07:00			`vi.mock("../src/approvals.js", () => ({`
Initial commit Signed-off-by: Ilan Bigio <ilan@openai.com> 2025-04-16 12:56:08 -04:00			`__esModule: true,`
			`alwaysApprovedCommands: new Set<string>(),`
chore: upgrade prettier to v3 (#644) ## Description This PR addresses the following improvements: Unify Prettier Version: Currently, the Prettier version used in `/package.json` and `/codex-cli/package.json` are different. In this PR, we're updating both to use Prettier v3. - Prettier v3 introduces improved support for JavaScript and TypeScript. (e.g. the formatting scenario shown in the image below. This is more aligned with the TypeScript indentation standard). <img width="1126" alt="image" src="https://github.com/user-attachments/assets/6e237eb8-4553-4574-b336-ed9561c55370" /> Add Prettier Auto-Formatting in lint-staged: We've added a step to automatically run prettier --write on JavaScript and TypeScript files as part of the lint-staged process, before the ESLint checks. - This will help ensure that all committed code is properly formatted according to the project's Prettier configuration. 2025-04-25 22:21:50 +08:00			`canAutoApprove: () => ({ type: "auto-approve", runInSandbox: false }) as any,`
Initial commit Signed-off-by: Ilan Bigio <ilan@openai.com> 2025-04-16 12:56:08 -04:00			`}));`

Back out @lib indirection in tsconfig.json (#111) 2025-04-16 14:16:53 -07:00			`vi.mock("../src/format-command.js", () => ({`
Initial commit Signed-off-by: Ilan Bigio <ilan@openai.com> 2025-04-16 12:56:08 -04:00			`__esModule: true,`
			`formatCommandForDisplay: (c: Array<string>) => c.join(" "),`
			`}));`

			`vi.mock("../src/utils/agent/log.js", () => ({`
			`__esModule: true,`
			`log: () => {},`
			`isLoggingEnabled: () => false,`
			`}));`

			`// Now import the agent.`
			`import { AgentLoop } from "../src/utils/agent/agent-loop.js";`

			`describe("cancel clears previous_response_id", () => {`
			`it("second run after cancel should NOT include previous_response_id", async () => {`
			`const { _test } = (await import("openai")) as any;`

			`const agent = new AgentLoop({`
			`model: "any",`
			`instructions: "",`
			`approvalPolicy: { mode: "auto" } as any,`
add support for -w,--writable-root to add more writable roots for sandbox (#263) This adds support for a new flag, `-w,--writable-root`, that can be specified multiple times to _amend_ the list of folders that should be configured as "writable roots" by the sandbox used in `full-auto` mode. Values that are passed as relative paths will be resolved to absolute paths. Incidentally, this required updating a number of the `agent*.test.ts` files: it feels like some of the setup logic across those tests could be consolidated. In my testing, it seems that this might be slightly out of distribution for the model, as I had to explicitly tell it to run `apply_patch` and that it had the permissions to write those files (initially, it just showed me a diff and told me to apply it myself). Nevertheless, I think this is a good starting point. 2025-04-17 15:39:26 -07:00			`additionalWritableRoots: [],`
Initial commit Signed-off-by: Ilan Bigio <ilan@openai.com> 2025-04-16 12:56:08 -04:00			`onItem: () => {},`
			`onLoading: () => {},`
chore: upgrade prettier to v3 (#644) ## Description This PR addresses the following improvements: Unify Prettier Version: Currently, the Prettier version used in `/package.json` and `/codex-cli/package.json` are different. In this PR, we're updating both to use Prettier v3. - Prettier v3 introduces improved support for JavaScript and TypeScript. (e.g. the formatting scenario shown in the image below. This is more aligned with the TypeScript indentation standard). <img width="1126" alt="image" src="https://github.com/user-attachments/assets/6e237eb8-4553-4574-b336-ed9561c55370" /> Add Prettier Auto-Formatting in lint-staged: We've added a step to automatically run prettier --write on JavaScript and TypeScript files as part of the lint-staged process, before the ESLint checks. - This will help ensure that all committed code is properly formatted according to the project's Prettier configuration. 2025-04-25 22:21:50 +08:00			`getCommandConfirmation: async () => ({ review: "yes" }) as any,`
Initial commit Signed-off-by: Ilan Bigio <ilan@openai.com> 2025-04-16 12:56:08 -04:00			`onLastResponseId: () => {},`
feat: add notifications for MacOS using Applescript (#160) yolo'ed it with codex. Let me know if this looks good to you. https://github.com/openai/codex/issues/148 tested with: ``` npm run build:dev ``` <img width="377" alt="Screenshot 2025-04-16 at 18 12 01" src="https://github.com/user-attachments/assets/79aa799b-b0b9-479d-84f1-bfb83d34bfb9" /> 2025-04-17 16:19:26 -07:00			`config: { model: "any", instructions: "", notify: false },`
Initial commit Signed-off-by: Ilan Bigio <ilan@openai.com> 2025-04-16 12:56:08 -04:00			`});`

			`// First run that triggers a function_call, but we will cancel before the`
			`// turn completes so the tool result is never returned.`
			`agent.run([`
			`{`
			`type: "message",`
			`role: "user",`
			`content: [{ type: "input_text", text: "do something" }],`
			`},`
			`] as any);`
			`// Give it a moment to receive the function_call.`
			`await new Promise((r) => setTimeout(r, 40));`

			`// Cancel (simulate ESC ESC).`
			`agent.cancel();`

			`// Second user input.`
			`await agent.run([`
			`{`
			`type: "message",`
			`role: "user",`
			`content: [{ type: "input_text", text: "new command" }],`
			`},`
			`] as any);`

			`const bodies = _test.getBodies();`
			`expect(bodies.length).toBeGreaterThanOrEqual(2);`

			`// The last invocation belongs to the second run (after cancellation).`
			`const found = bodies.some(`
			`(b: any) =>`
			`Array.isArray(b.input) &&`
			`b.input.some(`
			`(i: any) =>`
			`i.type === "function_call_output" && i.call_id === "call123",`
			`),`
			`);`

			`expect(found).toBe(true);`
			`});`
			`});`