// llmx/codex-cli/src/utils/agent/agent-loop.ts

import type { ReviewDecision } from "./review.js";
import type { ApplyPatchCommand, ApprovalPolicy } from "../../approvals.js";
import type { AppConfig } from "../config.js";
import type { ResponseEvent } from "../responses.js";
import type {
ResponseFunctionToolCall,
ResponseInputItem,
ResponseItem,
ResponseCreateParams,
FunctionTool,
} from "openai/resources/responses/responses.mjs";
import type { Reasoning } from "openai/resources.mjs";
import { OPENAI_TIMEOUT_MS, getApiKey, getBaseUrl } from "../config.js";
import { log } from "../logger/log.js";
import { parseToolCallArguments } from "../parsers.js";
import { responsesCreateViaChatCompletions } from "../responses.js";
import {
ORIGIN,
CLI_VERSION,
getSessionId,
setCurrentModel,
setSessionId,
} from "../session.js";
import { handleExecCommand } from "./handle-exec-command.js";
import { randomUUID } from "node:crypto";
import OpenAI, { APIConnectionTimeoutError } from "openai";
// Wait time before retrying after rate limit errors (ms).
const RATE_LIMIT_RETRY_WAIT_MS = parseInt(
process.env["OPENAI_RATE_LIMIT_RETRY_WAIT_MS"] || "2500",
10,
);
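// Illustrative only: the retry loops below back off as
// RATE_LIMIT_RETRY_WAIT_MS * 2 ** (attempt - 1), so with the default of
// 2500 ms the waits grow roughly 2500 -> 5000 -> 10000 -> 20000 ms across
// attempts unless the error message suggests an explicit retry delay. The
// base wait can be overridden via the OPENAI_RATE_LIMIT_RETRY_WAIT_MS
// environment variable.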
export type CommandConfirmation = {
review: ReviewDecision;
applyPatch?: ApplyPatchCommand | undefined;
customDenyMessage?: string;
explanation?: string;
};
const alreadyProcessedResponses = new Set();
type AgentLoopParams = {
model: string;
provider?: string;
config?: AppConfig;
instructions?: string;
approvalPolicy: ApprovalPolicy;
/**
* When `true`, model responses are *not* stored on the server side; the agent
* instead sends the *full* conversation context as the `input` payload on
* every request and omits the `previous_response_id` parameter. Defaults to
* `false`, preserving the current behaviour of relying on server-side storage
* (which allows `previous_response_id` to provide conversational context).
*/
disableResponseStorage?: boolean;
onItem: (item: ResponseItem) => void;
onLoading: (loading: boolean) => void;
/** Extra writable roots to use with sandbox execution. */
additionalWritableRoots: ReadonlyArray<string>;
/** Called when the command is not auto-approved to request explicit user review. */
getCommandConfirmation: (
command: Array<string>,
applyPatch: ApplyPatchCommand | undefined,
) => Promise<CommandConfirmation>;
onLastResponseId: (lastResponseId: string) => void;
};
const shellTool: FunctionTool = {
type: "function",
name: "shell",
description: "Runs a shell command, and returns its output.",
strict: false,
parameters: {
type: "object",
properties: {
command: { type: "array", items: { type: "string" } },
workdir: {
type: "string",
description: "The working directory for the command.",
},
timeout: {
type: "number",
description:
"The maximum time to wait for the command to complete in milliseconds.",
},
},
required: ["command"],
additionalProperties: false,
},
};
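// For illustration (shape only; the values are hypothetical): a `shell` tool
// call emitted by the model carries JSON-encoded arguments matching the
// schema above, e.g.
//
//   { "command": ["ls", "-la"], "workdir": "/repo", "timeout": 10000 }
//
// Only `command` is required; `workdir` and `timeout` are optional.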
export class AgentLoop {
private model: string;
private provider: string;
private instructions?: string;
private approvalPolicy: ApprovalPolicy;
private config: AppConfig;
private additionalWritableRoots: ReadonlyArray<string>;
/** Whether server-side persistence of conversation state is disabled */
private readonly disableResponseStorage: boolean;
// OpenAI client instance. Keeping the concrete `OpenAI` type (rather than
// sprinkling `any` across the implementation) sidesteps typing issues with
// the OpenAI package under the TS 5+ `moduleResolution=bundler` setup while
// still tolerating paths where the SDK types may not perfectly match.
private oai: OpenAI;
private onItem: (item: ResponseItem) => void;
private onLoading: (loading: boolean) => void;
private getCommandConfirmation: (
command: Array<string>,
applyPatch: ApplyPatchCommand | undefined,
) => Promise<CommandConfirmation>;
private onLastResponseId: (lastResponseId: string) => void;
/**
* A reference to the currently active stream returned from the OpenAI
* client. We keep this so that we can abort the request if the user decides
* to interrupt the current task (e.g. via the escape hotkey).
*/
private currentStream: unknown | null = null;
/** Incremented with every call to `run()`. Allows us to ignore stray events
* from streams that belong to a previous run which might still be emitting
* after the user has canceled and issued a new command. */
private generation = 0;
/** AbortController for in-progress tool calls (e.g. shell commands). */
private execAbortController: AbortController | null = null;
/** Set to true when `cancel()` is called so `run()` can exit early. */
private canceled = false;
/**
* Local conversation transcript used when `disableResponseStorage === true`. Holds
* all non-system items exchanged so far so we can provide full context on
* every request.
*/
private transcript: Array<ResponseInputItem> = [];
/** Function calls that were emitted by the model but never answered because
* the user cancelled the run. We keep the `call_id`s around so the *next*
* request can send a dummy `function_call_output` that satisfies the
* contract and prevents the
* 400 | No tool output found for function call
* error from OpenAI. */
private pendingAborts: Set<string> = new Set();
/** Set to true by `terminate()`; prevents any further use of the instance. */
private terminated = false;
/** Master abort controller; fires when terminate() is invoked. */
private readonly hardAbort = new AbortController();
/**
* Abort the ongoing request/stream, if any. This allows callers (typically
* the UI layer) to interrupt the current agent step so the user can issue
* new instructions without waiting for the model to finish.
*/
public cancel(): void {
if (this.terminated) {
return;
}
// Reset the current stream to allow new requests
this.currentStream = null;
log(
`AgentLoop.cancel() invoked - currentStream=${Boolean(
this.currentStream,
)} execAbortController=${Boolean(this.execAbortController)} generation=${
this.generation
}`,
);
(
this.currentStream as { controller?: { abort?: () => void } } | null
)?.controller?.abort?.();
this.canceled = true;
// Abort any in-progress tool calls
this.execAbortController?.abort();
// Create a new abort controller for future tool calls
this.execAbortController = new AbortController();
log("AgentLoop.cancel(): execAbortController.abort() called");
// NOTE: We intentionally do *not* clear `lastResponseId` here. If the
// stream produced a `function_call` before the user cancelled, OpenAI now
// expects a corresponding `function_call_output` that must reference that
// very same response ID. We therefore keep the ID around so the
// follow-up request can still satisfy the contract.
// If we have *not* seen any function_call IDs yet there is nothing that
// needs to be satisfied in a follow-up request. In that case we clear
// the stored lastResponseId so a subsequent run starts a clean turn.
if (this.pendingAborts.size === 0) {
try {
this.onLastResponseId("");
} catch {
/* ignore */
}
}
this.onLoading(false);
/* Inform the UI that the run was aborted by the user. */
// const cancelNotice: ResponseItem = {
// id: `cancel-${Date.now()}`,
// type: "message",
// role: "system",
// content: [
// {
// type: "input_text",
// text: "⏹️ Execution canceled by user.",
// },
// ],
// };
// this.onItem(cancelNotice);
this.generation += 1;
log(`AgentLoop.cancel(): generation bumped to ${this.generation}`);
}
/**
* Hard-stop the agent loop. After calling this method the instance becomes
* unusable: any in-flight operations are aborted and subsequent invocations
* of `run()` will throw.
*/
public terminate(): void {
if (this.terminated) {
return;
}
this.terminated = true;
this.hardAbort.abort();
this.cancel();
}
public sessionId: string;
/*
* Cumulative thinking time across this AgentLoop instance (ms).
* Currently not used anywhere; commented out to keep the strict compiler
* happy under `noUnusedLocals`. Restore when telemetry support lands.
*/
// private cumulativeThinkingMs = 0;
constructor({
model,
provider = "openai",
instructions,
approvalPolicy,
disableResponseStorage,
// `config` used to be required. Some unit tests (and potentially other
// callers) instantiate `AgentLoop` without passing it, so we make it
// optional and fall back to sensible defaults. This keeps the public
// surface backwards-compatible and prevents runtime errors like
// "Cannot read properties of undefined (reading 'apiKey')" when accessing
// `config.apiKey` below.
config,
onItem,
onLoading,
getCommandConfirmation,
onLastResponseId,
additionalWritableRoots,
}: AgentLoopParams & { config?: AppConfig }) {
this.model = model;
this.provider = provider;
this.instructions = instructions;
this.approvalPolicy = approvalPolicy;
// If no `config` has been provided we derive a minimal stub so that the
// rest of the implementation can rely on `this.config` always being a
// defined object. We purposefully copy over the `model` and
// `instructions` that have already been passed explicitly so that
// downstream consumers (e.g. telemetry) still observe the correct values.
this.config =
config ??
({
model,
instructions: instructions ?? "",
} as AppConfig);
this.additionalWritableRoots = additionalWritableRoots;
this.onItem = onItem;
this.onLoading = onLoading;
this.getCommandConfirmation = getCommandConfirmation;
this.onLastResponseId = onLastResponseId;
this.disableResponseStorage = disableResponseStorage ?? false;
this.sessionId = getSessionId() || randomUUID().replaceAll("-", "");
// Configure OpenAI client with optional timeout (ms) from environment
const timeoutMs = OPENAI_TIMEOUT_MS;
const apiKey = getApiKey(this.provider);
const baseURL = getBaseUrl(this.provider);
this.oai = new OpenAI({
// The OpenAI JS SDK only requires `apiKey` when making requests against
// the official API. When running unit tests we stub out all network
// calls so an undefined key is perfectly fine. We therefore only set
// the property if we actually have a value to avoid triggering runtime
// errors inside the SDK (it validates that `apiKey` is a non-empty
// string when the field is present).
...(apiKey ? { apiKey } : {}),
baseURL,
defaultHeaders: {
originator: ORIGIN,
version: CLI_VERSION,
session_id: this.sessionId,
},
...(timeoutMs !== undefined ? { timeout: timeoutMs } : {}),
});
setSessionId(this.sessionId);
setCurrentModel(this.model);
this.hardAbort = new AbortController();
this.hardAbort.signal.addEventListener(
"abort",
() => this.execAbortController?.abort(),
{ once: true },
);
}
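/*
 * Minimal wiring sketch (illustrative only; the callback bodies, the approval
 * policy value and the helper names below are placeholders chosen by the
 * caller, not exports of this module):
 *
 *   const agent = new AgentLoop({
 *     model: "o4-mini",
 *     approvalPolicy: myApprovalPolicy,
 *     additionalWritableRoots: [],
 *     onItem: (item) => ui.render(item),
 *     onLoading: (busy) => ui.setSpinner(busy),
 *     getCommandConfirmation: async (command, applyPatch) =>
 *       promptUserForReview(command, applyPatch),
 *     onLastResponseId: (id) => saveLastResponseId(id),
 *   });
 *   await agent.run([
 *     { type: "message", role: "user", content: [{ type: "input_text", text: "explain this repo" }] },
 *   ]);
 */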
private async handleFunctionCall(
item: ResponseFunctionToolCall,
): Promise<Array<ResponseInputItem>> {
// If the agent has been canceled in the meantime we should not perform any
// additional work. Returning an empty array ensures that we neither execute
// the requested tool call nor enqueue any follow-up input items. This keeps
// the cancellation semantics intuitive for users: once they interrupt a
// task, no further actions related to that task should be taken.
if (this.canceled) {
return [];
}
// ---------------------------------------------------------------------
// Normalise the function-call item into a consistent shape regardless of
// whether it originated from the `/responses` or the `/chat/completions`
// endpoint; their JSON differs slightly.
// ---------------------------------------------------------------------
const isChatStyle =
// The chat endpoint nests function details under a `function` key.
// We conservatively treat the presence of this field as a signal that
// we are dealing with the chat format.
// eslint-disable-next-line @typescript-eslint/no-explicit-any
(item as any).function != null;
const name: string | undefined = isChatStyle
? // eslint-disable-next-line @typescript-eslint/no-explicit-any
(item as any).function?.name
: // eslint-disable-next-line @typescript-eslint/no-explicit-any
(item as any).name;
const rawArguments: string | undefined = isChatStyle
? // eslint-disable-next-line @typescript-eslint/no-explicit-any
(item as any).function?.arguments
: // eslint-disable-next-line @typescript-eslint/no-explicit-any
(item as any).arguments;
// The OpenAI "function_call" item may have either `call_id` (responses
// endpoint) or `id` (chat endpoint). Prefer `call_id` if present but fall
// back to `id` to remain compatible.
// eslint-disable-next-line @typescript-eslint/no-explicit-any
const callId: string = (item as any).call_id ?? (item as any).id;
const args = parseToolCallArguments(rawArguments ?? "{}");
log(
`handleFunctionCall(): name=${
name ?? "undefined"
} callId=${callId} args=${rawArguments}`,
);
if (args == null) {
const outputItem: ResponseInputItem.FunctionCallOutput = {
type: "function_call_output",
call_id: callId,
output: `invalid arguments: ${rawArguments}`,
};
return [outputItem];
}
const outputItem: ResponseInputItem.FunctionCallOutput = {
type: "function_call_output",
// `call_id` is mandatory; ensure we never send `undefined`, which would
// trigger the "No tool output found…" 400 from the API.
call_id: callId,
output: "no function found",
};
// We intentionally *do not* remove this `callId` from the `pendingAborts`
// set right away. The output produced below is only queued up for the
// *next* request to the OpenAI API; it has not been delivered yet. If
// the user presses ESC-ESC (i.e. invokes `cancel()`) in the small window
// between queuing the result and the actual network call, we need to be
// able to surface a synthetic `function_call_output` marked as
// "aborted". Keeping the ID in the set until the run concludes
// successfully lets the next `run()` differentiate between an aborted
// tool call (needs the synthetic output) and a completed one (cleared
// below in the `flush()` helper).
// Used to tell the model to stop if needed.
const additionalItems: Array<ResponseInputItem> = [];
// TODO: allow arbitrary function calls (beyond shell/container.exec)
if (name === "container.exec" || name === "shell") {
const {
outputText,
metadata,
additionalItems: additionalItemsFromExec,
} = await handleExecCommand(
args,
this.config,
this.approvalPolicy,
this.additionalWritableRoots,
this.getCommandConfirmation,
this.execAbortController?.signal,
);
outputItem.output = JSON.stringify({ output: outputText, metadata });
if (additionalItemsFromExec) {
additionalItems.push(...additionalItemsFromExec);
}
}
return [outputItem, ...additionalItems];
}
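// Illustrative return value for a completed `shell` call (shape only; the
// call id and payload values are hypothetical):
//
//   [{
//     type: "function_call_output",
//     call_id: "call_abc123",
//     output: JSON.stringify({ output: "<captured stdout/stderr>", metadata: { exit_code: 0, duration_seconds: 1 } }),
//   }]
//
// plus any `additionalItems` contributed by `handleExecCommand`.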
public async run(
input: Array<ResponseInputItem>,
previousResponseId: string = "",
): Promise<void> {
// ---------------------------------------------------------------------
// Top-level error wrapper so that known transient network issues like
// `ERR_STREAM_PREMATURE_CLOSE` do not crash the entire CLI process.
// Instead we surface the failure to the user as a regular system message
// and terminate the current run gracefully. The calling UI can then let
// the user retry the request if desired.
// ---------------------------------------------------------------------
try {
if (this.terminated) {
throw new Error("AgentLoop has been terminated");
}
// Record when we start "thinking" so we can report accurate elapsed time.
const thinkingStart = Date.now();
// Bump generation so that any late events from previous runs can be
// identified and dropped.
const thisGeneration = ++this.generation;
// Reset cancellation flag and stream for a fresh run.
this.canceled = false;
this.currentStream = null;
// Create a fresh AbortController for this run so that tool calls from a
// previous run do not accidentally get signalled.
this.execAbortController = new AbortController();
log(
`AgentLoop.run(): new execAbortController created (${this.execAbortController.signal}) for generation ${this.generation}`,
);
// NOTE: We no longer (re)attach an `abort` listener to `hardAbort` here.
// A single listener that forwards the `abort` to the current
// `execAbortController` is installed once in the constructor. Re-adding a
// new listener on every `run()` caused the same `AbortSignal` instance to
// accumulate listeners which in turn triggered Node's
// `MaxListenersExceededWarning` after ten invocations.
// Track the response ID from the last *stored* response so we can pass it
// as `previous_response_id` on the next request. This only applies when the
// backend stores conversation state (`disableResponseStorage === false`);
// in that case we forward the caller-supplied `previousResponseId` so the
// model sees the full context. When storage is disabled we *must not* send
// any ID because the server no longer retains the referenced response, so
// we deliberately ignore the caller-supplied value.
let lastResponseId: string = this.disableResponseStorage
? ""
: previousResponseId;
// If there are unresolved function calls from a previously cancelled run
// we have to emit dummy tool outputs so that the API no longer expects
// them. We prepend them to the user-supplied input so they appear
// first in the conversation turn.
const abortOutputs: Array<ResponseInputItem> = [];
if (this.pendingAborts.size > 0) {
for (const id of this.pendingAborts) {
abortOutputs.push({
type: "function_call_output",
call_id: id,
output: JSON.stringify({
output: "aborted",
metadata: { exit_code: 1, duration_seconds: 0 },
}),
} as ResponseInputItem.FunctionCallOutput);
}
// Once converted the pending list can be cleared.
this.pendingAborts.clear();
}
// Build the input list for this turn. When responses are stored on the
// server we can simply send the *delta* (the new user input as well as
// any pending abort outputs) and rely on `previous_response_id` for
// context. When storage is disabled the server has no memory of the
// conversation, so we must include the *entire* transcript (minus system
// messages) on every call.
let turnInput: Array<ResponseInputItem> = [];
// Keeps track of how many items in `turnInput` stem from the existing
// transcript so we can avoid re-emitting them to the UI. Only used when
// `disableResponseStorage === true`.
let transcriptPrefixLen = 0;
const stripInternalFields = (
item: ResponseInputItem,
): ResponseInputItem => {
// Clone shallowly and remove fields that are not part of the public
// schema expected by the OpenAI Responses API.
// We shallow-clone the item so that subsequent mutations (deleting
// internal fields) do not affect the original object which may still
// be referenced elsewhere (e.g. UI components).
const clean = { ...item } as Record<string, unknown>;
delete clean["duration_ms"];
// Remove OpenAI-assigned identifiers and transient status so the
// backend does not reject items that were never persisted because we
// use `store: false`.
delete clean["id"];
delete clean["status"];
return clean as unknown as ResponseInputItem;
};
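// For example (illustrative values): an item such as
//   { id: "msg_123", status: "completed", duration_ms: 420, type: "message", role: "assistant", content: [...] }
// is sent to the API as
//   { type: "message", role: "assistant", content: [...] }
// because `id`, `status` and `duration_ms` are stripped first.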
if (this.disableResponseStorage) {
// Remember where the existing transcript ends; everything after this
// index in the upcoming `turnInput` list will be *new* for this turn
// and therefore needs to be surfaced to the UI.
transcriptPrefixLen = this.transcript.length;
// Ensure the transcript is up to date with the latest user input so
// that subsequent iterations see a complete history.
// `turnInput` is still empty at this point (it will be filled later).
// We need to look at the *input* items the user just supplied.
this.transcript.push(...filterToApiMessages(input));
turnInput = [...this.transcript, ...abortOutputs].map(
stripInternalFields,
);
} else {
turnInput = [...abortOutputs, ...input].map(stripInternalFields);
}
this.onLoading(true);
const staged: Array<ResponseItem | undefined> = [];
const stageItem = (item: ResponseItem) => {
// Ignore any stray events that belong to older generations.
if (thisGeneration !== this.generation) {
return;
}
// Store the item so the final flush can still operate on a complete list.
// We'll nil out entries once they're delivered.
const idx = staged.push(item) - 1;
// Instead of emitting synchronously we schedule a short-delay delivery.
// This accomplishes two things:
// 1. The UI still sees new messages almost immediately, creating the
// perception of real-time updates.
// 2. If the user calls `cancel()` in the small window right after the
// item was staged we can still abort the delivery because the
// generation counter will have been bumped by `cancel()`.
setTimeout(() => {
if (
thisGeneration === this.generation &&
!this.canceled &&
!this.hardAbort.signal.aborted
) {
this.onItem(item);
// Mark as delivered so flush won't re-emit it
staged[idx] = undefined;
// When we operate without server-side storage we keep our own
// transcript so we can provide full context on subsequent calls.
if (this.disableResponseStorage) {
// Exclude system messages from transcript as they do not form
// part of the assistant/user dialogue that the model needs.
// eslint-disable-next-line @typescript-eslint/no-explicit-any
const role = (item as any).role;
if (role !== "system") {
// Clone the item to avoid mutating the object that is also
// rendered in the UI. We need to strip auxiliary metadata
// such as `duration_ms` which is not part of the Responses
// API schema and therefore causes a 400 error when included
// in subsequent requests whose context is sent verbatim.
// Skip items that we have already inserted earlier or that the
// model does not need to see again in the next turn.
// • function_call: superseded by the forthcoming
// function_call_output.
// • reasoning: internal only, never sent back.
// • user messages: we added these to the transcript when
// building the first turnInput; stageItem would add a
// duplicate.
if (
(item as ResponseInputItem).type === "function_call" ||
(item as ResponseInputItem).type === "reasoning" ||
((item as ResponseInputItem).type === "message" &&
// eslint-disable-next-line @typescript-eslint/no-explicit-any
(item as any).role === "user")
) {
return;
}
const clone: ResponseInputItem = {
...(item as unknown as ResponseInputItem),
} as ResponseInputItem;
// The `duration_ms` field is only added to reasoning items to
// show elapsed time in the UI. It must not be forwarded back
// to the server.
// eslint-disable-next-line @typescript-eslint/no-explicit-any
delete (clone as any).duration_ms;
this.transcript.push(clone);
}
}
}
}, 10);
};
while (turnInput.length > 0) {
if (this.canceled || this.hardAbort.signal.aborted) {
this.onLoading(false);
return;
}
// Figure out which subset of `turnInput` constitutes *new* information
// for the UI. Only these items are surfaced; replaying the entire
// transcript on every iteration (when response storage is disabled)
// would duplicate messages already shown in earlier turns, while freshly
// generated `function_call_output`s still need to appear immediately.
const deltaInput = this.disableResponseStorage
? turnInput.slice(transcriptPrefixLen)
: [...turnInput];
for (const item of deltaInput) {
stageItem(item as ResponseItem);
}
// Send request to OpenAI with retry on timeout
let stream;
// Retry loop for transient errors. Up to MAX_RETRIES attempts.
const MAX_RETRIES = 5;
for (let attempt = 1; attempt <= MAX_RETRIES; attempt++) {
try {
let reasoning: Reasoning | undefined;
if (this.model.startsWith("o")) {
reasoning = { effort: "high" };
if (this.model === "o3" || this.model === "o4-mini") {
reasoning.summary = "auto";
}
}
const mergedInstructions = [prefix, this.instructions]
.filter(Boolean)
.join("\n");
const responseCall =
!this.config.provider ||
this.config.provider?.toLowerCase() === "openai"
? (params: ResponseCreateParams) =>
this.oai.responses.create(params)
: (params: ResponseCreateParams) =>
responsesCreateViaChatCompletions(
this.oai,
params as ResponseCreateParams & { stream: true },
);
log(
`instructions (length ${mergedInstructions.length}): ${mergedInstructions}`,
);
// eslint-disable-next-line no-await-in-loop
stream = await responseCall({
model: this.model,
instructions: mergedInstructions,
input: turnInput,
stream: true,
parallel_tool_calls: false,
reasoning,
...(this.config.flexMode ? { service_tier: "flex" } : {}),
...(this.disableResponseStorage
? { store: false }
: {
store: true,
previous_response_id: lastResponseId || undefined,
}),
tools: [shellTool],
// Explicitly tell the model it is allowed to pick whatever
// tool it deems appropriate. Omitting this sometimes leads to
// the model ignoring the available tools and responding with
// plain text instead (resulting in a missing tool call).
tool_choice: "auto",
});
break;
} catch (error) {
const isTimeout = error instanceof APIConnectionTimeoutError;
// Lazily look up the APIConnectionError class at runtime to
// accommodate the test environment's minimal OpenAI mocks which
// do not define the class. Falling back to `false` when the
// export is absent ensures the check never throws.
// eslint-disable-next-line @typescript-eslint/no-explicit-any
const ApiConnErrCtor = (OpenAI as any).APIConnectionError as // eslint-disable-next-line @typescript-eslint/no-explicit-any
| (new (...args: any) => Error)
| undefined;
const isConnectionError = ApiConnErrCtor
? error instanceof ApiConnErrCtor
: false;
// eslint-disable-next-line @typescript-eslint/no-explicit-any
const errCtx = error as any;
const status =
errCtx?.status ?? errCtx?.httpStatus ?? errCtx?.statusCode;
const isServerError = typeof status === "number" && status >= 500;
if (
(isTimeout || isServerError || isConnectionError) &&
attempt < MAX_RETRIES
) {
log(
`OpenAI request failed (attempt ${attempt}/${MAX_RETRIES}), retrying...`,
);
continue;
}
const isTooManyTokensError =
(errCtx.param === "max_tokens" ||
(typeof errCtx.message === "string" &&
/max_tokens is too large/i.test(errCtx.message))) &&
errCtx.type === "invalid_request_error";
if (isTooManyTokensError) {
this.onItem({
id: `error-${Date.now()}`,
type: "message",
role: "system",
content: [
{
type: "input_text",
text: "⚠️ The current request exceeds the maximum context length supported by the chosen model. Please shorten the conversation, run /clear, or switch to a model with a larger context window and try again.",
},
],
});
this.onLoading(false);
return;
}
const isRateLimit =
status === 429 ||
errCtx.code === "rate_limit_exceeded" ||
errCtx.type === "rate_limit_exceeded" ||
/rate limit/i.test(errCtx.message ?? "");
if (isRateLimit) {
if (attempt < MAX_RETRIES) {
// Exponential backoff: base wait * 2^(attempt-1), or use suggested retry time
// if provided.
let delayMs = RATE_LIMIT_RETRY_WAIT_MS * 2 ** (attempt - 1);
// Parse suggested retry time from error message, e.g., "Please try again in 1.3s"
const msg = errCtx?.message ?? "";
const m = /(?:retry|try) again in ([\d.]+)s/i.exec(msg);
if (m && m[1]) {
const suggested = parseFloat(m[1]) * 1000;
if (!Number.isNaN(suggested)) {
delayMs = suggested;
}
}
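// e.g. (hypothetical message) "Rate limit reached ... Please try again in 1.3s"
// would yield delayMs = 1300 instead of the exponential default.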
log(
`OpenAI rate limit exceeded (attempt ${attempt}/${MAX_RETRIES}), retrying in ${Math.round(
delayMs,
)} ms...`,
);
// eslint-disable-next-line no-await-in-loop
await new Promise((resolve) => setTimeout(resolve, delayMs));
continue;
} else {
// We have exhausted all retry attempts. Surface a message so the user understands
// why the request failed and can decide how to proceed (e.g. wait and retry later
// or switch to a different model / account).
const errorDetails = [
`Status: ${status || "unknown"}`,
`Code: ${errCtx.code || "unknown"}`,
`Type: ${errCtx.type || "unknown"}`,
`Message: ${errCtx.message || "unknown"}`,
].join(", ");
this.onItem({
id: `error-${Date.now()}`,
type: "message",
role: "system",
content: [
{
type: "input_text",
text: `⚠️ Rate limit reached. Error details: ${errorDetails}. Please try again later.`,
},
],
});
this.onLoading(false);
return;
}
}
const isClientError =
(typeof status === "number" &&
status >= 400 &&
status < 500 &&
status !== 429) ||
errCtx.code === "invalid_request_error" ||
errCtx.type === "invalid_request_error";
if (isClientError) {
this.onItem({
id: `error-${Date.now()}`,
type: "message",
role: "system",
content: [
{
type: "input_text",
// Surface the request ID when it is present on the error so users
// can reference it when contacting support or inspecting logs.
text: (() => {
const reqId =
(
errCtx as Partial<{
request_id?: string;
requestId?: string;
}>
)?.request_id ??
(
errCtx as Partial<{
request_id?: string;
requestId?: string;
}>
)?.requestId;
const errorDetails = [
`Status: ${status || "unknown"}`,
`Code: ${errCtx.code || "unknown"}`,
`Type: ${errCtx.type || "unknown"}`,
`Message: ${errCtx.message || "unknown"}`,
].join(", ");
return `⚠️ OpenAI rejected the request${
reqId ? ` (request ID: ${reqId})` : ""
}. Error details: ${errorDetails}. Please verify your settings and try again.`;
})(),
},
],
});
this.onLoading(false);
return;
}
throw error;
}
}
// If the user requested cancellation while we were awaiting the network
// request, abort immediately before we start handling the stream.
if (this.canceled || this.hardAbort.signal.aborted) {
// `stream` is defined; abort to avoid wasting tokens/server work
try {
(
stream as { controller?: { abort?: () => void } }
)?.controller?.abort?.();
} catch {
/* ignore */
}
this.onLoading(false);
return;
}
// Keep track of the active stream so it can be aborted on demand.
this.currentStream = stream;
// guard against an undefined stream before iterating
if (!stream) {
this.onLoading(false);
log("AgentLoop.run(): stream is undefined");
return;
}
const MAX_STREAM_RETRIES = 5;
let streamRetryAttempt = 0;
// eslint-disable-next-line no-constant-condition
while (true) {
try {
let newTurnInput: Array<ResponseInputItem> = [];
// eslint-disable-next-line no-await-in-loop
for await (const event of stream as AsyncIterable<ResponseEvent>) {
log(`AgentLoop.run(): response event ${event.type}`);
// process and surface each item (no-op until we can depend on streaming events)
if (event.type === "response.output_item.done") {
const item = event.item;
// 1) if it's a reasoning item, annotate it
type ReasoningItem = { type?: string; duration_ms?: number };
const maybeReasoning = item as ReasoningItem;
if (maybeReasoning.type === "reasoning") {
maybeReasoning.duration_ms = Date.now() - thinkingStart;
}
if (item.type === "function_call") {
// Track outstanding tool call so we can abort later if needed.
// The item comes from the streaming response, therefore it has
// either `id` (chat) or `call_id` (responses); we normalise
// by reading both.
const callId =
(item as { call_id?: string; id?: string }).call_id ??
(item as { id?: string }).id;
if (callId) {
this.pendingAborts.add(callId);
}
} else {
stageItem(item as ResponseItem);
}
}
if (event.type === "response.completed") {
if (thisGeneration === this.generation && !this.canceled) {
for (const item of event.response.output) {
stageItem(item as ResponseItem);
}
}
if (
event.response.status === "completed" ||
(event.response.status as unknown as string) ===
"requires_action"
) {
// TODO: remove this once we can depend on streaming events
newTurnInput = await this.processEventsWithoutStreaming(
event.response.output,
stageItem,
);
// When we do not use server-side storage we maintain our
// own transcript so that *future* turns still contain full
// conversational context. However, whether we advance to
// another loop iteration should depend solely on the
// presence of *new* input items (i.e. items that were not
// part of the previous request). Resending the transcript
// by itself would create an infinite request loop because
// `turnInput.length` would never reach zero.
if (this.disableResponseStorage) {
// 1) Append the freshly emitted output to our local
// transcript (minus non-message items the model does
// not need to see again).
const cleaned = filterToApiMessages(
event.response.output.map(stripInternalFields),
);
this.transcript.push(...cleaned);
// 2) Determine the *delta* (newTurnInput) that must be
// sent in the next iteration. If there is none we can
// safely terminate the loop; the transcript alone
// does not constitute new information for the
// assistant to act upon.
const delta = filterToApiMessages(
newTurnInput.map(stripInternalFields),
);
if (delta.length === 0) {
// No new input => end conversation.
newTurnInput = [];
} else {
// Resend full transcript *plus* the new delta so the
// stateless backend receives complete context.
newTurnInput = [...this.transcript, ...delta];
// The prefix ends at the current transcript length;
// everything after this index is new for the next
// iteration.
transcriptPrefixLen = this.transcript.length;
}
}
}
lastResponseId = event.response.id;
this.onLastResponseId(event.response.id);
}
}
// Set after we have consumed all stream events in case the stream wasn't
// complete or we missed events for whatever reason. That way, we will set
// the next turn to an empty array to prevent an infinite loop.
// And don't update the turn input too early, otherwise we won't have the
// current turn inputs available for retries.
turnInput = newTurnInput;
// Stream finished successfully; leave the retry loop.
break;
} catch (err: unknown) {
const isRateLimitError = (e: unknown): boolean => {
if (!e || typeof e !== "object") {
return false;
}
// eslint-disable-next-line @typescript-eslint/no-explicit-any
const ex: any = e;
return (
ex.status === 429 ||
ex.code === "rate_limit_exceeded" ||
ex.type === "rate_limit_exceeded"
);
};
if (
isRateLimitError(err) &&
streamRetryAttempt < MAX_STREAM_RETRIES
) {
streamRetryAttempt += 1;
const waitMs =
RATE_LIMIT_RETRY_WAIT_MS * 2 ** (streamRetryAttempt - 1);
log(
`OpenAI stream rate-limited - retry ${streamRetryAttempt}/${MAX_STREAM_RETRIES} in ${waitMs} ms`,
);
// Give the server a breather before retrying.
// eslint-disable-next-line no-await-in-loop
await new Promise((res) => setTimeout(res, waitMs));
// Recreate the stream with the *same* parameters.
let reasoning: Reasoning | undefined;
if (this.model.startsWith("o")) {
reasoning = { effort: "high" };
if (this.model === "o3" || this.model === "o4-mini") {
reasoning.summary = "auto";
}
}
const mergedInstructions = [prefix, this.instructions]
.filter(Boolean)
.join("\n");
const responseCall =
!this.config.provider ||
this.config.provider?.toLowerCase() === "openai"
? (params: ResponseCreateParams) =>
this.oai.responses.create(params)
: (params: ResponseCreateParams) =>
responsesCreateViaChatCompletions(
this.oai,
params as ResponseCreateParams & { stream: true },
);
log(
"agentLoop.run(): responseCall(1): turnInput: " +
JSON.stringify(turnInput),
);
// eslint-disable-next-line no-await-in-loop
stream = await responseCall({
model: this.model,
instructions: mergedInstructions,
input: turnInput,
stream: true,
parallel_tool_calls: false,
reasoning,
...(this.config.flexMode ? { service_tier: "flex" } : {}),
...(this.disableResponseStorage
? { store: false }
: {
store: true,
previous_response_id: lastResponseId || undefined,
}),
tools: [shellTool],
tool_choice: "auto",
});
this.currentStream = stream;
// Continue to outer while to consume new stream.
continue;
}
// Gracefully handle an abort triggered via `cancel()` so that the
// consumer does not see an unhandled exception.
if (err instanceof Error && err.name === "AbortError") {
if (!this.canceled) {
// It was aborted for some other reason; surface the error.
throw err;
}
this.onLoading(false);
return;
}
// Suppress internal stack on JSON parse failures
if (err instanceof SyntaxError) {
this.onItem({
id: `error-${Date.now()}`,
type: "message",
role: "system",
content: [
{
type: "input_text",
text: "⚠️ Failed to parse streaming response (invalid JSON). Please `/clear` to reset.",
},
],
});
this.onLoading(false);
return;
}
// Handle OpenAI API quota errors
if (
err instanceof Error &&
(err as { code?: string }).code === "insufficient_quota"
) {
this.onItem({
id: `error-${Date.now()}`,
type: "message",
role: "system",
content: [
{
type: "input_text",
text: "⚠️ Insufficient quota. Please check your billing details and retry.",
},
],
});
this.onLoading(false);
return;
}
throw err;
} finally {
this.currentStream = null;
}
} // end while retry loop
log(
`Turn inputs (${turnInput.length}) - ${turnInput
.map((i) => i.type)
.join(", ")}`,
);
}
// Flush staged items if the run concluded successfully (i.e. the user did
// not invoke cancel() or terminate() during the turn).
const flush = () => {
if (
!this.canceled &&
!this.hardAbort.signal.aborted &&
thisGeneration === this.generation
) {
// Only emit items that weren't already delivered above
for (const item of staged) {
if (item) {
this.onItem(item);
}
}
}
// At this point the turn finished without the user invoking
// `cancel()`. Any outstanding function calls must therefore have been
// satisfied, so we can safely clear the set that tracks pending aborts
// to avoid emitting duplicate synthetic outputs in subsequent runs.
this.pendingAborts.clear();
// Now emit system messages recording the per-turn *and* cumulative
// thinking times so UIs and tests can surface/verify them.
// const thinkingEnd = Date.now();
// 1) Per-turn measurement: exact time spent between request and
// response for *this* command.
// this.onItem({
// id: `thinking-${thinkingEnd}`,
// type: "message",
// role: "system",
// content: [
// {
// type: "input_text",
// text: `🤔 Thinking time: ${Math.round(
// (thinkingEnd - thinkingStart) / 1000
// )} s`,
// },
// ],
// });
// 2) Session-wide cumulative counter so users can track overall wait
// time across multiple turns.
// this.cumulativeThinkingMs += thinkingEnd - thinkingStart;
// this.onItem({
// id: `thinking-total-${thinkingEnd}`,
// type: "message",
// role: "system",
// content: [
// {
// type: "input_text",
// text: `⏱ Total thinking time: ${Math.round(
// this.cumulativeThinkingMs / 1000
// )} s`,
// },
// ],
// });
this.onLoading(false);
};
// Delay flush slightly to allow a near-simultaneous cancel() to land.
setTimeout(flush, 30);
// End of main logic. The corresponding catch block for the wrapper at the
// start of this method follows next.
} catch (err) {
// Handle known transient network/streaming issues so they do not crash the
// CLI. We currently match Node/undici's `ERR_STREAM_PREMATURE_CLOSE`
// error which manifests when the HTTP/2 stream terminates unexpectedly
// (e.g. during brief network hiccups).
const isPrematureClose =
err instanceof Error &&
// eslint-disable-next-line
((err as any).code === "ERR_STREAM_PREMATURE_CLOSE" ||
err.message?.includes("Premature close"));
if (isPrematureClose) {
try {
this.onItem({
id: `error-${Date.now()}`,
type: "message",
role: "system",
content: [
{
type: "input_text",
text: "⚠️ Connection closed prematurely while waiting for the model. Please try again.",
},
],
});
} catch {
/* no-op - emitting the error message is best-effort */
}
this.onLoading(false);
return;
}
// -------------------------------------------------------------------
// Catch-all handling for other network or server-side issues so that
// transient failures do not crash the CLI. We intentionally keep the
// detection logic conservative to avoid masking programming errors. A
// failure is treated as retry-worthy/user-visible when any of the
// following apply:
// • the error carries a recognised Node.js network errno-style code
// (e.g. ECONNRESET, ETIMEDOUT …)
// • the OpenAI SDK attached an HTTP `status` >= 500 indicating a
// server-side problem.
// • the error is model-specific and detected in the stream.
// If matched we emit a single system message to inform the user and
// resolve gracefully so callers can choose to retry.
// -------------------------------------------------------------------
const NETWORK_ERRNOS = new Set([
"ECONNRESET",
"ECONNREFUSED",
"EPIPE",
"ENOTFOUND",
"ETIMEDOUT",
"EAI_AGAIN",
]);
const isNetworkOrServerError = (() => {
if (!err || typeof err !== "object") {
return false;
}
// eslint-disable-next-line @typescript-eslint/no-explicit-any
const e: any = err;
// Direct instance check for connection errors thrown by the OpenAI SDK.
// eslint-disable-next-line @typescript-eslint/no-explicit-any
const ApiConnErrCtor = (OpenAI as any).APIConnectionError as // eslint-disable-next-line @typescript-eslint/no-explicit-any
| (new (...args: any) => Error)
| undefined;
if (ApiConnErrCtor && e instanceof ApiConnErrCtor) {
return true;
}
if (typeof e.code === "string" && NETWORK_ERRNOS.has(e.code)) {
return true;
}
// When the OpenAI SDK nests the underlying network failure inside the
// `cause` property we surface it as well so callers do not see an
// unhandled exception for errors like ENOTFOUND, ECONNRESET …
if (
e.cause &&
typeof e.cause === "object" &&
NETWORK_ERRNOS.has((e.cause as { code?: string }).code ?? "")
) {
return true;
}
if (typeof e.status === "number" && e.status >= 500) {
return true;
}
// Fallback to a heuristic string match so we still catch future SDK
// variations without enumerating every errno.
if (
typeof e.message === "string" &&
/network|socket|stream/i.test(e.message)
) {
return true;
}
return false;
})();
if (isNetworkOrServerError) {
try {
const msgText =
"⚠️ Network error while contacting OpenAI. Please check your connection and try again.";
this.onItem({
id: `error-${Date.now()}`,
type: "message",
role: "system",
content: [
{
type: "input_text",
text: msgText,
},
],
});
} catch {
/* best-effort */
}
this.onLoading(false);
return;
}
const isInvalidRequestError = () => {
if (!err || typeof err !== "object") {
return false;
}
// eslint-disable-next-line @typescript-eslint/no-explicit-any
const e: any = err;
if (
e.type === "invalid_request_error" &&
e.code === "model_not_found"
) {
return true;
}
if (
e.cause &&
e.cause.type === "invalid_request_error" &&
e.cause.code === "model_not_found"
) {
return true;
}
return false;
};
if (isInvalidRequestError()) {
try {
// Extract request ID and error details from the error object
// eslint-disable-next-line @typescript-eslint/no-explicit-any
const e: any = err;
const reqId =
e.request_id ??
(e.cause && e.cause.request_id) ??
(e.cause && e.cause.requestId);
const errorDetails = [
`Status: ${e.status || (e.cause && e.cause.status) || "unknown"}`,
`Code: ${e.code || (e.cause && e.cause.code) || "unknown"}`,
`Type: ${e.type || (e.cause && e.cause.type) || "unknown"}`,
`Message: ${
e.message || (e.cause && e.cause.message) || "unknown"
}`,
].join(", ");
const msgText = `⚠️ OpenAI rejected the request${
reqId ? ` (request ID: ${reqId})` : ""
}. Error details: ${errorDetails}. Please verify your settings and try again.`;
this.onItem({
id: `error-${Date.now()}`,
type: "message",
role: "system",
content: [
{
type: "input_text",
text: msgText,
},
],
});
} catch {
/* best-effort */
}
this.onLoading(false);
return;
}
// Rethrow all other errors so upstream handlers can decide what to do.
throw err;
}
}
// We need this until we can depend on streaming events.
private async processEventsWithoutStreaming(
output: Array<ResponseInputItem>,
emitItem: (item: ResponseItem) => void,
): Promise<Array<ResponseInputItem>> {
// If the agent has been canceled we should short-circuit immediately to
// avoid any further processing (including potentially expensive tool
// calls). Returning an empty array ensures the main run loop terminates
// promptly.
if (this.canceled) {
return [];
}
const turnInput: Array<ResponseInputItem> = [];
for (const item of output) {
if (item.type === "function_call") {
if (alreadyProcessedResponses.has(item.id)) {
continue;
}
alreadyProcessedResponses.add(item.id);
// eslint-disable-next-line no-await-in-loop
const result = await this.handleFunctionCall(item);
turnInput.push(...result);
}
emitItem(item as ResponseItem);
}
return turnInput;
}
}
const prefix = `You are operating as and within the Codex CLI, a terminal-based agentic coding assistant built by OpenAI. It wraps OpenAI models to enable natural language interaction with a local codebase. You are expected to be precise, safe, and helpful.
You can:
- Receive user prompts, project context, and files.
- Stream responses and emit function calls (e.g., shell commands, code edits).
- Apply patches, run commands, and manage user approvals based on policy.
- Work inside a sandboxed, git-backed workspace with rollback support.
- Log telemetry so sessions can be replayed or inspected later.
- More details on your functionality are available at \`codex --help\`
The Codex CLI is open-sourced. Don't confuse yourself with the old Codex language model built by OpenAI many moons ago (this is understandably top of mind for you!). Within this context, Codex refers to the open-source agentic coding interface.
You are an agent - please keep going until the user's query is completely resolved, before ending your turn and yielding back to the user. Only terminate your turn when you are sure that the problem is solved. If you are not sure about file content or codebase structure pertaining to the user's request, use your tools to read files and gather the relevant information: do NOT guess or make up an answer.
Please resolve the user's task by editing and testing the code files in your current code execution session. You are a deployed coding agent. Your session allows for you to modify and run code. The repo(s) are already cloned in your working directory, and you must fully solve the problem for your answer to be considered correct.
You MUST adhere to the following criteria when executing the task:
- Working on the repo(s) in the current environment is allowed, even if they are proprietary.
- Analyzing code for vulnerabilities is allowed.
- Showing user code and tool call details is allowed.
- User instructions may overwrite the *CODING GUIDELINES* section in this developer message.
- Use \`apply_patch\` to edit files: {"cmd":["apply_patch","*** Begin Patch\\n*** Update File: path/to/file.py\\n@@ def example():\\n- pass\\n+ return 123\\n*** End Patch"]}
- If completing the user's task requires writing or modifying files:
- Your code and final answer should follow these *CODING GUIDELINES*:
- Fix the problem at the root cause rather than applying surface-level patches, when possible.
- Avoid unneeded complexity in your solution.
- Ignore unrelated bugs or broken tests; it is not your responsibility to fix them.
- Update documentation as necessary.
- Keep changes consistent with the style of the existing codebase. Changes should be minimal and focused on the task.
- Use \`git log\` and \`git blame\` to search the history of the codebase if additional context is required; internet access is disabled.
- NEVER add copyright or license headers unless specifically requested.
- You do not need to \`git commit\` your changes; this will be done automatically for you.
- If there is a .pre-commit-config.yaml, use \`pre-commit run --files ...\` to check that your changes pass the pre-commit checks. However, do not fix pre-existing errors on lines you didn't touch.
- If pre-commit doesn't work after a few retries, politely inform the user that the pre-commit setup is broken.
- Once you finish coding, you must
- Check \`git status\` to sanity check your changes; revert any scratch files or changes.
- Remove all inline comments you added as much as possible, even if they look normal. Check using \`git diff\`. Inline comments must be generally avoided, unless active maintainers of the repo, after long careful study of the code and the issue, will still misinterpret the code without the comments.
- Check if you accidentally add copyright or license headers. If so, remove them.
- Try to run pre-commit if it is available.
- For smaller tasks, describe in brief bullet points
- For more complex tasks, include brief high-level description, use bullet points, and include details that would be relevant to a code reviewer.
- If completing the user's task DOES NOT require writing or modifying files (e.g., the user asks a question about the code base):
- Respond in a friendly tone as a remote teammate, who is knowledgeable, capable and eager to help with coding.
- When your task involves writing or modifying files:
- Do NOT tell the user to "save the file" or "copy the code into a file" if you already created or modified the file using \`apply_patch\`. Instead, reference the file as already saved.
- Do NOT show the full contents of large files you have already written, unless the user explicitly asks for them.`;
function filterToApiMessages(
items: Array<ResponseInputItem>,
): Array<ResponseInputItem> {
return items.filter((it) => {
if (it.type === "message" && it.role === "system") {
return false;
}
if (it.type === "reasoning") {
return false;
}
return true;
});
}
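/*
 * Illustrative behaviour of `filterToApiMessages`: given
 *   [
 *     { type: "message", role: "system", ... },
 *     { type: "reasoning", ... },
 *     { type: "message", role: "user", ... },
 *   ]
 * only the user message survives; system messages and reasoning items are
 * never replayed to the API as part of the locally maintained transcript.
 */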