fix(agents): preserve typed-block order and fall through on empty content arrays

briandevans · briandevans · commit 06b26221735b · 2026-04-18T06:44:04.000+01:00
diff --git a/src/agents/openai-transport-stream.test.ts b/src/agents/openai-transport-stream.test.ts
@@ -2156,4 +2156,178 @@ describe("openai transport stream", () => {
     expect(assembledText).toBe("Hello! How can I help?");
     expect(assembledThinking).toBe("Let me reason: step one. Step two.");
   });
+
+  it("preserves typed-block order when delta.content arrays interleave text and thinking", async () => {
+    // Locks in the Codex review concern: a delta.content array shaped
+    // `[{type:"text",…},{type:"thinking",…},{type:"text",…}]` must produce
+    // text → thinking → text blocks in that order, not coalesce into one
+    // thinking block followed by one text block.
+    const model = {
+      id: "mistral-small-latest",
+      name: "Mistral Small Latest",
+      api: "openai-completions",
+      provider: "mistral",
+      baseUrl: "https://api.mistral.ai/v1",
+      reasoning: true,
+      input: ["text"],
+      cost: { input: 0, output: 0, cacheRead: 0, cacheWrite: 0 },
+      contextWindow: 128000,
+      maxTokens: 8192,
+    } satisfies Model<"openai-completions">;
+
+    const output = {
+      role: "assistant" as const,
+      content: [],
+      api: model.api,
+      provider: model.provider,
+      model: model.id,
+      usage: {
+        input: 0,
+        output: 0,
+        cacheRead: 0,
+        cacheWrite: 0,
+        totalTokens: 0,
+        cost: { input: 0, output: 0, cacheRead: 0, cacheWrite: 0, total: 0 },
+      },
+      stopReason: "stop",
+      timestamp: Date.now(),
+    };
+
+    const stream: { push(event: unknown): void } = { push() {} };
+
+    const mockChunks = [
+      {
+        id: "chatcmpl-mistral-order",
+        object: "chat.completion.chunk" as const,
+        choices: [
+          {
+            index: 0,
+            delta: {
+              content: [
+                { type: "text", text: "intro." },
+                { type: "thinking", thinking: "thought." },
+                { type: "text", text: "outro." },
+              ],
+            } as unknown,
+            logprobs: null,
+            finish_reason: null,
+          },
+        ],
+      },
+      {
+        id: "chatcmpl-mistral-order",
+        object: "chat.completion.chunk" as const,
+        choices: [{ index: 0, delta: {}, logprobs: null, finish_reason: "stop" }],
+      },
+    ] as const;
+
+    async function* mockStream() {
+      for (const chunk of mockChunks) {
+        yield chunk as never;
+      }
+    }
+
+    await __testing.processOpenAICompletionsStream(mockStream(), output, model, stream);
+
+    expect(output.content.map((block) => (block as { type: string }).type)).toEqual([
+      "text",
+      "thinking",
+      "text",
+    ]);
+    expect((output.content[0] as { text: string }).text).toBe("intro.");
+    expect((output.content[1] as { thinking: string }).thinking).toBe("thought.");
+    expect((output.content[2] as { text: string }).text).toBe("outro.");
+  });
+
+  it("falls through to reasoning_content when delta.content array yields no supported blocks", async () => {
+    // Locks in the Copilot review concern: an empty array (or an array of only
+    // unsupported block types) must NOT swallow the chunk via an unconditional
+    // `continue`. reasoning_content / tool_calls in the same chunk should still
+    // be processed.
+    const model = {
+      id: "mistral-small-latest",
+      name: "Mistral Small Latest",
+      api: "openai-completions",
+      provider: "mistral",
+      baseUrl: "https://api.mistral.ai/v1",
+      reasoning: true,
+      input: ["text"],
+      cost: { input: 0, output: 0, cacheRead: 0, cacheWrite: 0 },
+      contextWindow: 128000,
+      maxTokens: 8192,
+    } satisfies Model<"openai-completions">;
+
+    const output = {
+      role: "assistant" as const,
+      content: [],
+      api: model.api,
+      provider: model.provider,
+      model: model.id,
+      usage: {
+        input: 0,
+        output: 0,
+        cacheRead: 0,
+        cacheWrite: 0,
+        totalTokens: 0,
+        cost: { input: 0, output: 0, cacheRead: 0, cacheWrite: 0, total: 0 },
+      },
+      stopReason: "stop",
+      timestamp: Date.now(),
+    };
+
+    const stream: { push(event: unknown): void } = { push() {} };
+
+    const mockChunks = [
+      {
+        id: "chatcmpl-mistral-fallthrough",
+        object: "chat.completion.chunk" as const,
+        choices: [
+          {
+            index: 0,
+            delta: {
+              content: [{ type: "unknown_block_type", payload: 1 }],
+              reasoning_content: "fallback reasoning",
+            } as Record<string, unknown>,
+            logprobs: null,
+            finish_reason: null,
+          },
+        ],
+      },
+      {
+        id: "chatcmpl-mistral-fallthrough",
+        object: "chat.completion.chunk" as const,
+        choices: [
+          {
+            index: 0,
+            delta: { content: "answer." } as Record<string, unknown>,
+            logprobs: null,
+            finish_reason: null,
+          },
+        ],
+      },
+      {
+        id: "chatcmpl-mistral-fallthrough",
+        object: "chat.completion.chunk" as const,
+        choices: [{ index: 0, delta: {}, logprobs: null, finish_reason: "stop" }],
+      },
+    ] as const;
+
+    async function* mockStream() {
+      for (const chunk of mockChunks) {
+        yield chunk as never;
+      }
+    }
+
+    await __testing.processOpenAICompletionsStream(mockStream(), output, model, stream);
+
+    const thinkingBlock = output.content.find(
+      (block) => (block as { type: string }).type === "thinking",
+    ) as { thinking: string } | undefined;
+    const textBlock = output.content.find(
+      (block) => (block as { type: string }).type === "text",
+    ) as { text: string } | undefined;
+
+    expect(thinkingBlock?.thinking).toBe("fallback reasoning");
+    expect(textBlock?.text).toBe("answer.");
+  });
 });
diff --git a/src/agents/openai-transport-stream.ts b/src/agents/openai-transport-stream.ts
@@ -1124,48 +1124,52 @@ async function processOpenAICompletionsStream(
       // (`[{type:"thinking", thinking:"..."}, {type:"text", text:"..."}]`)
       // instead of a string. JS string concatenation on the array (`"" + arr`)
       // produced literal `"[object Object]"` tokens in the assembled text and a
-      // matching corrupted `text_delta` event. Unpack typed blocks into text +
-      // reasoning deltas, route reasoning blocks through the existing thinking
-      // append path, and only emit a text delta if real text content arrives.
-      // Plain string content keeps the original fast path.
+      // matching corrupted `text_delta` event. Walk the typed blocks in order
+      // and route each one through the existing text / thinking append paths
+      // so transcript block chronology and stream event order match the
+      // provider's original ordering. Plain string content keeps the original
+      // fast path. Unrecognized shapes (non-array values, empty arrays, and
+      // arrays whose blocks are all unsupported) fall through so reasoning_*
+      // and tool_calls in the same chunk are still processed.
       const unpacked = unpackOpenAICompletionsContent(choice.delta.content);
-      if (unpacked.thinkingDelta.length > 0) {
-        const reasoningDelta = {
-          signature: "content_thinking",
-          text: unpacked.thinkingDelta,
-        };
-        if (currentBlock?.type === "toolCall") {
-          if (!pendingThinkingDelta) {
-            pendingThinkingDelta = { ...reasoningDelta };
+      for (const delta of unpacked.deltas) {
+        if (delta.kind === "thinking") {
+          const reasoningDelta = {
+            signature: "content_thinking",
+            text: delta.value,
+          };
+          if (currentBlock?.type === "toolCall") {
+            if (!pendingThinkingDelta) {
+              pendingThinkingDelta = { ...reasoningDelta };
+            } else {
+              pendingThinkingDelta.text += reasoningDelta.text;
+            }
           } else {
-            pendingThinkingDelta.text += reasoningDelta.text;
+            appendThinkingDelta(reasoningDelta);
           }
-        } else {
-          appendThinkingDelta(reasoningDelta);
+          continue;
         }
-      }
-      if (unpacked.textDelta.length > 0) {
         flushPendingThinkingDelta();
         if (!currentBlock || currentBlock.type !== "text") {
           finishCurrentBlock();
           currentBlock = { type: "text", text: "" };
           output.content.push(currentBlock);
           stream.push({ type: "text_start", contentIndex: blockIndex(), partial: output });
         }
-        currentBlock.text += unpacked.textDelta;
+        currentBlock.text += delta.value;
         stream.push({
           type: "text_delta",
           contentIndex: blockIndex(),
-          delta: unpacked.textDelta,
+          delta: delta.value,
           partial: output,
         });
       }
       if (unpacked.recognized) {
         continue;
       }
-      // Unrecognized truthy non-string shape: fall through to the reasoning /
-      // tool_calls branches below rather than coercing the value into the
-      // assembled text.
+      // Unrecognized truthy non-string / no-supported-block shape: fall through
+      // to the reasoning / tool_calls branches below rather than coercing the
+      // value into the assembled text.
     }
     const reasoningDelta = getCompletionsReasoningDelta(choice.delta as Record<string, unknown>);
     if (reasoningDelta) {
@@ -1233,53 +1237,73 @@ async function processOpenAICompletionsStream(
 //     (e.g. `[{type:"thinking", thinking:"..."}, {type:"text", text:"..."}]`,
 //     observed for Mistral with reasoning enabled where reasoning content
 //     arrives inside `delta.content` instead of a top-level reasoning field).
-// `recognized` is true for both the string fast path and the typed-block array
-// shape. When false (e.g. a plain object or unexpected primitive), the caller
-// falls through to the reasoning/tool_calls branches instead of coercing the
-// value into assembled text.
+// Deltas are returned in the original block order (not coalesced by type) so a
+// `[{type:"text",…},{type:"thinking",…}]` array does not silently flip into
+// thinking-then-text on the consumer side.
+// `recognized` is true for the string fast path and for arrays containing at
+// least one supported typed block, even one with empty text. Empty arrays or
+// arrays of only unsupported shapes return `recognized: false` so reasoning_*
+// and tool_calls fields in the same chunk are still processed by the caller.
+type OpenAICompletionsContentDelta =
+  | { kind: "text"; value: string }
+  | { kind: "thinking"; value: string };
+
 function unpackOpenAICompletionsContent(rawContent: unknown): {
-  textDelta: string;
-  thinkingDelta: string;
+  deltas: OpenAICompletionsContentDelta[];
   recognized: boolean;
 } {
   if (typeof rawContent === "string") {
-    return { textDelta: rawContent, thinkingDelta: "", recognized: true };
+    return {
+      deltas: rawContent.length > 0 ? [{ kind: "text", value: rawContent }] : [],
+      recognized: true,
+    };
   }
   if (!Array.isArray(rawContent)) {
-    return { textDelta: "", thinkingDelta: "", recognized: false };
+    return { deltas: [], recognized: false };
   }
-  let textDelta = "";
-  let thinkingDelta = "";
+  const deltas: OpenAICompletionsContentDelta[] = [];
+  let sawSupportedBlock = false;
   for (const part of rawContent) {
     if (!part || typeof part !== "object") {
       continue;
     }
     const block = part as { type?: unknown; text?: unknown; thinking?: unknown };
     if (block.type === "text" && typeof block.text === "string") {
-      textDelta += block.text;
+      sawSupportedBlock = true;
+      if (block.text.length > 0) {
+        deltas.push({ kind: "text", value: block.text });
+      }
       continue;
     }
     if (block.type === "thinking") {
       // Mistral reasoning blocks observed in two shapes: `.thinking` as a
       // string, or `.thinking` as a nested array of `{type:"text", text}` parts.
       if (typeof block.thinking === "string") {
-        thinkingDelta += block.thinking;
+        sawSupportedBlock = true;
+        if (block.thinking.length > 0) {
+          deltas.push({ kind: "thinking", value: block.thinking });
+        }
         continue;
       }
       if (Array.isArray(block.thinking)) {
+        let thinkingValue = "";
         for (const sub of block.thinking) {
           if (!sub || typeof sub !== "object") {
             continue;
           }
-          const subText = (sub as { text?: unknown }).text;
-          if (typeof subText === "string") {
-            thinkingDelta += subText;
+          const subBlock = sub as { type?: unknown; text?: unknown };
+          if (subBlock.type === "text" && typeof subBlock.text === "string") {
+            thinkingValue += subBlock.text;
           }
         }
+        sawSupportedBlock = true;
+        if (thinkingValue.length > 0) {
+          deltas.push({ kind: "thinking", value: thinkingValue });
+        }
       }
     }
   }
-  return { textDelta, thinkingDelta, recognized: true };
+  return { deltas, recognized: sawSupportedBlock };
 }
 
 function getCompletionsReasoningDelta(delta: Record<string, unknown>): {