From ad5b3e03652ff7961aa9efd413981f0300fabada Mon Sep 17 00:00:00 2001 From: Soeren Magnus Olesen Date: Sun, 15 Mar 2026 16:46:03 +0100 Subject: [PATCH 01/11] feat: endpoint-aware GitHub Copilot model creation The Copilot branch in providerModelFactory always used provider.chatModel(), which caused models like gpt-5.4 to fail with 'model is not accessible via the /chat/completions endpoint'. Changes: - Add getSupportedEndpoints() and getSupportedEndpointsResolved() helpers in modelCapabilities.ts that resolve supported_endpoints from existing static metadata (models.json + models-extra.ts), following the same lookup-key and merge strategy as getModelCapabilities(). - Update the Copilot branch in providerModelFactory.ts to check endpoint metadata and use createOpenAI().responses() when /v1/responses is supported, falling back to createOpenAICompatible().chatModel() for chat-only or unknown models. - Add supported_endpoints metadata for gpt-5.4 in models-extra.ts. - Keep provider name as 'github-copilot' when using createOpenAI so the SDK reads provider options from the correct namespace. - Add focused tests for endpoint resolution in modelCapabilities.test.ts and endpoint-aware model creation in providerModelFactory.test.ts. 
--- src/common/utils/ai/modelCapabilities.test.ts | 64 ++++++++++++- src/common/utils/ai/modelCapabilities.ts | 55 +++++++++++ src/common/utils/tokens/models-extra.ts | 1 + .../services/providerModelFactory.test.ts | 91 +++++++++++++++++++ src/node/services/providerModelFactory.ts | 31 ++++++- 5 files changed, 239 insertions(+), 3 deletions(-) diff --git a/src/common/utils/ai/modelCapabilities.test.ts b/src/common/utils/ai/modelCapabilities.test.ts index a902801b38..683d3f064e 100644 --- a/src/common/utils/ai/modelCapabilities.test.ts +++ b/src/common/utils/ai/modelCapabilities.test.ts @@ -1,5 +1,10 @@ import { describe, expect, it } from "bun:test"; -import { getModelCapabilities, getSupportedInputMediaTypes } from "./modelCapabilities"; +import { + getModelCapabilities, + getSupportedEndpoints, + getSupportedEndpointsResolved, + getSupportedInputMediaTypes, +} from "./modelCapabilities"; describe("getModelCapabilities", () => { it("returns capabilities for known models", () => { @@ -66,3 +71,60 @@ describe("getSupportedInputMediaTypes", () => { expect(supported?.has("pdf")).toBe(true); }); }); + +describe("getSupportedEndpoints", () => { + it("returns endpoints for a responses-only model", () => { + // gpt-5.4-pro in models-extra has supported_endpoints: ["/v1/responses"] + const endpoints = getSupportedEndpoints("openai:gpt-5.4-pro"); + expect(endpoints).toEqual(["/v1/responses"]); + }); + + it("returns endpoints for a chat-only Copilot model", () => { + // github_copilot/claude-sonnet-4 in models.json has supported_endpoints: ["/v1/chat/completions"] + const endpoints = getSupportedEndpoints("github-copilot:claude-sonnet-4"); + expect(endpoints).toEqual(["/v1/chat/completions"]); + }); + + it("returns both endpoints for a model supporting chat and responses", () => { + // gpt-5.4 in models-extra has supported_endpoints: ["/v1/chat/completions", "/v1/responses"] + const endpoints = getSupportedEndpoints("openai:gpt-5.4"); + 
expect(endpoints).toContain("/v1/chat/completions"); + expect(endpoints).toContain("/v1/responses"); + }); + + it("returns endpoints for Copilot model using provider alias lookup", () => { + // github_copilot/gpt-5.2 in models.json has both endpoints + const endpoints = getSupportedEndpoints("github-copilot:gpt-5.2"); + expect(endpoints).toContain("/v1/chat/completions"); + expect(endpoints).toContain("/v1/responses"); + }); + + it("returns null when model metadata exists but has no endpoint info", () => { + // claude-opus-4-5 in models-extra has no supported_endpoints + const endpoints = getSupportedEndpoints("anthropic:claude-opus-4-5"); + expect(endpoints).toBeNull(); + }); + + it("returns null for completely unknown models", () => { + expect(getSupportedEndpoints("unknown:does-not-exist")).toBeNull(); + }); +}); + +describe("getSupportedEndpointsResolved", () => { + it("resolves Copilot model with provider-scoped metadata", () => { + // github_copilot/gpt-5.1-codex-max in models.json has supported_endpoints: ["/v1/responses"] + const endpoints = getSupportedEndpointsResolved("github-copilot:gpt-5.1-codex-max", null); + expect(endpoints).toEqual(["/v1/responses"]); + }); + + it("falls back to bare model name when provider-scoped entry is missing", () => { + // github_copilot/gpt-5.4 does NOT exist in models.json, but + // bare "gpt-5.4" in models-extra has supported_endpoints. 
+ const endpoints = getSupportedEndpointsResolved("github-copilot:gpt-5.4", null); + expect(endpoints).toContain("/v1/responses"); + }); + + it("returns null for unknown model without any metadata", () => { + expect(getSupportedEndpointsResolved("github-copilot:totally-fake-model", null)).toBeNull(); + }); +}); diff --git a/src/common/utils/ai/modelCapabilities.ts b/src/common/utils/ai/modelCapabilities.ts index 952d840050..ee616dc2e5 100644 --- a/src/common/utils/ai/modelCapabilities.ts +++ b/src/common/utils/ai/modelCapabilities.ts @@ -11,6 +11,7 @@ interface RawModelCapabilitiesData { supports_video_input?: boolean; max_pdf_size_mb?: number; litellm_provider?: string; + supported_endpoints?: string[]; [key: string]: unknown; } @@ -127,3 +128,57 @@ export function getSupportedInputMediaTypes( if (caps.supportsVideoInput) result.add("video"); return result; } + +/** + * Resolve supported API endpoints for a model string from static metadata. + * + * Returns the `supported_endpoints` array (e.g. `["/v1/responses"]`) when + * found in models-extra or models.json, or `null` when no metadata exists. + * Follows the same lookup-key + merge strategy as `getModelCapabilities`. + */ +export function getSupportedEndpoints(modelString: string): string[] | null { + const normalized = normalizeToCanonical(modelString); + const lookupKeys = generateLookupKeys(normalized); + + const modelsExtraRecord = modelsExtra as unknown as Record; + const modelsDataRecord = modelsData as unknown as Record; + + for (const key of lookupKeys) { + const base = modelsDataRecord[key]; + const extra = modelsExtraRecord[key]; + + if (base || extra) { + // Extra wins for the same field; merge so we don't lose base-only endpoints. + const merged: RawModelCapabilitiesData = { ...(base ?? {}), ...(extra ?? {}) }; + return merged.supported_endpoints ?? null; + } + } + + return null; +} + +/** + * Like `getSupportedEndpoints`, but first resolves config aliases + * (e.g. 
`mappedToModel`) so gateway-scoped model IDs inherit metadata + * from the underlying model when the gateway-scoped key has no entry. + */ +export function getSupportedEndpointsResolved( + modelString: string, + providersConfig: ProvidersConfigMap | null +): string[] | null { + // Try the raw (possibly gateway-scoped) key first so provider-specific + // endpoint overrides (e.g. `github_copilot/gpt-5.4`) take priority. + const direct = getSupportedEndpoints(modelString); + if (direct != null) { + return direct; + } + + // Fall back to the metadata-resolved alias (e.g. mappedToModel) so + // models without a provider-scoped entry inherit from the bare model. + const metadataModel = resolveModelForMetadata(modelString, providersConfig); + if (metadataModel !== modelString) { + return getSupportedEndpoints(metadataModel); + } + + return null; +} diff --git a/src/common/utils/tokens/models-extra.ts b/src/common/utils/tokens/models-extra.ts index 9c417abc2c..9177977233 100644 --- a/src/common/utils/tokens/models-extra.ts +++ b/src/common/utils/tokens/models-extra.ts @@ -113,6 +113,7 @@ export const modelsExtra: Record = { supports_vision: true, supports_reasoning: true, supports_response_schema: true, + supported_endpoints: ["/v1/chat/completions", "/v1/responses"], knowledge_cutoff: "2025-08-31", }, diff --git a/src/node/services/providerModelFactory.test.ts b/src/node/services/providerModelFactory.test.ts index 06dc98525a..f33e240031 100644 --- a/src/node/services/providerModelFactory.test.ts +++ b/src/node/services/providerModelFactory.test.ts @@ -451,6 +451,97 @@ describe("ProviderModelFactory routing", () => { }); }); +describe("ProviderModelFactory Copilot endpoint selection", () => { + it("uses responses endpoint for a Copilot model with /v1/responses support", async () => { + await withTempConfig(async (config, factory) => { + config.saveProvidersConfig({ + "github-copilot": { + apiKey: "ghu_test", + }, + }); + + // gpt-5.2 has Copilot-scoped metadata with both 
/v1/chat/completions and /v1/responses + const result = await factory.createModel("github-copilot:gpt-5.2"); + expect(result.success).toBe(true); + if (!result.success) return; + + // When responses endpoint is supported, model provider should include "responses" + expect(result.data.provider).toContain("responses"); + }); + }); + + it("uses responses endpoint for a responses-only Copilot model", async () => { + await withTempConfig(async (config, factory) => { + config.saveProvidersConfig({ + "github-copilot": { + apiKey: "ghu_test", + }, + }); + + // gpt-5.1-codex-max in models.json has supported_endpoints: ["/v1/responses"] only + const result = await factory.createModel("github-copilot:gpt-5.1-codex-max"); + expect(result.success).toBe(true); + if (!result.success) return; + + expect(result.data.provider).toContain("responses"); + }); + }); + + it("uses chat endpoint for a chat-only Copilot model", async () => { + await withTempConfig(async (config, factory) => { + config.saveProvidersConfig({ + "github-copilot": { + apiKey: "ghu_test", + }, + }); + + // claude-sonnet-4 in models.json has supported_endpoints: ["/v1/chat/completions"] + const result = await factory.createModel("github-copilot:claude-sonnet-4"); + expect(result.success).toBe(true); + if (!result.success) return; + + expect(result.data.provider).toContain("chat"); + expect(result.data.provider).not.toContain("responses"); + }); + }); + + it("falls back to chat endpoint when endpoint metadata is absent", async () => { + await withTempConfig(async (config, factory) => { + config.saveProvidersConfig({ + "github-copilot": { + apiKey: "ghu_test", + }, + }); + + // gpt-4o has no supported_endpoints in either copilot-scoped or bare metadata + const result = await factory.createModel("github-copilot:gpt-4o"); + expect(result.success).toBe(true); + if (!result.success) return; + + expect(result.data.provider).toContain("chat"); + expect(result.data.provider).not.toContain("responses"); + }); + }); + + 
it("inherits bare-model endpoint metadata when provider-scoped entry is missing", async () => { + await withTempConfig(async (config, factory) => { + config.saveProvidersConfig({ + "github-copilot": { + apiKey: "ghu_test", + }, + }); + + // github_copilot/gpt-5.4 does NOT exist in models.json, + // but bare "gpt-5.4" in models-extra has supported_endpoints with /v1/responses. + const result = await factory.createModel("github-copilot:gpt-5.4"); + expect(result.success).toBe(true); + if (!result.success) return; + + expect(result.data.provider).toContain("responses"); + }); + }); +}); + describe("classifyCopilotInitiator", () => { it("returns 'user' when last message role is user", () => { const body = JSON.stringify({ messages: [{ role: "user", content: "hello" }] }); diff --git a/src/node/services/providerModelFactory.ts b/src/node/services/providerModelFactory.ts index acd1d9961f..c80ef9fff4 100644 --- a/src/node/services/providerModelFactory.ts +++ b/src/node/services/providerModelFactory.ts @@ -34,6 +34,7 @@ import { normalizeToCanonical, } from "@/common/utils/ai/models"; import type { AnthropicCacheTtl } from "@/common/utils/ai/cacheStrategy"; +import { getSupportedEndpointsResolved } from "@/common/utils/ai/modelCapabilities"; import { MUX_APP_ATTRIBUTION_TITLE, MUX_APP_ATTRIBUTION_URL } from "@/constants/appAttribution"; import { resolveProviderCredentials } from "@/node/utils/providerRequirements"; import { @@ -1488,8 +1489,6 @@ export class ProviderModelFactory { return Err({ type: "api_key_not_found", provider: providerName }); } - const { createOpenAICompatible } = await PROVIDER_REGISTRY["github-copilot"](); - const baseFetch = getProviderFetch(providerConfig); const copilotFetchFn = async ( input: Parameters[0], @@ -1528,6 +1527,34 @@ export class ProviderModelFactory { const providerFetch = copilotFetch; const baseURL = providerConfig.baseURL ?? "https://api.githubcopilot.com"; + + // Determine whether the Copilot model supports the Responses API. 
+ // Check provider-scoped metadata first (github_copilot/model), then fall + // back to bare-model metadata via alias resolution. Conservative default: + // use chat/completions when no endpoint metadata exists. + const fullCopilotModelId = `github-copilot:${modelId}`; + const endpoints = getSupportedEndpointsResolved(fullCopilotModelId, null); + const supportsResponses = endpoints?.includes("/v1/responses") ?? false; + // Prefer responses when available; fall back to chat (current behavior) + // when only chat is supported or endpoint metadata is absent entirely. + const useCopilotResponses = supportsResponses; + + if (useCopilotResponses) { + // Use the full OpenAI SDK provider which supports .responses() — + // createOpenAICompatible only exposes .chatModel(). + // Keep provider name as "github-copilot" so the SDK reads provider + // options from the correct namespace (matching buildProviderOptions output). + const { createOpenAI } = await PROVIDER_REGISTRY.openai(); + const provider = createOpenAI({ + name: "github-copilot", + baseURL, + apiKey: "copilot", // placeholder — actual auth via custom fetch + fetch: providerFetch, + }); + return Ok(provider.responses(modelId)); + } + + const { createOpenAICompatible } = await PROVIDER_REGISTRY["github-copilot"](); const provider = createOpenAICompatible({ name: "github-copilot", baseURL, From 24095861fd70f0a80165c9b003c3efed02a32e7f Mon Sep 17 00:00:00 2001 From: Soeren Magnus Olesen Date: Sun, 15 Mar 2026 16:48:29 +0100 Subject: [PATCH 02/11] fix: narrow LanguageModel union type in Copilot endpoint tests The LanguageModel type is a union including string literals, so accessing .provider requires narrowing. Use a helper function with a type assertion in tests to extract the provider identifier. 
--- .../services/providerModelFactory.test.ts | 21 ++++++++++++------- 1 file changed, 14 insertions(+), 7 deletions(-) diff --git a/src/node/services/providerModelFactory.test.ts b/src/node/services/providerModelFactory.test.ts index f33e240031..216d0c0fed 100644 --- a/src/node/services/providerModelFactory.test.ts +++ b/src/node/services/providerModelFactory.test.ts @@ -452,6 +452,13 @@ describe("ProviderModelFactory routing", () => { }); describe("ProviderModelFactory Copilot endpoint selection", () => { + // Helper: extract the SDK provider identifier from a LanguageModel. + // At runtime createModel always returns an object model (LanguageModelV3), + // but the TS union type includes string literals so we narrow here. + function getModelProvider(model: unknown): string { + return (model as { provider: string }).provider; + } + it("uses responses endpoint for a Copilot model with /v1/responses support", async () => { await withTempConfig(async (config, factory) => { config.saveProvidersConfig({ @@ -466,7 +473,7 @@ describe("ProviderModelFactory Copilot endpoint selection", () => { if (!result.success) return; // When responses endpoint is supported, model provider should include "responses" - expect(result.data.provider).toContain("responses"); + expect(getModelProvider(result.data)).toContain("responses"); }); }); @@ -483,7 +490,7 @@ describe("ProviderModelFactory Copilot endpoint selection", () => { expect(result.success).toBe(true); if (!result.success) return; - expect(result.data.provider).toContain("responses"); + expect(getModelProvider(result.data)).toContain("responses"); }); }); @@ -500,8 +507,8 @@ describe("ProviderModelFactory Copilot endpoint selection", () => { expect(result.success).toBe(true); if (!result.success) return; - expect(result.data.provider).toContain("chat"); - expect(result.data.provider).not.toContain("responses"); + expect(getModelProvider(result.data)).toContain("chat"); + 
expect(getModelProvider(result.data)).not.toContain("responses"); }); }); @@ -518,8 +525,8 @@ describe("ProviderModelFactory Copilot endpoint selection", () => { expect(result.success).toBe(true); if (!result.success) return; - expect(result.data.provider).toContain("chat"); - expect(result.data.provider).not.toContain("responses"); + expect(getModelProvider(result.data)).toContain("chat"); + expect(getModelProvider(result.data)).not.toContain("responses"); }); }); @@ -537,7 +544,7 @@ describe("ProviderModelFactory Copilot endpoint selection", () => { expect(result.success).toBe(true); if (!result.success) return; - expect(result.data.provider).toContain("responses"); + expect(getModelProvider(result.data)).toContain("responses"); }); }); }); From 5ad04459e15c3b775d9f0123b6208d3855d2471c Mon Sep 17 00:00:00 2001 From: Soeren Magnus Olesen Date: Sun, 15 Mar 2026 16:55:50 +0100 Subject: [PATCH 03/11] fix(modelCapabilities): prefer provider-scoped keys over bare model in lookup generateLookupKeys() previously placed the bare model name first in the lookup array, so provider-specific metadata (e.g. github_copilot/gpt-5.2 omitting /v1/batch) was shadowed by the generic bare-model entry that includes /v1/batch. Reorder so provider-scoped keys are checked first when a provider prefix is present, with bare model name as the last-resort fallback. 
Add tests proving: - Provider-scoped endpoints win over bare model (no /v1/batch leak) - Bare model fallback still works when provider-scoped entry is absent - Both getSupportedEndpoints and getSupportedEndpointsResolved tested --- src/common/utils/ai/modelCapabilities.test.ts | 20 +++++++++++++++++++ src/common/utils/ai/modelCapabilities.ts | 10 +++++++--- 2 files changed, 27 insertions(+), 3 deletions(-) diff --git a/src/common/utils/ai/modelCapabilities.test.ts b/src/common/utils/ai/modelCapabilities.test.ts index 683d3f064e..165346813a 100644 --- a/src/common/utils/ai/modelCapabilities.test.ts +++ b/src/common/utils/ai/modelCapabilities.test.ts @@ -99,6 +99,17 @@ describe("getSupportedEndpoints", () => { expect(endpoints).toContain("/v1/responses"); }); + it("prefers provider-scoped endpoints over bare model endpoints", () => { + // bare "gpt-5.2" includes /v1/batch, but github_copilot/gpt-5.2 does not. + // The provider-scoped entry should win when queried with a provider prefix. + const endpoints = getSupportedEndpoints("github-copilot:gpt-5.2"); + expect(endpoints).not.toContain("/v1/batch"); + + // Sanity: the bare model does include /v1/batch + const bareEndpoints = getSupportedEndpoints("gpt-5.2"); + expect(bareEndpoints).toContain("/v1/batch"); + }); + it("returns null when model metadata exists but has no endpoint info", () => { // claude-opus-4-5 in models-extra has no supported_endpoints const endpoints = getSupportedEndpoints("anthropic:claude-opus-4-5"); @@ -117,6 +128,15 @@ describe("getSupportedEndpointsResolved", () => { expect(endpoints).toEqual(["/v1/responses"]); }); + it("prefers provider-scoped endpoints over bare model in resolved path", () => { + // github_copilot/gpt-5.2 restricts to chat+responses (no /v1/batch), + // while bare gpt-5.2 includes /v1/batch. Provider-scoped must win. 
+ const endpoints = getSupportedEndpointsResolved("github-copilot:gpt-5.2", null); + expect(endpoints).toContain("/v1/chat/completions"); + expect(endpoints).toContain("/v1/responses"); + expect(endpoints).not.toContain("/v1/batch"); + }); + it("falls back to bare model name when provider-scoped entry is missing", () => { // github_copilot/gpt-5.4 does NOT exist in models.json, but // bare "gpt-5.4" in models-extra has supported_endpoints. diff --git a/src/common/utils/ai/modelCapabilities.ts b/src/common/utils/ai/modelCapabilities.ts index ee616dc2e5..0232619f6b 100644 --- a/src/common/utils/ai/modelCapabilities.ts +++ b/src/common/utils/ai/modelCapabilities.ts @@ -42,11 +42,12 @@ function generateLookupKeys(modelString: string): string[] { const modelName = colonIndex !== -1 ? modelString.slice(colonIndex + 1) : modelString; const litellmProvider = PROVIDER_KEY_ALIASES[provider] ?? provider; - const keys: string[] = [ - modelName, // Direct model name (e.g., "claude-opus-4-5") - ]; + const keys: string[] = []; if (provider) { + // Provider-scoped keys first so provider-specific metadata (e.g. + // `github_copilot/gpt-5.2` restricting `/v1/batch`) wins over the + // generic bare-model entry. keys.push( `${litellmProvider}/${modelName}`, // "ollama/gpt-oss:20b" `${litellmProvider}/${modelName}-cloud` // "ollama/gpt-oss:20b-cloud" (LiteLLM convention) @@ -60,6 +61,9 @@ function generateLookupKeys(modelString: string): string[] { } } + // Bare model name is the last-resort fallback. + keys.push(modelName); + return keys; } From 62e88f116b5d23a8b03934a040628123539f12a5 Mon Sep 17 00:00:00 2001 From: Soeren Magnus Olesen Date: Sun, 15 Mar 2026 17:02:27 +0100 Subject: [PATCH 04/11] fix: pass providersConfig to Copilot endpoint resolution The github-copilot branch in providerModelFactory called getSupportedEndpointsResolved(fullCopilotModelId, null), skipping the config-aware alias path (mappedToModel) that the helper was designed to support. 
The in-scope providersConfig was already loaded earlier in the method. - Pass providersConfig instead of null so Copilot endpoint resolution can follow mappedToModel aliases in the providers config. - Widen the parameter type of getSupportedEndpointsResolved and its helper chain (resolveModelForMetadata, getModelContextWindowOverride, getModelCapabilitiesResolved) from ProvidersConfigMap to a minimal ProvidersConfigWithModels interface. Both the raw disk config and the API-facing map satisfy this, eliminating the need for callers to convert between config shapes. - Add two focused tests proving config-based alias resolution works for endpoint selection and that null config returns null for the same unknown model. --- src/common/utils/ai/modelCapabilities.test.ts | 17 ++++++++++++++++ src/common/utils/ai/modelCapabilities.ts | 6 +++--- src/common/utils/providers/modelEntries.ts | 20 ++++++++++++++----- src/node/services/providerModelFactory.ts | 2 +- 4 files changed, 36 insertions(+), 9 deletions(-) diff --git a/src/common/utils/ai/modelCapabilities.test.ts b/src/common/utils/ai/modelCapabilities.test.ts index 165346813a..2eb3c92e3a 100644 --- a/src/common/utils/ai/modelCapabilities.test.ts +++ b/src/common/utils/ai/modelCapabilities.test.ts @@ -144,6 +144,23 @@ describe("getSupportedEndpointsResolved", () => { expect(endpoints).toContain("/v1/responses"); }); + it("resolves endpoints via config-based mappedToModel alias", () => { + // "custom-copilot-alias" has no provider-scoped or bare-model metadata, + // but the providers config maps it to gpt-5.4 which has known endpoints. 
+ const config = { + "github-copilot": { + models: [{ id: "custom-copilot-alias", mappedToModel: "gpt-5.4" }], + }, + }; + const endpoints = getSupportedEndpointsResolved("github-copilot:custom-copilot-alias", config); + expect(endpoints).toContain("/v1/responses"); + }); + + it("returns null for unknown model when config has no mapping", () => { + // Without config, the same unknown model returns null. + expect(getSupportedEndpointsResolved("github-copilot:custom-copilot-alias", null)).toBeNull(); + }); + it("returns null for unknown model without any metadata", () => { expect(getSupportedEndpointsResolved("github-copilot:totally-fake-model", null)).toBeNull(); }); diff --git a/src/common/utils/ai/modelCapabilities.ts b/src/common/utils/ai/modelCapabilities.ts index 0232619f6b..24e9bcb11d 100644 --- a/src/common/utils/ai/modelCapabilities.ts +++ b/src/common/utils/ai/modelCapabilities.ts @@ -1,4 +1,4 @@ -import type { ProvidersConfigMap } from "@/common/orpc/types"; +import type { ProvidersConfigWithModels } from "@/common/utils/providers/modelEntries"; import { resolveModelForMetadata } from "@/common/utils/providers/modelEntries"; import modelsData from "../tokens/models.json"; import { modelsExtra } from "../tokens/models-extra"; @@ -113,7 +113,7 @@ export function getModelCapabilities(modelString: string): ModelCapabilities | n export function getModelCapabilitiesResolved( modelString: string, - providersConfig: ProvidersConfigMap | null + providersConfig: ProvidersConfigWithModels | null ): ModelCapabilities | null { const metadataModel = resolveModelForMetadata(modelString, providersConfig); return getModelCapabilities(metadataModel); @@ -168,7 +168,7 @@ export function getSupportedEndpoints(modelString: string): string[] | null { */ export function getSupportedEndpointsResolved( modelString: string, - providersConfig: ProvidersConfigMap | null + providersConfig: ProvidersConfigWithModels | null ): string[] | null { // Try the raw (possibly gateway-scoped) 
key first so provider-specific // endpoint overrides (e.g. `github_copilot/gpt-5.4`) take priority. diff --git a/src/common/utils/providers/modelEntries.ts b/src/common/utils/providers/modelEntries.ts index 03841c57d6..54588d02be 100644 --- a/src/common/utils/providers/modelEntries.ts +++ b/src/common/utils/providers/modelEntries.ts @@ -1,6 +1,16 @@ -import type { ProviderModelEntry, ProvidersConfigMap } from "@/common/orpc/types"; +import type { ProviderModelEntry } from "@/common/orpc/types"; import { normalizeToCanonical } from "@/common/utils/ai/models"; +/** + * Minimal providers-config shape needed for model-entry lookup. + * Both the raw disk config (`ProvidersConfig`) and the API-facing map + * (`ProvidersConfigMap`) satisfy this, so callers don't need to convert. + */ +export type ProvidersConfigWithModels = Record< + string, + { models?: ProviderModelEntry[] } | undefined +>; + interface ParsedProviderModelId { provider: string; modelId: string; @@ -37,7 +47,7 @@ function parseProviderModelId(fullModelId: string): ParsedProviderModelId | null } function findProviderModelEntry( - providersConfig: ProvidersConfigMap | null, + providersConfig: ProvidersConfigWithModels | null, provider: string, modelId: string ): ProviderModelEntry | null { @@ -65,7 +75,7 @@ function findProviderModelEntry( */ function findProviderModelEntryScoped( fullModelId: string, - providersConfig: ProvidersConfigMap | null + providersConfig: ProvidersConfigWithModels | null ): ProviderModelEntry | null { const rawParsed = parseProviderModelId(fullModelId); if (rawParsed) { @@ -94,7 +104,7 @@ function findProviderModelEntryScoped( export function getModelContextWindowOverride( fullModelId: string, - providersConfig: ProvidersConfigMap | null + providersConfig: ProvidersConfigWithModels | null ): number | null { const entry = findProviderModelEntryScoped(fullModelId, providersConfig); return entry ? 
getProviderModelEntryContextWindowTokens(entry) : null; @@ -102,7 +112,7 @@ export function getModelContextWindowOverride( export function resolveModelForMetadata( fullModelId: string, - providersConfig: ProvidersConfigMap | null + providersConfig: ProvidersConfigWithModels | null ): string { const entry = findProviderModelEntryScoped(fullModelId, providersConfig); return (entry ? getProviderModelEntryMappedTo(entry) : null) ?? fullModelId; diff --git a/src/node/services/providerModelFactory.ts b/src/node/services/providerModelFactory.ts index c80ef9fff4..b7cadb1034 100644 --- a/src/node/services/providerModelFactory.ts +++ b/src/node/services/providerModelFactory.ts @@ -1533,7 +1533,7 @@ export class ProviderModelFactory { // back to bare-model metadata via alias resolution. Conservative default: // use chat/completions when no endpoint metadata exists. const fullCopilotModelId = `github-copilot:${modelId}`; - const endpoints = getSupportedEndpointsResolved(fullCopilotModelId, null); + const endpoints = getSupportedEndpointsResolved(fullCopilotModelId, providersConfig); const supportsResponses = endpoints?.includes("/v1/responses") ?? false; // Prefer responses when available; fall back to chat (current behavior) // when only chat is supported or endpoint metadata is absent entirely. From 8e5a7fbc7941fe7913a40ecdddac153dfca6051f Mon Sep 17 00:00:00 2001 From: Soeren Magnus Olesen Date: Sun, 15 Mar 2026 21:02:02 +0100 Subject: [PATCH 05/11] fix: add Copilot Responses streaming adapter MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit Wrap GitHub Copilot's Responses-capable LanguageModelV3 to rebuild coherent V3 stream parts from raw SSE events, compensating for ordering differences in Copilot's /v1/responses endpoint. 
The wrapper: - Forces includeRawChunks: true on the inner model - Suppresses the inner model's text/tool semantic parts - Rebuilds text-start/delta/end and tool-input-start/delta/end/tool-call from raw Responses events keyed by item_id + output_index - Passes through everything else unchanged (finish, response-metadata, reasoning-*, source, raw, error, etc.) Only touches the doStream path; doGenerate is delegated unchanged. Wired into providerModelFactory.ts for the github-copilot /v1/responses branch only — non-Copilot providers and Copilot chat-completions are unchanged. --- .../__tests__/copilotResponsesModel.test.ts | 585 ++++++++++++++++++ src/node/services/copilotResponsesModel.ts | 387 ++++++++++++ src/node/services/providerModelFactory.ts | 3 +- 3 files changed, 974 insertions(+), 1 deletion(-) create mode 100644 src/node/services/__tests__/copilotResponsesModel.test.ts create mode 100644 src/node/services/copilotResponsesModel.ts diff --git a/src/node/services/__tests__/copilotResponsesModel.test.ts b/src/node/services/__tests__/copilotResponsesModel.test.ts new file mode 100644 index 0000000000..42fac1cb32 --- /dev/null +++ b/src/node/services/__tests__/copilotResponsesModel.test.ts @@ -0,0 +1,585 @@ +import { describe, expect, it } from "bun:test"; +import type { + LanguageModelV3, + LanguageModelV3CallOptions, + LanguageModelV3FinishReason, + LanguageModelV3StreamPart, + LanguageModelV3StreamResult, + LanguageModelV3Usage, +} from "@ai-sdk/provider"; +import { wrapCopilotResponsesModel } from "../copilotResponsesModel"; + +// --------------------------------------------------------------------------- +// Test helpers +// --------------------------------------------------------------------------- + +/** Minimal stub LanguageModelV3 whose doStream returns a hand-crafted stream. 
*/ +function createStubModel( + streamParts: LanguageModelV3StreamPart[] +): LanguageModelV3 & { lastStreamOptions: LanguageModelV3CallOptions | null } { + const stub = { + specificationVersion: "v3" as const, + provider: "github-copilot.responses", + modelId: "gpt-5.2", + supportedUrls: {}, + lastStreamOptions: null as LanguageModelV3CallOptions | null, + + doGenerate: () => { + throw new Error("doGenerate not implemented in stub"); + }, + + doStream(options: LanguageModelV3CallOptions): PromiseLike { + stub.lastStreamOptions = options; + return Promise.resolve({ + stream: new ReadableStream({ + start(controller) { + for (const part of streamParts) { + controller.enqueue(part); + } + controller.close(); + }, + }), + }); + }, + }; + return stub; +} + +/** Collect all parts from a ReadableStream. */ +async function collectStream( + stream: ReadableStream +): Promise { + const parts: LanguageModelV3StreamPart[] = []; + const reader = stream.getReader(); + for (;;) { + const { done, value } = await reader.read(); + if (done) break; + parts.push(value); + } + return parts; +} + +/** Build a raw chunk wrapping a Responses SSE event. */ +function raw(event: Record): LanguageModelV3StreamPart { + return { type: "raw", rawValue: event }; +} + +/** Build a V3-compliant usage object for tests. */ +function makeUsage(inputTotal: number, outputTotal: number): LanguageModelV3Usage { + return { + inputTokens: { + total: inputTotal, + noCache: undefined, + cacheRead: undefined, + cacheWrite: undefined, + }, + outputTokens: { total: outputTotal, text: undefined, reasoning: undefined }, + }; +} + +/** Build a finish stream part with V3-compliant usage. */ +function finish( + reason: LanguageModelV3FinishReason["unified"], + inputTotal: number, + outputTotal: number +): LanguageModelV3StreamPart { + // Use a typed variable to satisfy consistent-type-assertions lint rule. 
+ const part: LanguageModelV3StreamPart = { + type: "finish", + finishReason: { unified: reason, raw: reason }, + usage: makeUsage(inputTotal, outputTotal), + }; + return part; +} + +// --------------------------------------------------------------------------- +// Minimal stub call options +// --------------------------------------------------------------------------- +const baseOptions: LanguageModelV3CallOptions = { + prompt: [], +}; + +// --------------------------------------------------------------------------- +// Tests +// --------------------------------------------------------------------------- + +describe("wrapCopilotResponsesModel", () => { + describe("text lifecycle", () => { + it("rebuilds coherent text-start / text-delta / text-end from raw events", async () => { + const messageItemId = "msg_001"; + const stub = createStubModel([ + raw({ + type: "response.output_item.added", + item: { id: messageItemId, type: "message" }, + output_index: 0, + }), + raw({ + type: "response.output_text.delta", + item_id: messageItemId, + content_index: 0, + delta: "Hello", + }), + raw({ + type: "response.output_text.delta", + item_id: messageItemId, + content_index: 0, + delta: " world", + }), + raw({ + type: "response.output_item.done", + item: { id: messageItemId, type: "message" }, + output_index: 0, + }), + finish("stop", 10, 5), + ]); + + const wrapped = wrapCopilotResponsesModel(stub); + const result = await wrapped.doStream(baseOptions); + const parts = await collectStream(result.stream); + + // Should see coherent lifecycle from our wrapper + const types = parts.map((p) => p.type); + expect(types).toEqual([ + "text-start", // from response.output_item.added (message) + "text-delta", // from response.output_text.delta "Hello" + "text-delta", // from response.output_text.delta " world" + "text-end", // from response.output_item.done (message) + "finish", + ]); + + // Verify text content + const deltas = parts.filter((p) => p.type === "text-delta") as Array<{ + 
type: "text-delta"; + delta: string; + }>; + expect(deltas.map((d) => d.delta)).toEqual(["Hello", " world"]); + }); + + it("handles orphaned text deltas (delta before output_item.added)", async () => { + const messageItemId = "msg_orphan"; + const stub = createStubModel([ + // Copilot sends text delta BEFORE output_item.added — the wrapper should + // defensively emit text-start when it sees the first delta for an unknown item. + raw({ + type: "response.output_text.delta", + item_id: messageItemId, + content_index: 0, + delta: "Early", + }), + raw({ + type: "response.output_item.added", + item: { id: messageItemId, type: "message" }, + output_index: 0, + }), + raw({ + type: "response.output_text.delta", + item_id: messageItemId, + content_index: 0, + delta: " text", + }), + raw({ + type: "response.output_item.done", + item: { id: messageItemId, type: "message" }, + output_index: 0, + }), + finish("stop", 5, 3), + ]); + + const wrapped = wrapCopilotResponsesModel(stub); + const result = await wrapped.doStream(baseOptions); + const parts = await collectStream(result.stream); + + const types = parts.map((p) => p.type); + // The first delta triggers a defensive text-start. + // The output_item.added for message also triggers text-start (for a new key). + // But both share the same itemId, so output_item.done closes them. 
+ expect(types).toContain("text-start"); + expect(types).toContain("text-delta"); + expect(types).toContain("text-end"); + expect(types).toContain("finish"); + + // The deltas should both be present + const deltas = parts.filter((p) => p.type === "text-delta") as Array<{ + type: "text-delta"; + delta: string; + }>; + expect(deltas.map((d) => d.delta)).toContain("Early"); + expect(deltas.map((d) => d.delta)).toContain(" text"); + }); + }); + + describe("inner semantic part suppression", () => { + it("suppresses inner text-start/text-delta/text-end and rebuilds from raw", async () => { + // Simulates what the real inner model emits: both raw events AND semantic parts. + // The wrapper should suppress the semantic parts and only emit its own rebuilds. + const innerTextStart: LanguageModelV3StreamPart = { type: "text-start", id: "msg_sup" }; + const innerTextDelta: LanguageModelV3StreamPart = { + type: "text-delta", + id: "msg_sup", + delta: "Hi", + }; + const innerTextEnd: LanguageModelV3StreamPart = { type: "text-end", id: "msg_sup" }; + const stub = createStubModel([ + raw({ + type: "response.output_item.added", + item: { id: "msg_sup", type: "message" }, + output_index: 0, + }), + innerTextStart, + raw({ + type: "response.output_text.delta", + item_id: "msg_sup", + content_index: 0, + delta: "Hi", + }), + innerTextDelta, + raw({ + type: "response.output_item.done", + item: { id: "msg_sup", type: "message" }, + output_index: 0, + }), + innerTextEnd, + finish("stop", 1, 1), + ]); + + const wrapped = wrapCopilotResponsesModel(stub); + const result = await wrapped.doStream(baseOptions); + const parts = await collectStream(result.stream); + + // Should have exactly one text-start, one text-delta, one text-end — no duplicates + const types = parts.map((p) => p.type); + expect(types).toEqual(["text-start", "text-delta", "text-end", "finish"]); + }); + + it("suppresses inner tool-input-start/delta/end/tool-call and rebuilds from raw", async () => { + const innerToolStart: 
LanguageModelV3StreamPart = { + type: "tool-input-start", + id: "call_sup", + toolName: "bash", + }; + const innerToolDelta: LanguageModelV3StreamPart = { + type: "tool-input-delta", + id: "call_sup", + delta: "{}", + }; + const innerToolEnd: LanguageModelV3StreamPart = { type: "tool-input-end", id: "call_sup" }; + const innerToolCall: LanguageModelV3StreamPart = { + type: "tool-call", + toolCallId: "call_sup", + toolName: "bash", + input: "{}", + }; + + const stub = createStubModel([ + raw({ + type: "response.output_item.added", + item: { id: "fc_sup", type: "function_call", call_id: "call_sup", name: "bash" }, + output_index: 0, + }), + innerToolStart, + raw({ type: "response.function_call_arguments.delta", output_index: 0, delta: "{}" }), + innerToolDelta, + raw({ + type: "response.output_item.done", + item: { + id: "fc_sup", + type: "function_call", + call_id: "call_sup", + name: "bash", + arguments: "{}", + }, + output_index: 0, + }), + innerToolEnd, + innerToolCall, + finish("tool-calls", 1, 1), + ]); + + const wrapped = wrapCopilotResponsesModel(stub); + const result = await wrapped.doStream(baseOptions); + const parts = await collectStream(result.stream); + + // Should have exactly one of each — no duplicates from inner parts + const types = parts.map((p) => p.type); + expect(types).toEqual([ + "tool-input-start", + "tool-input-delta", + "tool-input-end", + "tool-call", + "finish", + ]); + }); + }); + + describe("tool call lifecycle", () => { + it("rebuilds tool-input-start / delta / end / tool-call from raw events", async () => { + const callId = "call_abc123"; + const toolName = "bash"; + const stub = createStubModel([ + raw({ + type: "response.output_item.added", + item: { id: "fc_001", type: "function_call", call_id: callId, name: toolName }, + output_index: 0, + }), + raw({ type: "response.function_call_arguments.delta", output_index: 0, delta: '{"script' }), + raw({ type: "response.function_call_arguments.delta", output_index: 0, delta: '":"ls"}' }), 
+ raw({ + type: "response.output_item.done", + item: { + id: "fc_001", + type: "function_call", + call_id: callId, + name: toolName, + arguments: '{"script":"ls"}', + }, + output_index: 0, + }), + finish("tool-calls", 20, 10), + ]); + + const wrapped = wrapCopilotResponsesModel(stub); + const result = await wrapped.doStream(baseOptions); + const parts = await collectStream(result.stream); + + const types = parts.map((p) => p.type); + expect(types).toEqual([ + "tool-input-start", + "tool-input-delta", + "tool-input-delta", + "tool-input-end", + "tool-call", + "finish", + ]); + + // Verify tool-call has correct args from output_item.done + const toolCall = parts.find((p) => p.type === "tool-call") as { + type: "tool-call"; + toolCallId: string; + toolName: string; + input: string; + }; + expect(toolCall.toolCallId).toBe(callId); + expect(toolCall.toolName).toBe(toolName); + expect(toolCall.input).toBe('{"script":"ls"}'); + }); + }); + + describe("finish / usage passthrough", () => { + it("passes through finish and response-metadata unchanged", async () => { + const responseMetadata: LanguageModelV3StreamPart = { + type: "response-metadata", + id: "resp_001", + timestamp: new Date("2024-01-01"), + modelId: "gpt-5.2", + }; + const stub = createStubModel([responseMetadata, finish("stop", 100, 50)]); + + const wrapped = wrapCopilotResponsesModel(stub); + const result = await wrapped.doStream(baseOptions); + const parts = await collectStream(result.stream); + + expect(parts).toHaveLength(2); + expect(parts[0].type).toBe("response-metadata"); + expect(parts[1].type).toBe("finish"); + + const finishPart = parts[1] as { type: "finish"; usage: unknown; finishReason: unknown }; + expect(finishPart.usage).toEqual(makeUsage(100, 50)); + }); + }); + + describe("terminal failure", () => { + it("emits error part from response.failed raw event", async () => { + const stub = createStubModel([ + raw({ + type: "response.failed", + response: { error: { message: "Rate limit exceeded", 
code: "rate_limit" } }, + }), + finish("error", 0, 0), + ]); + + const wrapped = wrapCopilotResponsesModel(stub); + const result = await wrapped.doStream(baseOptions); + const parts = await collectStream(result.stream); + + const errorPart = parts.find((p) => p.type === "error"); + expect(errorPart).toBeDefined(); + expect((errorPart as { type: "error"; error: unknown }).error).toEqual({ + message: "Rate limit exceeded", + code: "rate_limit", + }); + }); + }); + + describe("raw chunk passthrough", () => { + it("forwards raw chunks when outer caller requested them", async () => { + const stub = createStubModel([ + raw({ + type: "response.output_item.added", + item: { id: "msg_r", type: "message" }, + output_index: 0, + }), + raw({ + type: "response.output_text.delta", + item_id: "msg_r", + content_index: 0, + delta: "Hi", + }), + raw({ + type: "response.output_item.done", + item: { id: "msg_r", type: "message" }, + output_index: 0, + }), + finish("stop", 1, 1), + ]); + + const wrapped = wrapCopilotResponsesModel(stub); + const result = await wrapped.doStream({ ...baseOptions, includeRawChunks: true }); + const parts = await collectStream(result.stream); + + // Should include raw chunks alongside rebuilt semantic parts + const rawParts = parts.filter((p) => p.type === "raw"); + expect(rawParts.length).toBeGreaterThanOrEqual(3); + + // Should also include rebuilt semantic parts + const types = parts.filter((p) => p.type !== "raw").map((p) => p.type); + expect(types).toEqual(["text-start", "text-delta", "text-end", "finish"]); + }); + + it("suppresses raw chunks when outer caller did not request them", async () => { + const stub = createStubModel([ + raw({ + type: "response.output_item.added", + item: { id: "msg_s", type: "message" }, + output_index: 0, + }), + raw({ + type: "response.output_text.delta", + item_id: "msg_s", + content_index: 0, + delta: "Hi", + }), + raw({ + type: "response.output_item.done", + item: { id: "msg_s", type: "message" }, + output_index: 0, 
+ }), + finish("stop", 1, 1), + ]); + + const wrapped = wrapCopilotResponsesModel(stub); + const result = await wrapped.doStream(baseOptions); // no includeRawChunks + const parts = await collectStream(result.stream); + + // Should NOT include any raw chunks + expect(parts.filter((p) => p.type === "raw")).toHaveLength(0); + + // Should include rebuilt semantic parts + const types = parts.map((p) => p.type); + expect(types).toEqual(["text-start", "text-delta", "text-end", "finish"]); + }); + }); + + describe("includeRawChunks forwarding", () => { + it("always passes includeRawChunks: true to the inner model", async () => { + const stub = createStubModel([finish("stop", 0, 0)]); + + const wrapped = wrapCopilotResponsesModel(stub); + + // Call without includeRawChunks + await wrapped.doStream(baseOptions); + expect(stub.lastStreamOptions?.includeRawChunks).toBe(true); + }); + }); + + describe("doGenerate passthrough", () => { + it("delegates doGenerate to the inner model unchanged", async () => { + const expectedResult = { + content: [], + text: "test", + usage: makeUsage(5, 3), + finishReason: { unified: "stop" as const, raw: "stop" }, + response: {}, + warnings: [], + }; + + const stub = createStubModel([]); + stub.doGenerate = () => Promise.resolve(expectedResult) as never; + + const wrapped = wrapCopilotResponsesModel(stub); + const result = await wrapped.doGenerate(baseOptions); + expect(result).toBe(expectedResult); + }); + }); + + describe("mixed text and tool calls", () => { + it("handles interleaved text and tool call events", async () => { + const msgId = "msg_mixed"; + const callId = "call_mixed"; + const stub = createStubModel([ + // Text message starts + raw({ + type: "response.output_item.added", + item: { id: msgId, type: "message" }, + output_index: 0, + }), + raw({ + type: "response.output_text.delta", + item_id: msgId, + content_index: 0, + delta: "Let me ", + }), + raw({ + type: "response.output_text.delta", + item_id: msgId, + content_index: 0, + 
delta: "check.", + }), + raw({ + type: "response.output_item.done", + item: { id: msgId, type: "message" }, + output_index: 0, + }), + // Tool call + raw({ + type: "response.output_item.added", + item: { id: "fc_m", type: "function_call", call_id: callId, name: "file_read" }, + output_index: 1, + }), + raw({ + type: "response.function_call_arguments.delta", + output_index: 1, + delta: '{"path":"test.ts"}', + }), + raw({ + type: "response.output_item.done", + item: { + id: "fc_m", + type: "function_call", + call_id: callId, + name: "file_read", + arguments: '{"path":"test.ts"}', + }, + output_index: 1, + }), + finish("tool-calls", 30, 15), + ]); + + const wrapped = wrapCopilotResponsesModel(stub); + const result = await wrapped.doStream(baseOptions); + const parts = await collectStream(result.stream); + + const types = parts.map((p) => p.type); + expect(types).toEqual([ + "text-start", + "text-delta", + "text-delta", + "text-end", + "tool-input-start", + "tool-input-delta", + "tool-input-end", + "tool-call", + "finish", + ]); + }); + }); +}); diff --git a/src/node/services/copilotResponsesModel.ts b/src/node/services/copilotResponsesModel.ts new file mode 100644 index 0000000000..3485387303 --- /dev/null +++ b/src/node/services/copilotResponsesModel.ts @@ -0,0 +1,387 @@ +/** + * Copilot-only Responses streaming adapter. + * + * GitHub Copilot's /v1/responses endpoint can emit Responses API events + * in an order that differs from the standard OpenAI Responses API, causing + * the upstream SDK's V3 stream part translation to produce broken lifecycles + * (e.g., orphaned text-deltas, missing text-start/text-end pairs, or + * tool-call parts arriving before tool-input-end). + * + * This module wraps a Responses-capable LanguageModelV3 and rebuilds + * coherent V3 stream parts from raw SSE events. It only touches the + * `doStream` path; `doGenerate` is delegated unchanged. 
+ * + * The wrapper: + * - Forces `includeRawChunks: true` on the inner model + * - Suppresses the inner model's text/tool semantic parts (which may be broken) + * - Rebuilds text-start/text-delta/text-end and tool-input-start/delta/end/tool-call + * from raw Responses events keyed by item_id + content_index / output_index + * - Passes through everything else unchanged (finish, response-metadata, + * reasoning-*, source, raw, etc.) + */ + +import type { + LanguageModelV3, + LanguageModelV3CallOptions, + LanguageModelV3StreamPart, + LanguageModelV3StreamResult, +} from "@ai-sdk/provider"; + +// --------------------------------------------------------------------------- +// Raw Responses event type guards +// --------------------------------------------------------------------------- + +interface RawResponsesEvent { + type: string; + [key: string]: unknown; +} + +function isRawEvent(value: unknown): value is RawResponsesEvent { + return ( + typeof value === "object" && + value != null && + typeof (value as RawResponsesEvent).type === "string" + ); +} + +// response.output_item.added — item: { type: "message" | "function_call" | ... 
} +function isOutputItemAdded(ev: RawResponsesEvent): boolean { + return ev.type === "response.output_item.added"; +} + +// response.output_item.done +function isOutputItemDone(ev: RawResponsesEvent): boolean { + return ev.type === "response.output_item.done"; +} + +// response.output_text.delta +function isTextDelta(ev: RawResponsesEvent): boolean { + return ev.type === "response.output_text.delta"; +} + +// response.function_call_arguments.delta +function isFunctionCallArgsDelta(ev: RawResponsesEvent): boolean { + return ev.type === "response.function_call_arguments.delta"; +} + +// response.failed +function isResponseFailed(ev: RawResponsesEvent): boolean { + return ev.type === "response.failed"; +} + +// --------------------------------------------------------------------------- +// Helpers to extract fields from raw events +// --------------------------------------------------------------------------- + +function getItemId(ev: RawResponsesEvent): string | undefined { + // Some events use `item_id`, output_item events nest under `item.id` + if (typeof ev.item_id === "string") return ev.item_id; + const item = ev.item as Record | undefined; + if (item && typeof item.id === "string") return item.id; + return undefined; +} + +function getItemType(ev: RawResponsesEvent): string | undefined { + const item = ev.item as Record | undefined; + return item && typeof item.type === "string" ? item.type : undefined; +} + +function getOutputIndex(ev: RawResponsesEvent): number { + return typeof ev.output_index === "number" ? ev.output_index : 0; +} + +function getContentIndex(ev: RawResponsesEvent): number { + return typeof ev.content_index === "number" ? ev.content_index : 0; +} + +function getDelta(ev: RawResponsesEvent): string { + return typeof ev.delta === "string" ? 
ev.delta : ""; +} + +// --------------------------------------------------------------------------- +// Semantic part types suppressed from the inner stream +// --------------------------------------------------------------------------- + +/** Parts the wrapper rebuilds from raw events — suppress the inner model's versions. */ +const SUPPRESSED_INNER_TYPES = new Set([ + "text-start", + "text-delta", + "text-end", + "tool-input-start", + "tool-input-delta", + "tool-input-end", + "tool-call", +]); + +// --------------------------------------------------------------------------- +// Tracking state for open text / tool parts +// --------------------------------------------------------------------------- + +interface OpenTextPart { + itemId: string; + started: boolean; +} + +interface OpenToolCall { + itemId: string; + callId: string; + toolName: string; + args: string; + started: boolean; + finalized: boolean; +} + +// --------------------------------------------------------------------------- +// Stream transformer +// --------------------------------------------------------------------------- + +function createCopilotResponsesTransform( + outerWantsRaw: boolean +): TransformStream { + // Track open text parts by `${itemId}:${contentIndex}` + const openTexts = new Map(); + // Track open tool calls by output_index + const openTools = new Map(); + + return new TransformStream({ + transform(chunk, controller) { + // Always forward raw chunks if the outer caller wanted them + if (chunk.type === "raw") { + if (outerWantsRaw) { + controller.enqueue(chunk); + } + + // Process the raw event to rebuild semantic parts + const rawValue = chunk.rawValue; + if (!isRawEvent(rawValue)) return; + + processRawEvent(rawValue, controller); + return; + } + + // Suppress the inner model's semantic text/tool parts — we rebuild from raw + if (SUPPRESSED_INNER_TYPES.has(chunk.type)) { + return; + } + + // Pass through everything else: finish, response-metadata, reasoning-*, source, error, 
stream-start, etc. + controller.enqueue(chunk); + }, + + flush(controller) { + // Close any still-open text parts (defensive — should not happen in normal flow) + for (const [key, text] of openTexts) { + if (text.started) { + controller.enqueue({ type: "text-end", id: key }); + } + } + openTexts.clear(); + + // Finalize any still-open tool calls + for (const [, tool] of openTools) { + if (!tool.finalized) { + finalizeToolCall(tool, controller); + } + } + openTools.clear(); + }, + }); + + // ------------------------------------------- + // Raw event processing + // ------------------------------------------- + + function processRawEvent( + ev: RawResponsesEvent, + controller: TransformStreamDefaultController + ): void { + if (isOutputItemAdded(ev)) { + handleOutputItemAdded(ev, controller); + } else if (isTextDelta(ev)) { + handleTextDelta(ev, controller); + } else if (isFunctionCallArgsDelta(ev)) { + handleFunctionCallArgsDelta(ev, controller); + } else if (isOutputItemDone(ev)) { + handleOutputItemDone(ev, controller); + } else if (isResponseFailed(ev)) { + handleResponseFailed(ev, controller); + } + // response.created, response.completed, response.incomplete, + // response.reasoning_summary_*, response.output_text.annotation.*, + // etc. are either already handled by passthrough parts (finish, + // response-metadata, reasoning-*, source) or don't need semantic translation. + } + + function handleOutputItemAdded( + ev: RawResponsesEvent, + controller: TransformStreamDefaultController + ): void { + const itemType = getItemType(ev); + const itemId = getItemId(ev); + if (!itemId) return; + + if (itemType === "message") { + // A message item can have multiple content parts, but typically starts + // with index 0. We emit text-start eagerly here — the SDK does the same. 
+ const key = `${itemId}:${getContentIndex(ev)}`; + openTexts.set(key, { itemId, started: true }); + controller.enqueue({ type: "text-start", id: itemId }); + } else if (itemType === "function_call") { + const item = ev.item as Record; + const callId = typeof item.call_id === "string" ? item.call_id : itemId; + const toolName = typeof item.name === "string" ? item.name : "unknown"; + const outputIndex = getOutputIndex(ev); + + openTools.set(outputIndex, { + itemId, + callId, + toolName, + args: "", + started: true, + finalized: false, + }); + + controller.enqueue({ + type: "tool-input-start", + id: callId, + toolName, + }); + } + } + + function handleTextDelta( + ev: RawResponsesEvent, + controller: TransformStreamDefaultController + ): void { + const itemId = typeof ev.item_id === "string" ? ev.item_id : undefined; + if (!itemId) return; + + const contentIndex = getContentIndex(ev); + const key = `${itemId}:${contentIndex}`; + + // Ensure text-start was emitted (defensive against out-of-order events) + if (!openTexts.has(key)) { + openTexts.set(key, { itemId, started: true }); + controller.enqueue({ type: "text-start", id: itemId }); + } + + const delta = getDelta(ev); + if (delta.length > 0) { + controller.enqueue({ type: "text-delta", id: itemId, delta }); + } + } + + function handleFunctionCallArgsDelta( + ev: RawResponsesEvent, + controller: TransformStreamDefaultController + ): void { + const outputIndex = getOutputIndex(ev); + const tool = openTools.get(outputIndex); + if (!tool) return; + + const delta = getDelta(ev); + tool.args += delta; + + if (delta.length > 0) { + controller.enqueue({ type: "tool-input-delta", id: tool.callId, delta }); + } + } + + function handleOutputItemDone( + ev: RawResponsesEvent, + controller: TransformStreamDefaultController + ): void { + const itemType = getItemType(ev); + const itemId = getItemId(ev); + if (!itemId) return; + + if (itemType === "message") { + // Close all text parts for this message item + for (const [key, 
text] of openTexts) { + if (text.itemId === itemId && text.started) { + controller.enqueue({ type: "text-end", id: itemId }); + openTexts.delete(key); + } + } + } else if (itemType === "function_call") { + const outputIndex = getOutputIndex(ev); + const tool = openTools.get(outputIndex); + if (tool && !tool.finalized) { + // output_item.done for function_call contains the final arguments + const item = ev.item as Record; + if (typeof item.arguments === "string") { + tool.args = item.arguments; + } + finalizeToolCall(tool, controller); + openTools.delete(outputIndex); + } + } + } + + function finalizeToolCall( + tool: OpenToolCall, + controller: TransformStreamDefaultController + ): void { + if (tool.finalized) return; + tool.finalized = true; + + controller.enqueue({ type: "tool-input-end", id: tool.callId }); + controller.enqueue({ + type: "tool-call", + toolCallId: tool.callId, + toolName: tool.toolName, + input: tool.args, + }); + } + + function handleResponseFailed( + ev: RawResponsesEvent, + controller: TransformStreamDefaultController + ): void { + const response = ev.response as Record | undefined; + const error = response?.error ?? ev.error ?? "Copilot Responses request failed"; + controller.enqueue({ type: "error", error }); + } +} + +// --------------------------------------------------------------------------- +// Public wrapper +// --------------------------------------------------------------------------- + +/** + * Wrap a Responses-capable LanguageModelV3 for use with GitHub Copilot. + * + * The wrapper rebuilds coherent V3 text/tool stream parts from raw Responses + * events, compensating for ordering differences in Copilot's /v1/responses. + * + * - `doGenerate` is delegated unchanged. + * - `doStream` forces `includeRawChunks: true`, suppresses the inner model's + * text/tool semantic parts, and rebuilds them from the raw events. 
+ */ +export function wrapCopilotResponsesModel(inner: LanguageModelV3): LanguageModelV3 { + return { + specificationVersion: inner.specificationVersion, + provider: inner.provider, + modelId: inner.modelId, + supportedUrls: inner.supportedUrls, + + doGenerate: (options: LanguageModelV3CallOptions) => inner.doGenerate(options), + + async doStream(options: LanguageModelV3CallOptions): Promise { + const outerWantsRaw = options.includeRawChunks === true; + + // Force raw chunks so we can rebuild semantics from SSE events + const innerOptions: LanguageModelV3CallOptions = { + ...options, + includeRawChunks: true, + }; + + const result = await inner.doStream(innerOptions); + + return { + ...result, + stream: result.stream.pipeThrough(createCopilotResponsesTransform(outerWantsRaw)), + }; + }, + }; +} diff --git a/src/node/services/providerModelFactory.ts b/src/node/services/providerModelFactory.ts index b7cadb1034..b077a0a93d 100644 --- a/src/node/services/providerModelFactory.ts +++ b/src/node/services/providerModelFactory.ts @@ -41,6 +41,7 @@ import { normalizeGatewayStreamUsage, normalizeGatewayGenerateResult, } from "@/node/utils/gatewayStreamNormalization"; +import { wrapCopilotResponsesModel } from "@/node/services/copilotResponsesModel"; import { EnvHttpProxyAgent, type Dispatcher } from "undici"; import packageJson from "../../../package.json"; @@ -1551,7 +1552,7 @@ export class ProviderModelFactory { apiKey: "copilot", // placeholder — actual auth via custom fetch fetch: providerFetch, }); - return Ok(provider.responses(modelId)); + return Ok(wrapCopilotResponsesModel(provider.responses(modelId))); } const { createOpenAICompatible } = await PROVIDER_REGISTRY["github-copilot"](); From cfc1473bb79dc051c3f89d81647f85c6ca8d71ed Mon Sep 17 00:00:00 2001 From: Soeren Magnus Olesen Date: Sun, 15 Mar 2026 21:11:24 +0100 Subject: [PATCH 06/11] feat(copilot-responses): handle remaining lifecycle events from accepted plan MIME-Version: 1.0 Content-Type: text/plain; 
charset=UTF-8 Content-Transfer-Encoding: 8bit Extend the Copilot Responses adapter to handle the raw lifecycle events that were called out in the accepted plan but not covered in the initial implementation: Adapter (copilotResponsesModel.ts): - response.content_part.added (output_text) → text-start + optional initial text-delta when part carries inline text - response.output_text.done → reconcile trailing text if accumulated deltas are shorter than the final text - response.content_part.done → text-end (so output_item.done becomes a fallback-only closer for text parts) - response.function_call_arguments.done → reconcile args, then tool-input-end + tool-call (so output_item.done becomes a fallback-only finalizer for tool calls) - Added accum field to OpenTextPart for delta reconciliation - Added helper extractors: getPartType, getPartText, getText, getArguments Tests (copilotResponsesModel.test.ts — 10 new tests): - content_part lifecycle: multi-part text, initial text in content_part.added, non-output_text filtering - output_text.done reconciliation: trailing text emission and no-op when text matches - function_call_arguments.done: finalize-from-done making output_item.done a no-op, incomplete-delta reconciliation - content_part.done closes before output_item.done (no double-close) - Full plan lifecycle ordering: exact event sequence from the accepted plan that previously tripped 'text part not found' Factory tests (providerModelFactory.test.ts — 3 new tests): - Spy-based assertions that wrapCopilotResponsesModel is invoked for responses-capable Copilot models (gpt-5.2) - Not invoked for chat-only Copilot models (claude-sonnet-4) - Not invoked when endpoint metadata is absent (gpt-4o) --- .../__tests__/copilotResponsesModel.test.ts | 448 ++++++++++++++++++ src/node/services/copilotResponsesModel.ts | 166 ++++++- .../services/providerModelFactory.test.ts | 77 ++- 3 files changed, 687 insertions(+), 4 deletions(-) diff --git 
a/src/node/services/__tests__/copilotResponsesModel.test.ts b/src/node/services/__tests__/copilotResponsesModel.test.ts index 42fac1cb32..cbdaf93c9b 100644 --- a/src/node/services/__tests__/copilotResponsesModel.test.ts +++ b/src/node/services/__tests__/copilotResponsesModel.test.ts @@ -511,6 +511,454 @@ describe("wrapCopilotResponsesModel", () => { }); }); + describe("content_part lifecycle events", () => { + it("rebuilds text lifecycle from content_part.added / output_text.done / content_part.done", async () => { + const messageItemId = "msg_cp"; + const stub = createStubModel([ + // output_item.added for the message + raw({ + type: "response.output_item.added", + item: { id: messageItemId, type: "message" }, + output_index: 0, + }), + // content_part.added with output_text type — should emit text-start + // (but output_item.added already started one at index 0, so this is + // for a second content part at index 1) + raw({ + type: "response.content_part.added", + item_id: messageItemId, + content_index: 1, + part: { type: "output_text", text: "" }, + }), + // Text deltas for second content part + raw({ + type: "response.output_text.delta", + item_id: messageItemId, + content_index: 1, + delta: "Hello", + }), + raw({ + type: "response.output_text.delta", + item_id: messageItemId, + content_index: 1, + delta: " world", + }), + // output_text.done reconciliation + raw({ + type: "response.output_text.done", + item_id: messageItemId, + content_index: 1, + text: "Hello world", + }), + // content_part.done closes the text part + raw({ + type: "response.content_part.done", + item_id: messageItemId, + content_index: 1, + part: { type: "output_text", text: "Hello world" }, + }), + // Close any remaining text from output_item + raw({ + type: "response.output_item.done", + item: { id: messageItemId, type: "message" }, + output_index: 0, + }), + finish("stop", 10, 5), + ]); + + const wrapped = wrapCopilotResponsesModel(stub); + const result = await 
wrapped.doStream(baseOptions); + const parts = await collectStream(result.stream); + + const types = parts.map((p) => p.type); + + // First text-start from output_item.added (index 0), second from content_part.added (index 1) + expect(types).toEqual([ + "text-start", // from output_item.added (message, content_index 0) + "text-start", // from content_part.added (output_text, content_index 1) + "text-delta", // "Hello" + "text-delta", // " world" + "text-end", // from content_part.done (content_index 1) + "text-end", // from output_item.done fallback (content_index 0) + "finish", + ]); + + const deltas = parts.filter((p) => p.type === "text-delta") as Array<{ + type: "text-delta"; + delta: string; + }>; + expect(deltas.map((d) => d.delta)).toEqual(["Hello", " world"]); + }); + + it("content_part.added emits text-start and initial delta when part carries text", async () => { + const messageItemId = "msg_cp_init"; + const stub = createStubModel([ + raw({ + type: "response.content_part.added", + item_id: messageItemId, + content_index: 0, + part: { type: "output_text", text: "Initial" }, + }), + raw({ + type: "response.output_text.delta", + item_id: messageItemId, + content_index: 0, + delta: " more", + }), + raw({ + type: "response.content_part.done", + item_id: messageItemId, + content_index: 0, + part: { type: "output_text", text: "Initial more" }, + }), + finish("stop", 5, 3), + ]); + + const wrapped = wrapCopilotResponsesModel(stub); + const result = await wrapped.doStream(baseOptions); + const parts = await collectStream(result.stream); + + const types = parts.map((p) => p.type); + expect(types).toEqual([ + "text-start", // from content_part.added + "text-delta", // "Initial" (initial text from content_part.added) + "text-delta", // " more" (from output_text.delta) + "text-end", // from content_part.done + "finish", + ]); + + const deltas = parts.filter((p) => p.type === "text-delta") as Array<{ + type: "text-delta"; + delta: string; + }>; + expect(deltas.map((d) 
=> d.delta)).toEqual(["Initial", " more"]); + }); + + it("ignores content_part.added for non-output_text types", async () => { + const messageItemId = "msg_cp_other"; + const stub = createStubModel([ + // A content_part.added with an unsupported type should not trigger text-start + raw({ + type: "response.content_part.added", + item_id: messageItemId, + content_index: 0, + part: { type: "refusal", refusal: "I cannot help with that" }, + }), + finish("stop", 5, 1), + ]); + + const wrapped = wrapCopilotResponsesModel(stub); + const result = await wrapped.doStream(baseOptions); + const parts = await collectStream(result.stream); + + const types = parts.map((p) => p.type); + expect(types).toEqual(["finish"]); + }); + }); + + describe("output_text.done reconciliation", () => { + it("emits trailing text delta when output_text.done has more text than accumulated deltas", async () => { + const messageItemId = "msg_reconcile"; + const stub = createStubModel([ + raw({ + type: "response.output_item.added", + item: { id: messageItemId, type: "message" }, + output_index: 0, + }), + raw({ + type: "response.output_text.delta", + item_id: messageItemId, + content_index: 0, + delta: "Hello", + }), + // output_text.done has final text that includes trailing content not in deltas + raw({ + type: "response.output_text.done", + item_id: messageItemId, + content_index: 0, + text: "Hello world", + }), + raw({ + type: "response.output_item.done", + item: { id: messageItemId, type: "message" }, + output_index: 0, + }), + finish("stop", 10, 5), + ]); + + const wrapped = wrapCopilotResponsesModel(stub); + const result = await wrapped.doStream(baseOptions); + const parts = await collectStream(result.stream); + + const types = parts.map((p) => p.type); + expect(types).toEqual([ + "text-start", + "text-delta", // "Hello" from delta + "text-delta", // " world" reconciled from output_text.done + "text-end", // from output_item.done fallback + "finish", + ]); + + const deltas = parts.filter((p) => 
p.type === "text-delta") as Array<{ + type: "text-delta"; + delta: string; + }>; + expect(deltas.map((d) => d.delta)).toEqual(["Hello", " world"]); + }); + + it("does not emit extra delta when output_text.done matches accumulated text", async () => { + const messageItemId = "msg_no_reconcile"; + const stub = createStubModel([ + raw({ + type: "response.output_item.added", + item: { id: messageItemId, type: "message" }, + output_index: 0, + }), + raw({ + type: "response.output_text.delta", + item_id: messageItemId, + content_index: 0, + delta: "Hello world", + }), + // output_text.done matches exactly — no reconciliation needed + raw({ + type: "response.output_text.done", + item_id: messageItemId, + content_index: 0, + text: "Hello world", + }), + raw({ + type: "response.output_item.done", + item: { id: messageItemId, type: "message" }, + output_index: 0, + }), + finish("stop", 10, 5), + ]); + + const wrapped = wrapCopilotResponsesModel(stub); + const result = await wrapped.doStream(baseOptions); + const parts = await collectStream(result.stream); + + const types = parts.map((p) => p.type); + // Only one text-delta — no extra reconciliation delta + expect(types).toEqual(["text-start", "text-delta", "text-end", "finish"]); + + const deltas = parts.filter((p) => p.type === "text-delta") as Array<{ + type: "text-delta"; + delta: string; + }>; + expect(deltas).toHaveLength(1); + expect(deltas[0].delta).toBe("Hello world"); + }); + }); + + describe("function_call_arguments.done lifecycle", () => { + it("finalizes tool call from arguments.done, making output_item.done a no-op", async () => { + const callId = "call_argsdone"; + const toolName = "bash"; + const stub = createStubModel([ + raw({ + type: "response.output_item.added", + item: { id: "fc_ad", type: "function_call", call_id: callId, name: toolName }, + output_index: 0, + }), + raw({ type: "response.function_call_arguments.delta", output_index: 0, delta: '{"script' }), + raw({ type: 
"response.function_call_arguments.delta", output_index: 0, delta: '":"ls"}' }), + // function_call_arguments.done delivers final args and finalizes the tool + raw({ + type: "response.function_call_arguments.done", + output_index: 0, + arguments: '{"script":"ls"}', + }), + // output_item.done should be a no-op since args-done already finalized + raw({ + type: "response.output_item.done", + item: { + id: "fc_ad", + type: "function_call", + call_id: callId, + name: toolName, + arguments: '{"script":"ls"}', + }, + output_index: 0, + }), + finish("tool-calls", 20, 10), + ]); + + const wrapped = wrapCopilotResponsesModel(stub); + const result = await wrapped.doStream(baseOptions); + const parts = await collectStream(result.stream); + + const types = parts.map((p) => p.type); + // Only one tool-input-end and one tool-call — not doubled by output_item.done + expect(types).toEqual([ + "tool-input-start", + "tool-input-delta", + "tool-input-delta", + "tool-input-end", + "tool-call", + "finish", + ]); + + const toolCall = parts.find((p) => p.type === "tool-call") as { + type: "tool-call"; + toolCallId: string; + toolName: string; + input: string; + }; + expect(toolCall.toolCallId).toBe(callId); + expect(toolCall.toolName).toBe(toolName); + expect(toolCall.input).toBe('{"script":"ls"}'); + }); + + it("reconciles arguments from done event when deltas were incomplete", async () => { + const callId = "call_reconcile_args"; + const toolName = "file_read"; + const stub = createStubModel([ + raw({ + type: "response.output_item.added", + item: { id: "fc_ra", type: "function_call", call_id: callId, name: toolName }, + output_index: 0, + }), + // Only partial arguments via delta + raw({ type: "response.function_call_arguments.delta", output_index: 0, delta: '{"path":' }), + // Done event carries the full arguments + raw({ + type: "response.function_call_arguments.done", + output_index: 0, + arguments: '{"path":"src/test.ts"}', + }), + finish("tool-calls", 10, 5), + ]); + + const 
wrapped = wrapCopilotResponsesModel(stub); + const result = await wrapped.doStream(baseOptions); + const parts = await collectStream(result.stream); + + const toolCall = parts.find((p) => p.type === "tool-call") as { + type: "tool-call"; + input: string; + }; + // Final input should be from the done event, not the incomplete deltas + expect(toolCall.input).toBe('{"path":"src/test.ts"}'); + }); + }); + + describe("content_part.done closes text before output_item.done", () => { + it("content_part.done emits text-end so output_item.done does not double-close", async () => { + const messageItemId = "msg_cp_first"; + const stub = createStubModel([ + raw({ + type: "response.output_item.added", + item: { id: messageItemId, type: "message" }, + output_index: 0, + }), + raw({ + type: "response.output_text.delta", + item_id: messageItemId, + content_index: 0, + delta: "Hi", + }), + // content_part.done closes the text part + raw({ + type: "response.content_part.done", + item_id: messageItemId, + content_index: 0, + part: { type: "output_text", text: "Hi" }, + }), + // output_item.done should not double-close + raw({ + type: "response.output_item.done", + item: { id: messageItemId, type: "message" }, + output_index: 0, + }), + finish("stop", 5, 2), + ]); + + const wrapped = wrapCopilotResponsesModel(stub); + const result = await wrapped.doStream(baseOptions); + const parts = await collectStream(result.stream); + + const types = parts.map((p) => p.type); + // Exactly one text-end, not two + expect(types).toEqual(["text-start", "text-delta", "text-end", "finish"]); + }); + }); + + describe("full plan lifecycle ordering", () => { + it("handles the complete content_part event sequence from the plan", async () => { + // Simulates the exact sequence from the accepted plan: + // content_part.added → output_text.delta → output_text.done → content_part.done → output_item.done + // This is the ordering that would previously trip "text part not found". 
+ const messageItemId = "msg_plan"; + const stub = createStubModel([ + raw({ + type: "response.output_item.added", + item: { id: messageItemId, type: "message" }, + output_index: 0, + }), + raw({ + type: "response.content_part.added", + item_id: messageItemId, + content_index: 0, + part: { type: "output_text", text: "" }, + }), + raw({ + type: "response.output_text.delta", + item_id: messageItemId, + content_index: 0, + delta: "Test ", + }), + raw({ + type: "response.output_text.delta", + item_id: messageItemId, + content_index: 0, + delta: "output", + }), + raw({ + type: "response.output_text.done", + item_id: messageItemId, + content_index: 0, + text: "Test output", + }), + raw({ + type: "response.content_part.done", + item_id: messageItemId, + content_index: 0, + part: { type: "output_text", text: "Test output" }, + }), + raw({ + type: "response.output_item.done", + item: { id: messageItemId, type: "message" }, + output_index: 0, + }), + finish("stop", 15, 8), + ]); + + const wrapped = wrapCopilotResponsesModel(stub); + const result = await wrapped.doStream(baseOptions); + const parts = await collectStream(result.stream); + + const types = parts.map((p) => p.type); + // output_item.added emits text-start for index 0, + // content_part.added sees key already exists so does NOT emit duplicate text-start, + // deltas emit text-delta, output_text.done is a no-op (matches accumulated), + // content_part.done emits text-end, output_item.done is a no-op (already closed) + expect(types).toEqual([ + "text-start", + "text-delta", // "Test " + "text-delta", // "output" + "text-end", + "finish", + ]); + + const deltas = parts.filter((p) => p.type === "text-delta") as Array<{ + type: "text-delta"; + delta: string; + }>; + expect(deltas.map((d) => d.delta)).toEqual(["Test ", "output"]); + }); + }); describe("mixed text and tool calls", () => { it("handles interleaved text and tool call events", async () => { const msgId = "msg_mixed"; diff --git 
a/src/node/services/copilotResponsesModel.ts b/src/node/services/copilotResponsesModel.ts index 3485387303..67be9ac61b 100644 --- a/src/node/services/copilotResponsesModel.ts +++ b/src/node/services/copilotResponsesModel.ts @@ -64,6 +64,26 @@ function isFunctionCallArgsDelta(ev: RawResponsesEvent): boolean { return ev.type === "response.function_call_arguments.delta"; } +// response.content_part.added +function isContentPartAdded(ev: RawResponsesEvent): boolean { + return ev.type === "response.content_part.added"; +} + +// response.content_part.done +function isContentPartDone(ev: RawResponsesEvent): boolean { + return ev.type === "response.content_part.done"; +} + +// response.output_text.done +function isTextDone(ev: RawResponsesEvent): boolean { + return ev.type === "response.output_text.done"; +} + +// response.function_call_arguments.done +function isFunctionCallArgsDone(ev: RawResponsesEvent): boolean { + return ev.type === "response.function_call_arguments.done"; +} + // response.failed function isResponseFailed(ev: RawResponsesEvent): boolean { return ev.type === "response.failed"; @@ -98,6 +118,24 @@ function getDelta(ev: RawResponsesEvent): string { return typeof ev.delta === "string" ? ev.delta : ""; } +function getPartType(ev: RawResponsesEvent): string | undefined { + const part = ev.part as Record | undefined; + return part && typeof part.type === "string" ? part.type : undefined; +} + +function getPartText(ev: RawResponsesEvent): string | undefined { + const part = ev.part as Record | undefined; + return part && typeof part.text === "string" ? part.text : undefined; +} + +function getText(ev: RawResponsesEvent): string | undefined { + return typeof ev.text === "string" ? ev.text : undefined; +} + +function getArguments(ev: RawResponsesEvent): string | undefined { + return typeof ev.arguments === "string" ? 
ev.arguments : undefined; +} + // --------------------------------------------------------------------------- // Semantic part types suppressed from the inner stream // --------------------------------------------------------------------------- @@ -120,6 +158,8 @@ const SUPPRESSED_INNER_TYPES = new Set([ interface OpenTextPart { itemId: string; started: boolean; + /** Accumulated text from deltas, used for reconciliation in output_text.done. */ + accum: string; } interface OpenToolCall { @@ -197,10 +237,18 @@ function createCopilotResponsesTransform( ): void { if (isOutputItemAdded(ev)) { handleOutputItemAdded(ev, controller); + } else if (isContentPartAdded(ev)) { + handleContentPartAdded(ev, controller); } else if (isTextDelta(ev)) { handleTextDelta(ev, controller); + } else if (isTextDone(ev)) { + handleTextDone(ev, controller); + } else if (isContentPartDone(ev)) { + handleContentPartDone(ev, controller); } else if (isFunctionCallArgsDelta(ev)) { handleFunctionCallArgsDelta(ev, controller); + } else if (isFunctionCallArgsDone(ev)) { + handleFunctionCallArgsDone(ev, controller); } else if (isOutputItemDone(ev)) { handleOutputItemDone(ev, controller); } else if (isResponseFailed(ev)) { @@ -224,7 +272,7 @@ function createCopilotResponsesTransform( // A message item can have multiple content parts, but typically starts // with index 0. We emit text-start eagerly here — the SDK does the same. 
const key = `${itemId}:${getContentIndex(ev)}`; - openTexts.set(key, { itemId, started: true }); + openTexts.set(key, { itemId, started: true, accum: "" }); controller.enqueue({ type: "text-start", id: itemId }); } else if (itemType === "function_call") { const item = ev.item as Record; @@ -261,16 +309,96 @@ function createCopilotResponsesTransform( // Ensure text-start was emitted (defensive against out-of-order events) if (!openTexts.has(key)) { - openTexts.set(key, { itemId, started: true }); + openTexts.set(key, { itemId, started: true, accum: "" }); controller.enqueue({ type: "text-start", id: itemId }); } const delta = getDelta(ev); if (delta.length > 0) { + const text = openTexts.get(key)!; + text.accum += delta; controller.enqueue({ type: "text-delta", id: itemId, delta }); } } + /** + * response.content_part.added — emitted when a new content part (e.g., output_text) + * is added to a message item. Triggers text-start if not already started, plus an + * optional initial text-delta if the part carries inline text. + */ + function handleContentPartAdded( + ev: RawResponsesEvent, + controller: TransformStreamDefaultController + ): void { + const itemId = typeof ev.item_id === "string" ? 
ev.item_id : undefined; + if (!itemId) return; + + const partType = getPartType(ev); + // Only handle output_text content parts + if (partType !== "output_text") return; + + const contentIndex = getContentIndex(ev); + const key = `${itemId}:${contentIndex}`; + + if (!openTexts.has(key)) { + openTexts.set(key, { itemId, started: true, accum: "" }); + controller.enqueue({ type: "text-start", id: itemId }); + } + + // Some servers include initial text inline in the content_part.added event + const initialText = getPartText(ev); + if (initialText && initialText.length > 0) { + const text = openTexts.get(key)!; + text.accum += initialText; + controller.enqueue({ type: "text-delta", id: itemId, delta: initialText }); + } + } + + /** + * response.output_text.done — emitted when the full text for a content part + * is finalized. Reconciles any trailing text that was not delivered via deltas. + */ + function handleTextDone( + ev: RawResponsesEvent, + controller: TransformStreamDefaultController + ): void { + const itemId = typeof ev.item_id === "string" ? ev.item_id : undefined; + if (!itemId) return; + + const contentIndex = getContentIndex(ev); + const key = `${itemId}:${contentIndex}`; + const finalText = getText(ev); + + const text = openTexts.get(key); + if (text && finalText != null && finalText.length > text.accum.length) { + // Emit any trailing text that the deltas missed + const trailing = finalText.slice(text.accum.length); + text.accum = finalText; + controller.enqueue({ type: "text-delta", id: itemId, delta: trailing }); + } + } + + /** + * response.content_part.done — emitted when a content part is fully done. + * Closes the text part with text-end. + */ + function handleContentPartDone( + ev: RawResponsesEvent, + controller: TransformStreamDefaultController + ): void { + const itemId = typeof ev.item_id === "string" ? 
ev.item_id : undefined; + if (!itemId) return; + + const contentIndex = getContentIndex(ev); + const key = `${itemId}:${contentIndex}`; + + const text = openTexts.get(key); + if (text && text.started) { + controller.enqueue({ type: "text-end", id: itemId }); + openTexts.delete(key); + } + } + function handleFunctionCallArgsDelta( ev: RawResponsesEvent, controller: TransformStreamDefaultController @@ -287,6 +415,37 @@ function createCopilotResponsesTransform( } } + /** + * response.function_call_arguments.done — emitted when the final arguments + * for a function call are available. Reconciles accumulated args and finalizes + * the tool call (tool-input-end + tool-call), so output_item.done becomes + * a no-op fallback for this tool. + */ + function handleFunctionCallArgsDone( + ev: RawResponsesEvent, + controller: TransformStreamDefaultController + ): void { + const outputIndex = getOutputIndex(ev); + const tool = openTools.get(outputIndex); + if (!tool || tool.finalized) return; + + // Reconcile final arguments from the done event + const finalArgs = getArguments(ev); + if (finalArgs != null) { + tool.args = finalArgs; + } + + finalizeToolCall(tool, controller); + openTools.delete(outputIndex); + } + + /** + * response.output_item.done — fallback finalization. + * For message items: closes any still-open text parts that content_part.done did not + * already close (e.g., when the server omits content_part events). + * For function_call items: finalizes only if function_call_arguments.done was not + * received (the tool will already be deleted from openTools if args-done ran). 
+ */ function handleOutputItemDone( ev: RawResponsesEvent, controller: TransformStreamDefaultController @@ -296,7 +455,7 @@ function createCopilotResponsesTransform( if (!itemId) return; if (itemType === "message") { - // Close all text parts for this message item + // Fallback: close any text parts that content_part.done did not already close for (const [key, text] of openTexts) { if (text.itemId === itemId && text.started) { controller.enqueue({ type: "text-end", id: itemId }); @@ -304,6 +463,7 @@ function createCopilotResponsesTransform( } } } else if (itemType === "function_call") { + // Fallback: finalize only if function_call_arguments.done did not already do so const outputIndex = getOutputIndex(ev); const tool = openTools.get(outputIndex); if (tool && !tool.finalized) { diff --git a/src/node/services/providerModelFactory.test.ts b/src/node/services/providerModelFactory.test.ts index 216d0c0fed..a1a1f44481 100644 --- a/src/node/services/providerModelFactory.test.ts +++ b/src/node/services/providerModelFactory.test.ts @@ -1,4 +1,4 @@ -import { describe, expect, it } from "bun:test"; +import { describe, expect, it, spyOn } from "bun:test"; import * as fs from "fs"; import * as os from "os"; import * as path from "path"; @@ -13,6 +13,7 @@ import { resolveAIProviderHeaderSource, } from "./providerModelFactory"; import { ProviderService } from "./providerService"; +import * as copilotResponsesModule from "./copilotResponsesModel"; async function withTempConfig( run: (config: Config, factory: ProviderModelFactory) => Promise | void @@ -549,6 +550,80 @@ describe("ProviderModelFactory Copilot endpoint selection", () => { }); }); +describe("ProviderModelFactory Copilot wrapper invocation", () => { + it("invokes wrapCopilotResponsesModel for a responses-capable Copilot model", async () => { + const wrapSpy = spyOn(copilotResponsesModule, "wrapCopilotResponsesModel"); + try { + await withTempConfig(async (config, factory) => { + config.saveProvidersConfig({ + 
"github-copilot": { + apiKey: "ghu_test", + }, + }); + + wrapSpy.mockClear(); + + // gpt-5.2 has Copilot-scoped metadata with /v1/responses support + const result = await factory.createModel("github-copilot:gpt-5.2"); + expect(result.success).toBe(true); + + // The wrapper must have been called exactly once for the responses branch + expect(wrapSpy).toHaveBeenCalledTimes(1); + }); + } finally { + wrapSpy.mockRestore(); + } + }); + + it("does not invoke wrapCopilotResponsesModel for a chat-only Copilot model", async () => { + const wrapSpy = spyOn(copilotResponsesModule, "wrapCopilotResponsesModel"); + try { + await withTempConfig(async (config, factory) => { + config.saveProvidersConfig({ + "github-copilot": { + apiKey: "ghu_test", + }, + }); + + wrapSpy.mockClear(); + + // claude-sonnet-4 has supported_endpoints: ["/v1/chat/completions"] only + const result = await factory.createModel("github-copilot:claude-sonnet-4"); + expect(result.success).toBe(true); + + // The wrapper should NOT be called for chat-only models + expect(wrapSpy).not.toHaveBeenCalled(); + }); + } finally { + wrapSpy.mockRestore(); + } + }); + + it("does not invoke wrapCopilotResponsesModel when endpoint metadata is absent", async () => { + const wrapSpy = spyOn(copilotResponsesModule, "wrapCopilotResponsesModel"); + try { + await withTempConfig(async (config, factory) => { + config.saveProvidersConfig({ + "github-copilot": { + apiKey: "ghu_test", + }, + }); + + wrapSpy.mockClear(); + + // gpt-4o has no supported_endpoints metadata — should fall back to chat + const result = await factory.createModel("github-copilot:gpt-4o"); + expect(result.success).toBe(true); + + // No wrapper invocation for metadata-missing models + expect(wrapSpy).not.toHaveBeenCalled(); + }); + } finally { + wrapSpy.mockRestore(); + } + }); +}); + describe("classifyCopilotInitiator", () => { it("returns 'user' when last message role is user", () => { const body = JSON.stringify({ messages: [{ role: "user", content: "hello" 
}] }); From 8cdb250bb6bdb664ef70b62a571e24e8082d1d5c Mon Sep 17 00:00:00 2001 From: Soeren Magnus Olesen Date: Sun, 15 Mar 2026 21:13:29 +0100 Subject: [PATCH 07/11] fix: use optional chaining in copilotResponsesModel (prefer-optional-chain) --- src/node/services/copilotResponsesModel.ts | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/src/node/services/copilotResponsesModel.ts b/src/node/services/copilotResponsesModel.ts index 67be9ac61b..96141ad1d9 100644 --- a/src/node/services/copilotResponsesModel.ts +++ b/src/node/services/copilotResponsesModel.ts @@ -393,7 +393,7 @@ function createCopilotResponsesTransform( const key = `${itemId}:${contentIndex}`; const text = openTexts.get(key); - if (text && text.started) { + if (text?.started) { controller.enqueue({ type: "text-end", id: itemId }); openTexts.delete(key); } From 772ab914d11ca1883adffbbb2b0b6ed0853356ad Mon Sep 17 00:00:00 2001 From: Soeren Magnus Olesen Date: Sun, 15 Mar 2026 21:32:32 +0100 Subject: [PATCH 08/11] fix(copilot): use external itemId in flush() text-end, not internal map key The flush() fallback in the Copilot Responses transform was emitting text-end with the internal tracking key (`${itemId}:${contentIndex}`) instead of the external itemId used by text-start. This caused 'text part :0 not found' errors when a stream ended with an open text part (no content_part.done / output_item.done received). Fix: use `text.itemId` (the stored external id) instead of the map key in the flush loop. Add regression test that simulates a stream ending after output_item.added + text delta + finish (without content_part.done or output_item.done), and asserts the flush-emitted text-end id matches the original external itemId. 
--- .../__tests__/copilotResponsesModel.test.ts | 59 +++++++++++++++++++ src/node/services/copilotResponsesModel.ts | 8 ++- 2 files changed, 64 insertions(+), 3 deletions(-) diff --git a/src/node/services/__tests__/copilotResponsesModel.test.ts b/src/node/services/__tests__/copilotResponsesModel.test.ts index cbdaf93c9b..ac24aad7fc 100644 --- a/src/node/services/__tests__/copilotResponsesModel.test.ts +++ b/src/node/services/__tests__/copilotResponsesModel.test.ts @@ -206,6 +206,65 @@ describe("wrapCopilotResponsesModel", () => { expect(deltas.map((d) => d.delta)).toContain("Early"); expect(deltas.map((d) => d.delta)).toContain(" text"); }); + + // Regression: flush() used to emit text-end with the internal map key + // (`${itemId}:${contentIndex}`) instead of the external itemId, producing + // "text part :0 not found" errors when the stream ended with an + // open text part (no content_part.done / output_item.done received). + it("flush emits text-end with the external itemId, not the internal key", async () => { + const messageItemId = "msg_flush_regression"; + // Stream that opens a text part but never closes it — no content_part.done + // or output_item.done, just a finish event followed by stream close. + const stub = createStubModel([ + raw({ + type: "response.output_item.added", + item: { id: messageItemId, type: "message" }, + output_index: 0, + }), + raw({ + type: "response.output_text.delta", + item_id: messageItemId, + content_index: 0, + delta: "Hello world", + }), + // Stream ends here — no content_part.done, no output_item.done. + finish("stop", 10, 5), + ]); + + const wrapped = wrapCopilotResponsesModel(stub); + const result = await wrapped.doStream(baseOptions); + const parts = await collectStream(result.stream); + + // The flush fallback must close the open text part. 
+ const textEnds = parts.filter((p) => p.type === "text-end") as Array<{ + type: "text-end"; + id: string; + }>; + expect(textEnds).toHaveLength(1); + + // Critical assertion: the id must be the external itemId, not + // the internal tracking key "${messageItemId}:0". + expect(textEnds[0]!.id).toBe(messageItemId); + expect(textEnds[0]!.id).not.toBe(`${messageItemId}:0`); + + // Verify the full lifecycle is coherent: text-start, text-delta, text-end + // all use the same external id. + const textStarts = parts.filter((p) => p.type === "text-start") as Array<{ + type: "text-start"; + id: string; + }>; + expect(textStarts).toHaveLength(1); + expect(textStarts[0]!.id).toBe(messageItemId); + + const textDeltas = parts.filter((p) => p.type === "text-delta") as Array<{ + type: "text-delta"; + id: string; + delta: string; + }>; + expect(textDeltas).toHaveLength(1); + expect(textDeltas[0]!.id).toBe(messageItemId); + expect(textDeltas[0]!.delta).toBe("Hello world"); + }); }); describe("inner semantic part suppression", () => { diff --git a/src/node/services/copilotResponsesModel.ts b/src/node/services/copilotResponsesModel.ts index 96141ad1d9..a0a24e0a6b 100644 --- a/src/node/services/copilotResponsesModel.ts +++ b/src/node/services/copilotResponsesModel.ts @@ -209,10 +209,12 @@ function createCopilotResponsesTransform( }, flush(controller) { - // Close any still-open text parts (defensive — should not happen in normal flow) - for (const [key, text] of openTexts) { + // Close any still-open text parts (defensive — should not happen in normal flow). + // Use text.itemId (the external id from text-start), NOT the internal map key + // which has the format `${itemId}:${contentIndex}`. 
+ for (const [, text] of openTexts) { if (text.started) { - controller.enqueue({ type: "text-end", id: key }); + controller.enqueue({ type: "text-end", id: text.itemId }); } } openTexts.clear(); From 8438b53c732569663b8e6f3b0e0a59ba90bf510a Mon Sep 17 00:00:00 2001 From: Soeren Magnus Olesen Date: Sun, 15 Mar 2026 21:34:54 +0100 Subject: [PATCH 09/11] fix: remove unnecessary non-null assertions in copilotResponsesModel test The `as Array<...>` casts already narrow the element type, making the `!.` postfix assertions redundant. ESLint's @typescript-eslint/no-unnecessary-type-assertion flagged 5 occurrences. --- .../services/__tests__/copilotResponsesModel.test.ts | 10 +++++----- 1 file changed, 5 insertions(+), 5 deletions(-) diff --git a/src/node/services/__tests__/copilotResponsesModel.test.ts b/src/node/services/__tests__/copilotResponsesModel.test.ts index ac24aad7fc..1064b90c04 100644 --- a/src/node/services/__tests__/copilotResponsesModel.test.ts +++ b/src/node/services/__tests__/copilotResponsesModel.test.ts @@ -244,8 +244,8 @@ describe("wrapCopilotResponsesModel", () => { // Critical assertion: the id must be the external itemId, not // the internal tracking key "${messageItemId}:0". - expect(textEnds[0]!.id).toBe(messageItemId); - expect(textEnds[0]!.id).not.toBe(`${messageItemId}:0`); + expect(textEnds[0].id).toBe(messageItemId); + expect(textEnds[0].id).not.toBe(`${messageItemId}:0`); // Verify the full lifecycle is coherent: text-start, text-delta, text-end // all use the same external id. 
@@ -254,7 +254,7 @@ describe("wrapCopilotResponsesModel", () => { id: string; }>; expect(textStarts).toHaveLength(1); - expect(textStarts[0]!.id).toBe(messageItemId); + expect(textStarts[0].id).toBe(messageItemId); const textDeltas = parts.filter((p) => p.type === "text-delta") as Array<{ type: "text-delta"; @@ -262,8 +262,8 @@ describe("wrapCopilotResponsesModel", () => { delta: string; }>; expect(textDeltas).toHaveLength(1); - expect(textDeltas[0]!.id).toBe(messageItemId); - expect(textDeltas[0]!.delta).toBe("Hello world"); + expect(textDeltas[0].id).toBe(messageItemId); + expect(textDeltas[0].delta).toBe("Hello world"); }); }); From bd94b30e34f60b4f7a443d8b6bc7a61a58ed6447 Mon Sep 17 00:00:00 2001 From: Soeren Magnus Olesen Date: Sun, 15 Mar 2026 23:42:13 +0100 Subject: [PATCH 10/11] fix: address review findings on Copilot Responses adapter - Fix P1 regression: getModelCapabilities now merges across all matching lookup keys instead of returning on first match. Provider-scoped entries still take priority, but bare-model entries fill in missing capabilities (e.g. supports_pdf_input for github-copilot:gpt-4o). getSupportedEndpoints keeps first-match-wins since endpoint restrictions must not be diluted by bare-model data. - Fix P2: text stream parts now use composite id (itemId:contentIndex) instead of bare itemId. Each content part gets a unique identity so DevTools middleware can track them independently without overwrites. - Fix P3: clarify getSupportedEndpoints docstring to cover both "no metadata" and "metadata lacks endpoint info" null cases. 
Co-Authored-By: Claude Opus 4.6 --- src/common/utils/ai/modelCapabilities.test.ts | 9 +++++ src/common/utils/ai/modelCapabilities.ts | 25 +++++++++----- .../__tests__/copilotResponsesModel.test.ts | 34 ++++++++++++------- src/node/services/copilotResponsesModel.ts | 34 ++++++++++--------- 4 files changed, 65 insertions(+), 37 deletions(-) diff --git a/src/common/utils/ai/modelCapabilities.test.ts b/src/common/utils/ai/modelCapabilities.test.ts index 2eb3c92e3a..d665ae7c92 100644 --- a/src/common/utils/ai/modelCapabilities.test.ts +++ b/src/common/utils/ai/modelCapabilities.test.ts @@ -56,6 +56,15 @@ describe("getModelCapabilities", () => { it("returns null for unknown models", () => { expect(getModelCapabilities("anthropic:this-model-does-not-exist")).toBeNull(); }); + + it("inherits bare-model capabilities when provider-scoped entry omits them", () => { + // github_copilot/gpt-4o in models.json lacks supports_pdf_input, + // but bare gpt-4o has it. The merge-across-keys strategy must fill + // in the missing field from the bare model. + const caps = getModelCapabilities("github-copilot:gpt-4o"); + expect(caps).not.toBeNull(); + expect(caps?.supportsPdfInput).toBe(true); + }); }); describe("getSupportedInputMediaTypes", () => { diff --git a/src/common/utils/ai/modelCapabilities.ts b/src/common/utils/ai/modelCapabilities.ts index 24e9bcb11d..f919a5cfa6 100644 --- a/src/common/utils/ai/modelCapabilities.ts +++ b/src/common/utils/ai/modelCapabilities.ts @@ -95,20 +95,29 @@ export function getModelCapabilities(modelString: string): ModelCapabilities | n const modelsExtraRecord = modelsExtra as unknown as Record; const modelsDataRecord = modelsData as unknown as Record; - // Merge models.json (upstream) + models-extra.ts (local overrides). Extras win. - // This avoids wiping capabilities (e.g. PDF support) when modelsExtra only overrides - // pricing/token limits. 
+ // Merge across ALL matching lookup keys so provider-scoped entries (first + // in lookup order) override specific fields while bare-model entries fill + // in capabilities the provider-scoped entry omits (e.g. github_copilot/gpt-4o + // lacks supports_pdf_input but bare gpt-4o has it). + // Within each key, modelsExtra wins over modelsData (upstream). + let merged: RawModelCapabilitiesData | null = null; for (const key of lookupKeys) { const base = modelsDataRecord[key]; const extra = modelsExtraRecord[key]; if (base || extra) { - const merged: RawModelCapabilitiesData = { ...(base ?? {}), ...(extra ?? {}) }; - return extractModelCapabilities(merged); + const keyData: RawModelCapabilitiesData = Object.assign({}, base ?? {}, extra ?? {}); + if (merged != null) { + // Earlier keys (provider-scoped) take priority; later keys (bare model) + // fill gaps but don't override. + merged = Object.assign({}, keyData, merged); + } else { + merged = keyData; + } } } - return null; + return merged ? extractModelCapabilities(merged) : null; } export function getModelCapabilitiesResolved( @@ -137,8 +146,8 @@ export function getSupportedInputMediaTypes( * Resolve supported API endpoints for a model string from static metadata. * * Returns the `supported_endpoints` array (e.g. `["/v1/responses"]`) when - * found in models-extra or models.json, or `null` when no metadata exists. - * Follows the same lookup-key + merge strategy as `getModelCapabilities`. + * found in models-extra or models.json, or `null` when no metadata exists + * or the metadata lacks endpoint information. 
*/ export function getSupportedEndpoints(modelString: string): string[] | null { const normalized = normalizeToCanonical(modelString); diff --git a/src/node/services/__tests__/copilotResponsesModel.test.ts b/src/node/services/__tests__/copilotResponsesModel.test.ts index 1064b90c04..68de7beef5 100644 --- a/src/node/services/__tests__/copilotResponsesModel.test.ts +++ b/src/node/services/__tests__/copilotResponsesModel.test.ts @@ -207,12 +207,11 @@ describe("wrapCopilotResponsesModel", () => { expect(deltas.map((d) => d.delta)).toContain(" text"); }); - // Regression: flush() used to emit text-end with the internal map key - // (`${itemId}:${contentIndex}`) instead of the external itemId, producing - // "text part :0 not found" errors when the stream ended with an - // open text part (no content_part.done / output_item.done received). - it("flush emits text-end with the external itemId, not the internal key", async () => { + // Regression: flush() must emit text-end with the same composite id used + // by text-start, so downstream consumers (e.g. DevTools) can match them. + it("flush emits text-end with the same composite id as text-start", async () => { const messageItemId = "msg_flush_regression"; + const expectedId = `${messageItemId}:0`; // Stream that opens a text part but never closes it — no content_part.done // or output_item.done, just a finish event followed by stream close. const stub = createStubModel([ @@ -241,20 +240,16 @@ describe("wrapCopilotResponsesModel", () => { id: string; }>; expect(textEnds).toHaveLength(1); - - // Critical assertion: the id must be the external itemId, not - // the internal tracking key "${messageItemId}:0". - expect(textEnds[0].id).toBe(messageItemId); - expect(textEnds[0].id).not.toBe(`${messageItemId}:0`); + expect(textEnds[0].id).toBe(expectedId); // Verify the full lifecycle is coherent: text-start, text-delta, text-end - // all use the same external id. + // all use the same composite id. 
const textStarts = parts.filter((p) => p.type === "text-start") as Array<{ type: "text-start"; id: string; }>; expect(textStarts).toHaveLength(1); - expect(textStarts[0].id).toBe(messageItemId); + expect(textStarts[0].id).toBe(expectedId); const textDeltas = parts.filter((p) => p.type === "text-delta") as Array<{ type: "text-delta"; @@ -262,7 +257,7 @@ describe("wrapCopilotResponsesModel", () => { delta: string; }>; expect(textDeltas).toHaveLength(1); - expect(textDeltas[0].id).toBe(messageItemId); + expect(textDeltas[0].id).toBe(expectedId); expect(textDeltas[0].delta).toBe("Hello world"); }); }); @@ -642,11 +637,24 @@ describe("wrapCopilotResponsesModel", () => { "finish", ]); + // Each content index gets a unique composite id so downstream consumers + // (e.g. DevTools) can track them independently. + const textStarts = parts.filter((p) => p.type === "text-start") as Array<{ + type: "text-start"; + id: string; + }>; + expect(textStarts[0].id).toBe(`${messageItemId}:0`); + expect(textStarts[1].id).toBe(`${messageItemId}:1`); + const deltas = parts.filter((p) => p.type === "text-delta") as Array<{ type: "text-delta"; + id: string; delta: string; }>; expect(deltas.map((d) => d.delta)).toEqual(["Hello", " world"]); + // Deltas for content_index 1 + expect(deltas[0].id).toBe(`${messageItemId}:1`); + expect(deltas[1].id).toBe(`${messageItemId}:1`); }); it("content_part.added emits text-start and initial delta when part carries text", async () => { diff --git a/src/node/services/copilotResponsesModel.ts b/src/node/services/copilotResponsesModel.ts index a0a24e0a6b..139c9d82f4 100644 --- a/src/node/services/copilotResponsesModel.ts +++ b/src/node/services/copilotResponsesModel.ts @@ -156,7 +156,8 @@ const SUPPRESSED_INNER_TYPES = new Set([ // --------------------------------------------------------------------------- interface OpenTextPart { - itemId: string; + /** Composite id emitted on text-start/delta/end (`${itemId}:${contentIndex}`). 
*/ + externalId: string; started: boolean; /** Accumulated text from deltas, used for reconciliation in output_text.done. */ accum: string; @@ -210,11 +211,9 @@ function createCopilotResponsesTransform( flush(controller) { // Close any still-open text parts (defensive — should not happen in normal flow). - // Use text.itemId (the external id from text-start), NOT the internal map key - // which has the format `${itemId}:${contentIndex}`. for (const [, text] of openTexts) { if (text.started) { - controller.enqueue({ type: "text-end", id: text.itemId }); + controller.enqueue({ type: "text-end", id: text.externalId }); } } openTexts.clear(); @@ -273,9 +272,12 @@ function createCopilotResponsesTransform( if (itemType === "message") { // A message item can have multiple content parts, but typically starts // with index 0. We emit text-start eagerly here — the SDK does the same. + // Use composite key as the external id so each content part gets a + // unique identity (prevents DevTools from overwriting accumulated text + // when multiple content indices share the same itemId). const key = `${itemId}:${getContentIndex(ev)}`; - openTexts.set(key, { itemId, started: true, accum: "" }); - controller.enqueue({ type: "text-start", id: itemId }); + openTexts.set(key, { externalId: key, started: true, accum: "" }); + controller.enqueue({ type: "text-start", id: key }); } else if (itemType === "function_call") { const item = ev.item as Record; const callId = typeof item.call_id === "string" ? 
item.call_id : itemId; @@ -311,15 +313,15 @@ function createCopilotResponsesTransform( // Ensure text-start was emitted (defensive against out-of-order events) if (!openTexts.has(key)) { - openTexts.set(key, { itemId, started: true, accum: "" }); - controller.enqueue({ type: "text-start", id: itemId }); + openTexts.set(key, { externalId: key, started: true, accum: "" }); + controller.enqueue({ type: "text-start", id: key }); } const delta = getDelta(ev); if (delta.length > 0) { const text = openTexts.get(key)!; text.accum += delta; - controller.enqueue({ type: "text-delta", id: itemId, delta }); + controller.enqueue({ type: "text-delta", id: text.externalId, delta }); } } @@ -343,8 +345,8 @@ function createCopilotResponsesTransform( const key = `${itemId}:${contentIndex}`; if (!openTexts.has(key)) { - openTexts.set(key, { itemId, started: true, accum: "" }); - controller.enqueue({ type: "text-start", id: itemId }); + openTexts.set(key, { externalId: key, started: true, accum: "" }); + controller.enqueue({ type: "text-start", id: key }); } // Some servers include initial text inline in the content_part.added event @@ -352,7 +354,7 @@ function createCopilotResponsesTransform( if (initialText && initialText.length > 0) { const text = openTexts.get(key)!; text.accum += initialText; - controller.enqueue({ type: "text-delta", id: itemId, delta: initialText }); + controller.enqueue({ type: "text-delta", id: text.externalId, delta: initialText }); } } @@ -376,7 +378,7 @@ function createCopilotResponsesTransform( // Emit any trailing text that the deltas missed const trailing = finalText.slice(text.accum.length); text.accum = finalText; - controller.enqueue({ type: "text-delta", id: itemId, delta: trailing }); + controller.enqueue({ type: "text-delta", id: text.externalId, delta: trailing }); } } @@ -396,7 +398,7 @@ function createCopilotResponsesTransform( const text = openTexts.get(key); if (text?.started) { - controller.enqueue({ type: "text-end", id: itemId }); + 
controller.enqueue({ type: "text-end", id: text.externalId }); openTexts.delete(key); } } @@ -459,8 +461,8 @@ function createCopilotResponsesTransform( if (itemType === "message") { // Fallback: close any text parts that content_part.done did not already close for (const [key, text] of openTexts) { - if (text.itemId === itemId && text.started) { - controller.enqueue({ type: "text-end", id: itemId }); + if (text.externalId.startsWith(`${itemId}:`) && text.started) { + controller.enqueue({ type: "text-end", id: text.externalId }); openTexts.delete(key); } } From f138fc942bf6bf71367ad12b6093196fce3d0bb3 Mon Sep 17 00:00:00 2001 From: Soeren Magnus Olesen Date: Mon, 16 Mar 2026 07:15:42 +0100 Subject: [PATCH 11/11] fix: normalize oversized tool call IDs for OpenAI Responses API OpenAI's Responses API rejects call_id values longer than 64 chars. Tool call IDs from other providers or internal systems can exceed this limit when replayed through convertToModelMessages(). Add request-time normalization in the message pipeline that: - Scans ModelMessages for tool-call and tool-result parts with IDs >64 chars - Rewrites them deterministically using SHA-256 hashing (call_ prefix + 59 hex chars) - Ensures paired tool-call/tool-result parts stay matched - Does not mutate persisted history (request-only transform) The normalization runs after sanitizeAssistantModelMessages() and before provider-specific transforms, covering all providers uniformly. 
--- src/node/services/messagePipeline.ts | 17 +- .../messages/normalizeToolCallIds.test.ts | 188 ++++++++++++++++++ .../utils/messages/normalizeToolCallIds.ts | 109 ++++++++++ 3 files changed, 309 insertions(+), 5 deletions(-) create mode 100644 src/node/utils/messages/normalizeToolCallIds.test.ts create mode 100644 src/node/utils/messages/normalizeToolCallIds.ts diff --git a/src/node/services/messagePipeline.ts b/src/node/services/messagePipeline.ts index 4b0cedd893..7db9790922 100644 --- a/src/node/services/messagePipeline.ts +++ b/src/node/services/messagePipeline.ts @@ -29,6 +29,7 @@ import { injectPostCompactionAttachments, } from "@/browser/utils/messages/modelMessageTransform"; import { applyCacheControl, type AnthropicCacheTtl } from "@/common/utils/ai/cacheStrategy"; +import { normalizeToolCallIds } from "@/node/utils/messages/normalizeToolCallIds"; import { log } from "./log"; /** Options for the full message preparation pipeline. */ @@ -81,9 +82,10 @@ export interface PrepareMessagesOptions { * 10. Rewriting data-URI file parts to SDK-safe inline base64 * 11. Converting to Vercel AI SDK ModelMessage format * 12. Self-healing: filtering empty/whitespace assistant messages - * 13. Applying provider-specific message transforms - * 14. Applying cache control headers - * 15. Validating Anthropic compliance (logs warnings only) + * 13. Normalizing oversized tool call IDs (>64 chars) for OpenAI compatibility + * 14. Applying provider-specific message transforms + * 15. Applying cache control headers + * 16. 
Validating Anthropic compliance (logs warnings only) */ export async function prepareMessagesForProvider( opts: PrepareMessagesOptions @@ -184,10 +186,15 @@ export async function prepareMessagesForProvider( const modelMessages = sanitizeAssistantModelMessages(rawModelMessages, workspaceId); - log.debug_obj(`${workspaceId}/2_model_messages.json`, modelMessages); + // Normalize oversized tool call IDs (>64 chars) that would be rejected by + // OpenAI's Responses API. Uses deterministic hashing so paired tool-call and + // tool-result parts stay matched. Request-only — does not mutate history. + const normalizedMessages = normalizeToolCallIds(modelMessages); + + log.debug_obj(`${workspaceId}/2_model_messages.json`, normalizedMessages); // Apply ModelMessage transforms based on provider requirements - const transformedMessages = transformModelMessages(modelMessages, providerForMessages, { + const transformedMessages = transformModelMessages(normalizedMessages, providerForMessages, { anthropicThinkingEnabled: providerForMessages === "anthropic" && effectiveThinkingLevel !== "off", }); diff --git a/src/node/utils/messages/normalizeToolCallIds.test.ts b/src/node/utils/messages/normalizeToolCallIds.test.ts new file mode 100644 index 0000000000..13c54d8dfc --- /dev/null +++ b/src/node/utils/messages/normalizeToolCallIds.test.ts @@ -0,0 +1,188 @@ +import { describe, it, expect } from "bun:test"; +import type { ModelMessage } from "ai"; +import { normalizeToolCallIds, shortenToolCallId } from "./normalizeToolCallIds"; + +/** Helper: a string of exactly `n` characters.
*/ +function makeId(n: number, prefix = "call_"): string { + return prefix + "x".repeat(Math.max(0, n - prefix.length)); +} + +describe("shortenToolCallId", () => { + it("returns a string of exactly 64 characters", () => { + const result = shortenToolCallId("a".repeat(100)); + expect(result.length).toBe(64); + }); + + it("starts with call_ prefix", () => { + const result = shortenToolCallId("something-very-long"); + expect(result.startsWith("call_")).toBe(true); + }); + + it("is deterministic — same input gives same output", () => { + const longId = "x".repeat(200); + expect(shortenToolCallId(longId)).toBe(shortenToolCallId(longId)); + }); + + it("produces different outputs for different inputs", () => { + const a = shortenToolCallId("a".repeat(100)); + const b = shortenToolCallId("b".repeat(100)); + expect(a).not.toBe(b); + }); +}); + +describe("normalizeToolCallIds", () => { + const shortId = makeId(64); // exactly at the limit — should NOT be rewritten + const longId = makeId(65); // one over the limit — should be rewritten + const veryLongId = makeId(200); // well over the limit + + it("returns the same array reference when no IDs exceed 64 chars", () => { + const messages: ModelMessage[] = [ + { + role: "assistant", + content: [{ type: "tool-call", toolCallId: shortId, toolName: "bash", input: {} }], + }, + { + role: "tool", + content: [ + { + type: "tool-result", + toolCallId: shortId, + toolName: "bash", + output: { type: "text" as const, value: "ok" }, + }, + ], + }, + ]; + + const result = normalizeToolCallIds(messages); + // Same reference means no unnecessary cloning + expect(result).toBe(messages); + }); + + it("rewrites oversized IDs in both tool-call and tool-result parts", () => { + const messages: ModelMessage[] = [ + { + role: "assistant", + content: [{ type: "tool-call", toolCallId: longId, toolName: "bash", input: {} }], + }, + { + role: "tool", + content: [ + { + type: "tool-result", + toolCallId: longId, + toolName: "bash", + output: { type: 
"text" as const, value: "ok" }, + }, + ], + }, + ]; + + const result = normalizeToolCallIds(messages); + + // Both should have the same normalized ID + const assistantContent = result[0].content as Array<{ toolCallId: string }>; + const toolContent = result[1].content as Array<{ toolCallId: string }>; + + expect(assistantContent[0].toolCallId.length).toBeLessThanOrEqual(64); + expect(toolContent[0].toolCallId.length).toBeLessThanOrEqual(64); + expect(assistantContent[0].toolCallId).toBe(toolContent[0].toolCallId); + }); + + it("preserves IDs that are within the limit alongside oversized ones", () => { + const messages: ModelMessage[] = [ + { + role: "assistant", + content: [ + { type: "tool-call", toolCallId: shortId, toolName: "bash", input: {} }, + { type: "tool-call", toolCallId: veryLongId, toolName: "edit", input: {} }, + ], + }, + { + role: "tool", + content: [ + { + type: "tool-result", + toolCallId: shortId, + toolName: "bash", + output: { type: "text" as const, value: "ok" }, + }, + ], + }, + { + role: "tool", + content: [ + { + type: "tool-result", + toolCallId: veryLongId, + toolName: "edit", + output: { type: "text" as const, value: "done" }, + }, + ], + }, + ]; + + const result = normalizeToolCallIds(messages); + + const assistantContent = result[0].content as Array<{ toolCallId: string }>; + const toolContent0 = result[1].content as Array<{ toolCallId: string }>; + const toolContent1 = result[2].content as Array<{ toolCallId: string }>; + + // Short ID untouched + expect(assistantContent[0].toolCallId).toBe(shortId); + expect(toolContent0[0].toolCallId).toBe(shortId); + + // Long ID rewritten + expect(assistantContent[1].toolCallId).not.toBe(veryLongId); + expect(assistantContent[1].toolCallId.length).toBeLessThanOrEqual(64); + // Paired result matches + expect(toolContent1[0].toolCallId).toBe(assistantContent[1].toolCallId); + }); + + it("does not mutate original messages", () => { + const originalCallId = longId; + const messages: ModelMessage[] = [ 
+ { + role: "assistant", + content: [{ type: "tool-call", toolCallId: originalCallId, toolName: "bash", input: {} }], + }, + { + role: "tool", + content: [ + { + type: "tool-result", + toolCallId: originalCallId, + toolName: "bash", + output: { type: "text" as const, value: "ok" }, + }, + ], + }, + ]; + + normalizeToolCallIds(messages); + + // Original messages untouched + const assistantContent = messages[0].content as Array<{ toolCallId: string }>; + const toolContent = messages[1].content as Array<{ toolCallId: string }>; + expect(assistantContent[0].toolCallId).toBe(originalCallId); + expect(toolContent[0].toolCallId).toBe(originalCallId); + }); + + it("passes through non-assistant/tool messages unchanged", () => { + const userMsg: ModelMessage = { role: "user", content: [{ type: "text", text: "hello" }] }; + const systemMsg: ModelMessage = { role: "system", content: "system prompt" }; + + const messages: ModelMessage[] = [userMsg, systemMsg]; + const result = normalizeToolCallIds(messages); + + expect(result[0]).toBe(userMsg); + expect(result[1]).toBe(systemMsg); + }); + + it("handles assistant messages with string content (no tool calls)", () => { + const messages: ModelMessage[] = [{ role: "assistant", content: "just text" }]; + + const result = normalizeToolCallIds(messages); + expect(result).toBe(messages); + }); +}); diff --git a/src/node/utils/messages/normalizeToolCallIds.ts b/src/node/utils/messages/normalizeToolCallIds.ts new file mode 100644 index 0000000000..2319fbb26f --- /dev/null +++ b/src/node/utils/messages/normalizeToolCallIds.ts @@ -0,0 +1,109 @@ +/** + * Normalize oversized tool call IDs in ModelMessages. + * + * OpenAI's Responses API rejects `call_id` values longer than 64 characters. + * Tool call IDs generated by other providers (or by internal systems) can exceed + * this limit. This module rewrites them deterministically so that paired + * tool-call and tool-result parts still match after normalization. 
+ * + * Applied request-only — does not mutate persisted history. + */ + +import { createHash } from "node:crypto"; +import type { ModelMessage } from "ai"; + +/** OpenAI's maximum allowed length for tool call IDs. */ +const MAX_TOOL_CALL_ID_LENGTH = 64; + +/** + * Prefix for normalized IDs so they're recognizable in debug logs. + * "call_" (5 chars) + 59 chars of hash = 64 chars total. + */ +const NORMALIZED_PREFIX = "call_"; +const HASH_LENGTH = MAX_TOOL_CALL_ID_LENGTH - NORMALIZED_PREFIX.length; + +/** + * Deterministically shorten a tool call ID to fit within the 64-char limit. + * Uses SHA-256 (hex) truncated to fill the available space after the prefix. + * The same input always produces the same output, so paired tool-call and + * tool-result parts will agree on the normalized value. + */ +export function shortenToolCallId(id: string): string { + const hash = createHash("sha256").update(id).digest("hex"); + return `${NORMALIZED_PREFIX}${hash.slice(0, HASH_LENGTH)}`; +} + +/** + * Build a mapping from oversized tool call IDs to their normalized forms. + * Scans all assistant (tool-call) and tool (tool-result) messages once to + * collect every ID that exceeds the limit. + */ +function buildIdMapping(messages: ModelMessage[]): Map { + const oversizedIds = new Set(); + + for (const msg of messages) { + if (msg.role === "assistant" && Array.isArray(msg.content)) { + for (const part of msg.content) { + if (part.type === "tool-call" && part.toolCallId.length > MAX_TOOL_CALL_ID_LENGTH) { + oversizedIds.add(part.toolCallId); + } + } + } else if (msg.role === "tool") { + for (const part of msg.content) { + if (part.type === "tool-result" && part.toolCallId.length > MAX_TOOL_CALL_ID_LENGTH) { + oversizedIds.add(part.toolCallId); + } + } + } + } + + const mapping = new Map(); + for (const id of oversizedIds) { + mapping.set(id, shortenToolCallId(id)); + } + return mapping; +} + +/** + * Rewrite oversized tool call IDs in the given ModelMessages. 
+ * + * Returns a new array (shallow copy) with only the affected parts cloned and + * rewritten. Messages without oversized IDs are passed through unchanged. + * + * This is a request-only transform — it does not mutate the original messages + * or persisted history. + */ +export function normalizeToolCallIds(messages: ModelMessage[]): ModelMessage[] { + const mapping = buildIdMapping(messages); + if (mapping.size === 0) { + return messages; + } + + return messages.map((msg): ModelMessage => { + if (msg.role === "assistant" && Array.isArray(msg.content)) { + let changed = false; + const newContent = msg.content.map((part) => { + if (part.type === "tool-call" && mapping.has(part.toolCallId)) { + changed = true; + return { ...part, toolCallId: mapping.get(part.toolCallId)! }; + } + return part; + }); + return changed ? { ...msg, content: newContent } : msg; + } + + if (msg.role === "tool") { + let changed = false; + const newContent = msg.content.map((part) => { + if (part.type === "tool-result" && mapping.has(part.toolCallId)) { + changed = true; + return { ...part, toolCallId: mapping.get(part.toolCallId)! }; + } + return part; + }); + return changed ? { ...msg, content: newContent } : msg; + } + + return msg; + }); +}