Fix auto model for engine (#2170)

> [!NOTE]
> Fixes auto/local-agent model routing and provider-specific behavior.
>
> - Refactors `llm_engine_provider` to require `chatParams { providerId }`; wires it into custom fetch and model constructors (`provider`, `chatModel`, `responses`)
> - Updates `get_model_client` to pass `providerId`, tag fallback models (`openai`, `anthropic`, `google`), and use `responses()` for OpenAI in `local-agent` and auto fallback
> - Adds Responses API support to fake LLM server (`/v1/responses`) with streaming SSE handler and dump generation
> - Extends test helper to parse Responses API dumps (`body.input`) and adds `localAgentUseAutoModel` setup flag
> - New e2e test `local_agent_auto.spec.ts` with snapshot verifying request payload via Responses API
>
> <sup>Written by [Cursor Bugbot](https://cursor.com/dashboard?tab=bugbot) for commit e5b02d253c9842f14da0099bb11e1b05548e9245. This will update automatically on new commits. Configure [here](https://cursor.com/dashboard?tab=bugbot).</sup>

---

## Summary by cubic

Fixes auto model selection in the Dyad engine by passing the correct providerId with each request. Ensures provider-specific options are applied and avoids incorrect defaults.

- **Bug Fixes**
  - Pass providerId to chat/responses models and into the fetch layer for getExtraProviderOptions.
  - Remove originalProviderId from createDyadEngine; add ChatParams and update provider API signatures.
  - Tag fallback models with providerId (openai, anthropic, google) and forward model.provider in getModelClient.

<sup>Written for commit e5b02d253c9842f14da0099bb11e1b05548e9245. Summary will update on new commits.</sup>

Fix auto model for engine (#2170)
759c60f2 · Will Chen · GitHub · be7b6977 · 759c60f2 · 759c60f2
--- a/e2e-tests/helpers/test_helper.ts
+++ b/e2e-tests/helpers/test_helper.ts
@@ -315,7 +315,12 @@ export class PageObject {
  async setUpDyadPro({
    autoApprove = false,
    localAgent = false,
-  }: { autoApprove?: boolean; localAgent?: boolean } = {}) {
+    localAgentUseAutoModel = false,
+  }: {
+    autoApprove?: boolean;
+    localAgent?: boolean;
+    localAgentUseAutoModel?: boolean;
+  } = {}) {
    await this.baseSetup();
    await this.goToSettingsTab();
    if (autoApprove) {
@@ -328,7 +333,7 @@ export class PageObject {
    await this.goToAppsTab();
    // Select a non-openAI model for local agent mode,
    // since openAI models go to the responses API.
-    if (localAgent) {
+    if (localAgent && !localAgentUseAutoModel) {
      await this.selectModel({
        provider: "Anthropic",
        model: "Claude Opus 4.5",
@@ -800,6 +805,17 @@ export class PageObject {
    // Perform snapshot comparison
    const parsedDump = JSON.parse(dumpContent);
    if (type === "request") {
+      if (parsedDump["body"]["input"]) {
+        parsedDump["body"]["input"] = parsedDump["body"]["input"].map(
+          (input: any) => {
+            if (input.role === "system") {
+              input.content = "[[SYSTEM_MESSAGE]]";
+            }
+            return input;
+          },
+        );
+      }
+      if (parsedDump["body"]["messages"]) {
        parsedDump["body"]["messages"] = parsedDump["body"]["messages"].map(
          (message: any) => {
            if (message.role === "system") {
@@ -808,6 +824,7 @@ export class PageObject {
            return message;
          },
        );
+      }
      // Normalize fileIds to be deterministic based on content
      normalizeVersionedFiles(parsedDump);
      expect(
@@ -816,9 +833,15 @@ export class PageObject {
      return;
    }
    expect(
-      prettifyDump(parsedDump["body"]["messages"], {
+      prettifyDump(
+        // responses API
+        parsedDump["body"]["input"] ??
+          // chat completion API
+          parsedDump["body"]["messages"],
+        {
          onlyLastMessage: type === "last-message",
-      }),
+        },
+      ),
    ).toMatchSnapshot(name);
  }


--- a/e2e-tests/local_agent_auto.spec.ts
+++ b/e2e-tests/local_agent_auto.spec.ts
+import { testSkipIfWindows } from "./helpers/test_helper";
+
+testSkipIfWindows("local-agent - auto model", async ({ po }) => {
+  await po.setUpDyadPro({ localAgent: true, localAgentUseAutoModel: true });
+  await po.importApp("minimal");
+  await po.selectLocalAgentMode();
+
+  await po.sendPrompt("[dump]");
+  await po.snapshotServerDump("request");
+});
--- a/e2e-tests/snapshots/local_agent_auto.spec.ts_local-agent---auto-model-1.txt
+++ b/e2e-tests/snapshots/local_agent_auto.spec.ts_local-agent---auto-model-1.txt
--- a/src/ipc/utils/get_model_client.ts
+++ b/src/ipc/utils/get_model_client.ts
@@ -91,7 +91,6 @@ export async function getModelClient(
      const provider = createDyadEngine({
        apiKey: dyadApiKey,
        baseURL: dyadEngineUrl ?? "https://engine.dyad.sh/v1",
-        originalProviderId: model.provider,
        dyadOptions: {
          enableLazyEdits:
            settings.selectedChatMode === "ask"
@@ -214,12 +213,13 @@ function getProModelClient({
      model: createFallback({
        models: [
          // openai requires no prefix.
-          provider.responses(`${GPT_5_2_MODEL_NAME}`),
-          provider(`anthropic/${SONNET_4_5}`),
-          provider(`gemini/${GEMINI_3_FLASH}`),
+          provider.responses(`${GPT_5_2_MODEL_NAME}`, { providerId: "openai" }),
+          provider(`anthropic/${SONNET_4_5}`, { providerId: "anthropic" }),
+          provider(`gemini/${GEMINI_3_FLASH}`, { providerId: "google" }),
        ],
      }),
      // Using openAI as the default provider.
+      // TODO: we should remove this and rely on the provider id passed into the provider().
      builtinProviderId: "openai",
    };
  }
@@ -228,12 +228,12 @@ function getProModelClient({
    model.provider === "openai"
  ) {
    return {
-      model: provider.responses(modelId),
+      model: provider.responses(modelId, { providerId: model.provider }),
      builtinProviderId: model.provider,
    };
  }
  return {
-    model: provider(modelId),
+    model: provider(modelId, { providerId: model.provider }),
    builtinProviderId: model.provider,
  };
 }

--- a/src/ipc/utils/llm_engine_provider.ts
+++ b/src/ipc/utils/llm_engine_provider.ts
@@ -14,7 +14,9 @@ import type { LanguageModel } from "ai";
 const logger = log.scope("llm_engine_provider");

 export type ExampleChatModelId = string & {};
-export interface ExampleChatSettings {}
+export interface ChatParams {
+  providerId: string;
+}
 export interface ExampleProviderSettings {
  /**
 Example API key.
@@ -38,7 +40,6 @@ or to provide a custom fetch implementation for e.g. testing.
 */
  fetch?: FetchFunction;

-  originalProviderId: string;
  dyadOptions: {
    enableLazyEdits?: boolean;
    enableSmartFilesContext?: boolean;
@@ -51,17 +52,14 @@ export interface DyadEngineProvider {
  /**
 Creates a model for text generation.
 */
-  (modelId: ExampleChatModelId, settings?: ExampleChatSettings): LanguageModel;
+  (modelId: ExampleChatModelId, chatParams: ChatParams): LanguageModel;

  /**
 Creates a chat model for text generation.
 */
-  chatModel(
-    modelId: ExampleChatModelId,
-    settings?: ExampleChatSettings,
-  ): LanguageModel;
+  chatModel(modelId: ExampleChatModelId, chatParams: ChatParams): LanguageModel;

-  responses(modelId: ExampleChatModelId): LanguageModel;
+  responses(modelId: ExampleChatModelId, chatParams: ChatParams): LanguageModel;
 }

 export function createDyadEngine(
@@ -103,7 +101,11 @@ export function createDyadEngine(
  });

  // Custom fetch implementation that adds dyad-specific options to the request
-  const createDyadFetch = (): FetchFunction => {
+  const createDyadFetch = ({
+    providerId,
+  }: {
+    providerId: string;
+  }): FetchFunction => {
    return (input: RequestInfo | URL, init?: RequestInit) => {
      // Use default fetch if no init or body
      if (!init || !init.body || typeof init.body !== "string") {
@@ -114,10 +116,7 @@ export function createDyadEngine(
        // Parse the request body to manipulate it
        const parsedBody = {
          ...JSON.parse(init.body),
-          ...getExtraProviderOptions(
-            options.originalProviderId,
-            options.settings,
-          ),
+          ...getExtraProviderOptions(providerId, options.settings),
        };
        const dyadVersionedFiles = parsedBody.dyadVersionedFiles;
        if ("dyadVersionedFiles" in parsedBody) {
@@ -195,25 +194,32 @@ export function createDyadEngine(
    };
  };

-  const createChatModel = (modelId: ExampleChatModelId) => {
+  const createChatModel = (
+    modelId: ExampleChatModelId,
+    chatParams: ChatParams,
+  ) => {
    const config = {
      ...getCommonModelConfig(),
-      fetch: createDyadFetch(),
+      fetch: createDyadFetch({ providerId: chatParams.providerId }),
    };

    return new OpenAICompatibleChatLanguageModel(modelId, config);
  };

-  const createResponsesModel = (modelId: ExampleChatModelId) => {
+  const createResponsesModel = (
+    modelId: ExampleChatModelId,
+    chatParams: ChatParams,
+  ) => {
    const config = {
      ...getCommonModelConfig(),
-      fetch: createDyadFetch(),
+      fetch: createDyadFetch({ providerId: chatParams.providerId }),
    };

    return new OpenAIResponsesLanguageModel(modelId, config);
  };

-  const provider = (modelId: ExampleChatModelId) => createChatModel(modelId);
+  const provider = (modelId: ExampleChatModelId, chatParams: ChatParams) =>
+    createChatModel(modelId, chatParams);

  provider.chatModel = createChatModel;
  provider.responses = createResponsesModel;

--- a/testing/fake-llm-server/index.ts
+++ b/testing/fake-llm-server/index.ts
@@ -2,6 +2,7 @@ import express from "express";
 import { createServer } from "http";
 import cors from "cors";
 import { createChatCompletionHandler } from "./chatCompletionHandler";
+import { createResponsesHandler } from "./responsesHandler";
 import {
  handleDeviceCode,
  handleAccessToken,
@@ -152,6 +153,8 @@ app.get("/lmstudio/api/v0/models", (req, res) => {
    `/${provider}/v1/chat/completions`,
    createChatCompletionHandler(provider),
  );
+  // Also add responses API endpoints for each provider
+  app.post(`/${provider}/v1/responses`, createResponsesHandler(provider));
 });

 // Azure-specific endpoints (Azure client uses different URL patterns)
@@ -163,6 +166,7 @@ app.post(

 // Default test provider handler:
 app.post("/v1/chat/completions", createChatCompletionHandler("."));
+app.post("/v1/responses", createResponsesHandler("."));

 // GitHub API Mock Endpoints
 console.log("Setting up GitHub mock endpoints");

--- a/testing/fake-llm-server/responsesHandler.ts
+++ b/testing/fake-llm-server/responsesHandler.ts