@@ -49,6 +49,29 @@ import {
 } from "./types.js";
 import { wrapAnthropicClientError } from "./utils/errors.js";
 
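+// Default max output token budgets per model family, matched by model-id
+// prefix. Order matters: Object.entries preserves insertion order, so the
+// more specific "claude-opus-4-1" must come before its prefix "claude-opus-4".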
+const MODEL_DEFAULT_MAX_OUTPUT_TOKENS: Partial<
+  Record<Anthropic.Model, number>
+> = {
+  "claude-opus-4-1": 8192,
+  "claude-opus-4": 8192,
+  "claude-sonnet-4": 8192,
58+ "claude-sonnet-3-7-sonnet" : 8192 ,
59+ "claude-3-5-sonnet" : 4096 ,
60+ "claude-3-5-haiku" : 4096 ,
61+ "claude-3-haiku" : 2048 ,
62+ } ;
63+ const FALLBACK_MAX_OUTPUT_TOKENS = 2048 ;
64+
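+// Picks the default max output tokens for a model id via the first prefix
+// match in the table above; unknown or missing models get the flat fallback.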
+function defaultMaxOutputTokensForModel(model?: Anthropic.Model): number {
+  if (!model) {
+    return FALLBACK_MAX_OUTPUT_TOKENS;
+  }
+  const maxTokens = Object.entries(MODEL_DEFAULT_MAX_OUTPUT_TOKENS).find(
+    ([key]) => model.startsWith(key)
+  )?.[1];
+  return maxTokens ?? FALLBACK_MAX_OUTPUT_TOKENS;
+}
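+// For example, given the table above:
+//   defaultMaxOutputTokensForModel("claude-3-5-haiku-20241022") === 4096
+//   defaultMaxOutputTokensForModel(undefined) === 2048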
+
 export interface ChatAnthropicCallOptions
   extends BaseChatModelCallOptions,
     Pick<AnthropicInput, "streamUsage"> {
@@ -144,40 +167,36 @@ export type AnthropicMessagesModelId =
  * Input to AnthropicChat class.
  */
 export interface AnthropicInput {
-  /** Amount of randomness injected into the response. Ranges
-   * from 0 to 1. Use temp closer to 0 for analytical /
-   * multiple choice, and temp closer to 1 for creative
+  /**
+   * Amount of randomness injected into the response. Ranges
+   * from 0 to 1. Use temperature closer to 0 for analytical /
+   * multiple choice, and temperature closer to 1 for creative
    * and generative tasks.
-   * To not set this field, pass `null`. If `undefined` is passed,
-   * the default (1) will be used.
    */
-  temperature?: number | null;
+  temperature?: number;
 
-  /** Only sample from the top K options for each subsequent
+  /**
+   * Only sample from the top K options for each subsequent
    * token. Used to remove "long tail" low probability
-   * responses. Defaults to -1, which disables it.
+   * responses.
    */
   topK?: number;
 
-  /** Does nucleus sampling, in which we compute the
+  /**
+   * Does nucleus sampling, in which we compute the
    * cumulative distribution over all the options for each
    * subsequent token in decreasing probability order and
    * cut it off once it reaches a particular probability
-   * specified by top_p. Defaults to -1, which disables it.
-   * Note that you should either alter temperature or top_p,
-   * but not both.
-   *
-   * To not set this field, pass `null`. If `undefined` is passed,
-   * the default (-1) will be used.
-   *
-   * For Opus 4.1 and Sonnet 4.5, this defaults to `null`.
+   * specified by top_p. Note that you should either alter
+   * temperature or top_p, but not both.
    */
   topP?: number | null;
 
   /** A maximum number of tokens to generate before stopping. */
   maxTokens?: number;
 
-  /** A list of strings upon which to stop generating.
+  /**
+   * A list of strings upon which to stop generating.
    * You probably want `["\n\nHuman:"]`, as that's the cue for
    * the next turn in the dialog agent.
    */
@@ -304,7 +323,7 @@ function extractToken(chunk: AIMessageChunk): string | undefined {
  * import { ChatAnthropic } from '@langchain/anthropic';
  *
  * const llm = new ChatAnthropic({
- *   model: "claude-3-5-sonnet-20240620",
+ *   model: "claude-sonnet-4-5-20250929",
  *   temperature: 0,
  *   maxTokens: undefined,
  *   maxRetries: 2,
@@ -334,7 +353,7 @@ function extractToken(chunk: AIMessageChunk): string | undefined {
334353 * "content": "Here's the translation to French:\n\nJ'adore la programmation.",
335354 * "response_metadata": {
336355 * "id": "msg_01QDpd78JUHpRP6bRRNyzbW3",
337- * "model": "claude-3-5-sonnet-20240620 ",
356+ * "model": "claude-sonnet-4-5-20250929 ",
338357 * "stop_reason": "end_turn",
339358 * "stop_sequence": null,
340359 * "usage": {
@@ -372,7 +391,7 @@ function extractToken(chunk: AIMessageChunk): string | undefined {
372391 * "id": "msg_01N8MwoYxiKo9w4chE4gXUs4",
373392 * "type": "message",
374393 * "role": "assistant",
375- * "model": "claude-3-5-sonnet-20240620 "
394+ * "model": "claude-sonnet-4-5-20250929 "
376395 * },
377396 * "usage_metadata": {
378397 * "input_tokens": 25,
@@ -441,7 +460,7 @@ function extractToken(chunk: AIMessageChunk): string | undefined {
441460 * "id": "msg_01SBTb5zSGXfjUc7yQ8EKEEA",
442461 * "type": "message",
443462 * "role": "assistant",
444- * "model": "claude-3-5-sonnet-20240620 ",
463+ * "model": "claude-sonnet-4-5-20250929 ",
445464 * "stop_reason": "end_turn",
446465 * "stop_sequence": null
447466 * },
@@ -626,7 +645,7 @@ function extractToken(chunk: AIMessageChunk): string | undefined {
  * ```txt
  * {
  *   id: 'msg_01STxeQxJmp4sCSpioD6vK3L',
- *   model: 'claude-3-5-sonnet-20240620',
+ *   model: 'claude-sonnet-4-5-20250929',
  *   stop_reason: 'end_turn',
  *   stop_sequence: null,
  *   usage: { input_tokens: 25, output_tokens: 19 },
@@ -669,17 +688,17 @@ export class ChatAnthropicMessages<
 
   apiUrl?: string;
 
-  temperature: number | undefined = 1;
+  temperature?: number;
 
-  topK = -1;
+  topK?: number;
 
-  topP: number | undefined = -1;
+  topP?: number;
 
-  maxTokens = 2048;
+  maxTokens: number;
 
-  modelName = "claude-2.1";
+  modelName = "claude-3-5-sonnet-latest";
 
-  model = "claude-2.1";
+  model = "claude-3-5-sonnet-latest";
 
   invocationKwargs?: Kwargs;
 
@@ -732,21 +751,12 @@ export class ChatAnthropicMessages<
 
     this.invocationKwargs = fields?.invocationKwargs ?? {};
 
-    if (this.model.includes("opus-4-1") || this.model.includes("sonnet-4-5")) {
-      // Default to `undefined` for `topP` for Opus 4.1 models
-      this.topP = fields?.topP === null ? undefined : fields?.topP;
-    } else {
-      this.topP = fields?.topP ?? this.topP;
-    }
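+    // topP no longer gets a model-specific default; when unset it stays
+    // undefined (and is presumably omitted from the request).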
+    this.topP = fields?.topP ?? this.topP;
 
-    // If the user passes `null`, set it to `undefined`. Otherwise, use their value or the default. We have to check for null, because
-    // there's no way for us to know if they explicitly set it to `undefined`, or never passed a value
-    this.temperature =
-      fields?.temperature === null
-        ? undefined
-        : fields?.temperature ?? this.temperature;
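+    // `null` is no longer special-cased; temperature is a plain optional number.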
+    this.temperature = fields?.temperature ?? this.temperature;
     this.topK = fields?.topK ?? this.topK;
-    this.maxTokens = fields?.maxTokens ?? this.maxTokens;
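+    // The flat 2048 default is gone; fall back to a per-model default instead.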
+    this.maxTokens =
+      fields?.maxTokens ?? defaultMaxOutputTokensForModel(this.model);
     this.stopSequences = fields?.stopSequences ?? this.stopSequences;
 
     this.streaming = fields?.streaming ?? false;
@@ -847,17 +857,10 @@ export class ChatAnthropicMessages<
       | undefined = handleToolChoice(options?.tool_choice);
 
     if (this.thinking.type === "enabled") {
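+      // Extended thinking requires default sampling settings, so explicit
+      // topK/temperature overrides are rejected below.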
-      if (this.topK !== -1) {
+      if (this.topK !== undefined && this.topK !== -1) {
         throw new Error("topK is not supported when thinking is enabled");
       }
-      if (
-        this.model.includes("opus-4-1") || this.model.includes("sonnet-4-5")
-          ? this.topP !== undefined
-          : this.topP !== -1
-      ) {
-        throw new Error("topP is not supported when thinking is enabled");
-      }
-      if (this.temperature !== 1) {
+      if (this.temperature !== undefined && this.temperature !== 1) {
         throw new Error(
           "temperature is not supported when thinking is enabled"
         );
@@ -999,7 +1002,6 @@ export class ChatAnthropicMessages<
       content,
       additionalKwargs
     );
-    // eslint-disable-next-line @typescript-eslint/no-unused-vars
     const { role: _role, type: _type, ...rest } = additionalKwargs;
     return { generations, llmOutput: rest };
   }