Fixes #3849 Add Thinking Config to the Google Gen AI Module

ddobrin · ddobrin · commit 237e5d3b9bdb · 2025-07-24T21:52:18.000-04:00
Signed-off-by: ddobrin <ddobrin@google.com>
diff --git a/models/spring-ai-google-genai/src/main/java/org/springframework/ai/google/genai/GoogleGenAiChatModel.java b/models/spring-ai-google-genai/src/main/java/org/springframework/ai/google/genai/GoogleGenAiChatModel.java
@@ -38,6 +38,7 @@
 import com.google.genai.types.Part;
 import com.google.genai.types.SafetySetting;
 import com.google.genai.types.Schema;
+import com.google.genai.types.ThinkingConfig;
 import com.google.genai.types.Tool;
 import com.google.genai.types.FinishReason;
 import io.micrometer.observation.Observation;
@@ -672,6 +673,10 @@ GeminiRequest createGeminiRequest(Prompt prompt) {
 		if (requestOptions.getPresencePenalty() != null) {
 			configBuilder.presencePenalty(requestOptions.getPresencePenalty().floatValue());
 		}
+		if (requestOptions.getThinkingBudget() != null) {
+			configBuilder
+				.thinkingConfig(ThinkingConfig.builder().thinkingBudget(requestOptions.getThinkingBudget()).build());
+		}
 
 		// Add safety settings
 		if (!CollectionUtils.isEmpty(requestOptions.getSafetySettings())) {
diff --git a/models/spring-ai-google-genai/src/main/java/org/springframework/ai/google/genai/GoogleGenAiChatOptions.java b/models/spring-ai-google-genai/src/main/java/org/springframework/ai/google/genai/GoogleGenAiChatOptions.java
@@ -107,6 +107,12 @@ public class GoogleGenAiChatOptions implements ToolCallingChatOptions {
 	 */
 	private @JsonProperty("presencePenalty") Double presencePenalty;
 
+	/**
+	 * Optional. Thinking budget for the thinking process.
+	 * This is part of the thinkingConfig in GenerationConfig.
+	 */
+	private @JsonProperty("thinkingBudget") Integer thinkingBudget;
+
 	/**
 	 * Collection of {@link ToolCallback}s to be used for tool calling in the chat
 	 * completion requests.
@@ -163,6 +169,7 @@ public static GoogleGenAiChatOptions fromOptions(GoogleGenAiChatOptions fromOpti
 		options.setSafetySettings(fromOptions.getSafetySettings());
 		options.setInternalToolExecutionEnabled(fromOptions.getInternalToolExecutionEnabled());
 		options.setToolContext(fromOptions.getToolContext());
+		options.setThinkingBudget(fromOptions.getThinkingBudget());
 		return options;
 	}
 
@@ -300,6 +307,14 @@ public void setPresencePenalty(Double presencePenalty) {
 		this.presencePenalty = presencePenalty;
 	}
 
+	public Integer getThinkingBudget() {
+		return this.thinkingBudget;
+	}
+
+	public void setThinkingBudget(Integer thinkingBudget) {
+		this.thinkingBudget = thinkingBudget;
+	}
+
 	public Boolean getGoogleSearchRetrieval() {
 		return this.googleSearchRetrieval;
 	}
@@ -341,6 +356,7 @@ public boolean equals(Object o) {
 				&& Objects.equals(this.topK, that.topK) && Objects.equals(this.candidateCount, that.candidateCount)
 				&& Objects.equals(this.frequencyPenalty, that.frequencyPenalty)
 				&& Objects.equals(this.presencePenalty, that.presencePenalty)
+				&& Objects.equals(this.thinkingBudget, that.thinkingBudget)
 				&& Objects.equals(this.maxOutputTokens, that.maxOutputTokens) && Objects.equals(this.model, that.model)
 				&& Objects.equals(this.responseMimeType, that.responseMimeType)
 				&& Objects.equals(this.toolCallbacks, that.toolCallbacks)
@@ -353,20 +369,20 @@ public boolean equals(Object o) {
 	@Override
 	public int hashCode() {
 		return Objects.hash(this.stopSequences, this.temperature, this.topP, this.topK, this.candidateCount,
-				this.frequencyPenalty, this.presencePenalty, this.maxOutputTokens, this.model, this.responseMimeType,
-				this.toolCallbacks, this.toolNames, this.googleSearchRetrieval, this.safetySettings,
-				this.internalToolExecutionEnabled, this.toolContext);
+				this.frequencyPenalty, this.presencePenalty, this.thinkingBudget, this.maxOutputTokens, this.model,
+				this.responseMimeType, this.toolCallbacks, this.toolNames, this.googleSearchRetrieval,
+				this.safetySettings, this.internalToolExecutionEnabled, this.toolContext);
 	}
 
 	@Override
 	public String toString() {
 		return "GoogleGenAiChatOptions{" + "stopSequences=" + this.stopSequences + ", temperature=" + this.temperature
 				+ ", topP=" + this.topP + ", topK=" + this.topK + ", frequencyPenalty=" + this.frequencyPenalty
-				+ ", presencePenalty=" + this.presencePenalty + ", candidateCount=" + this.candidateCount
-				+ ", maxOutputTokens=" + this.maxOutputTokens + ", model='" + this.model + '\'' + ", responseMimeType='"
-				+ this.responseMimeType + '\'' + ", toolCallbacks=" + this.toolCallbacks + ", toolNames="
-				+ this.toolNames + ", googleSearchRetrieval=" + this.googleSearchRetrieval + ", safetySettings="
-				+ this.safetySettings + '}';
+				+ ", presencePenalty=" + this.presencePenalty + ", thinkingBudget=" + this.thinkingBudget
+				+ ", candidateCount=" + this.candidateCount + ", maxOutputTokens=" + this.maxOutputTokens + ", model='"
+				+ this.model + '\'' + ", responseMimeType='" + this.responseMimeType + '\'' + ", toolCallbacks="
+				+ this.toolCallbacks + ", toolNames=" + this.toolNames + ", googleSearchRetrieval="
+				+ this.googleSearchRetrieval + ", safetySettings=" + this.safetySettings + '}';
 	}
 
 	@Override
@@ -489,6 +505,11 @@ public Builder toolContext(Map<String, Object> toolContext) {
 			return this;
 		}
 
+		public Builder thinkingBudget(Integer thinkingBudget) {
+			this.options.setThinkingBudget(thinkingBudget);
+			return this;
+		}
+
 		public GoogleGenAiChatOptions build() {
 			return this.options;
 		}
diff --git a/models/spring-ai-google-genai/src/test/java/org/springframework/ai/google/genai/CreateGeminiRequestTests.java b/models/spring-ai-google-genai/src/test/java/org/springframework/ai/google/genai/CreateGeminiRequestTests.java
@@ -30,6 +30,8 @@
 
 import org.springframework.ai.chat.messages.SystemMessage;
 import org.springframework.ai.chat.messages.UserMessage;
+import org.springframework.ai.chat.metadata.ChatResponseMetadata;
+import org.springframework.ai.chat.model.ChatResponse;
 import org.springframework.ai.chat.prompt.Prompt;
 import org.springframework.ai.content.Media;
 import org.springframework.ai.model.tool.ToolCallingChatOptions;
@@ -299,4 +301,45 @@ public void createRequestWithGenerationConfigOptions() {
 		assertThat(request.config().responseMimeType().orElse("")).isEqualTo("application/json");
 	}
 
+	@Test
+	public void createRequestWithThinkingBudget() {
+
+		var client = GoogleGenAiChatModel.builder()
+			.genAiClient(this.genAiClient)
+			.defaultOptions(GoogleGenAiChatOptions.builder().model("DEFAULT_MODEL").thinkingBudget(12853).build())
+			.build();
+
+		GeminiRequest request = client
+			.createGeminiRequest(client.buildRequestPrompt(new Prompt("Test message content")));
+
+		assertThat(request.contents()).hasSize(1);
+		assertThat(request.modelName()).isEqualTo("DEFAULT_MODEL");
+
+		// Verify thinkingConfig is present and contains thinkingBudget
+		assertThat(request.config().thinkingConfig()).isPresent();
+		assertThat(request.config().thinkingConfig().get().thinkingBudget()).isPresent();
+		assertThat(request.config().thinkingConfig().get().thinkingBudget().get()).isEqualTo(12853);
+	}
+
+	@Test
+	public void createRequestWithThinkingBudgetOverride() {
+
+		var client = GoogleGenAiChatModel.builder()
+			.genAiClient(this.genAiClient)
+			.defaultOptions(GoogleGenAiChatOptions.builder().model("DEFAULT_MODEL").thinkingBudget(10000).build())
+			.build();
+
+		// Override default thinkingBudget with prompt-specific value
+		GeminiRequest request = client.createGeminiRequest(client.buildRequestPrompt(
+				new Prompt("Test message content", GoogleGenAiChatOptions.builder().thinkingBudget(25000).build())));
+
+		assertThat(request.contents()).hasSize(1);
+		assertThat(request.modelName()).isEqualTo("DEFAULT_MODEL");
+
+		// Verify prompt-specific thinkingBudget overrides default
+		assertThat(request.config().thinkingConfig()).isPresent();
+		assertThat(request.config().thinkingConfig().get().thinkingBudget()).isPresent();
+		assertThat(request.config().thinkingConfig().get().thinkingBudget().get()).isEqualTo(25000);
+	}
+
 }
diff --git a/models/spring-ai-google-genai/src/test/java/org/springframework/ai/google/genai/GoogleGenAiChatModelIT.java b/models/spring-ai-google-genai/src/test/java/org/springframework/ai/google/genai/GoogleGenAiChatModelIT.java
@@ -29,6 +29,8 @@
 import org.junit.jupiter.api.Test;
 import org.junit.jupiter.api.condition.EnabledIfEnvironmentVariable;
 
+import org.slf4j.Logger;
+import org.slf4j.LoggerFactory;
 import org.springframework.ai.chat.client.ChatClient;
 import org.springframework.ai.chat.messages.AssistantMessage;
 import org.springframework.ai.chat.messages.Message;
@@ -65,6 +67,8 @@
 @EnabledIfEnvironmentVariable(named = "GOOGLE_CLOUD_LOCATION", matches = ".*")
 class GoogleGenAiChatModelIT {
 
+	private static final Logger logger = LoggerFactory.getLogger(GoogleGenAiChatModelIT.class);
+
 	@Autowired
 	private GoogleGenAiChatModel chatModel;
 
@@ -384,6 +388,102 @@ void jsonTextToolCallingTest() {
 		assertThat(response).contains("2025-05-08T10:10:10+02:00");
 	}
 
+	@Test
+	void testThinkingBudgetGeminiProAutomaticDecisionByModel() {
+		GoogleGenAiChatModel chatModelWithThinkingBudget = GoogleGenAiChatModel.builder()
+			.genAiClient(genAiClient())
+			.defaultOptions(GoogleGenAiChatOptions.builder().model(ChatModel.GEMINI_2_5_PRO).temperature(0.1).build())
+			.build();
+
+		ChatClient chatClient = ChatClient.builder(chatModelWithThinkingBudget).build();
+
+		// No thinkingBudget is configured, so no thinkingConfig is sent with the
+		// request. Time a plain prompt; no tool calling is involved.
+		long start = System.currentTimeMillis();
+		String response = chatClient.prompt()
+			.user("Explain to me briefly how I can start a SpringAI project")
+			.call()
+			.content();
+
+		assertThat(response).isNotEmpty();
+		logger.info("Response: {} in {} ms", response, System.currentTimeMillis() - start);
+	}
+
+	@Test
+	void testThinkingBudgetGeminiProMinBudget() {
+		GoogleGenAiChatModel chatModelWithThinkingBudget = GoogleGenAiChatModel.builder()
+			.genAiClient(genAiClient())
+			.defaultOptions(GoogleGenAiChatOptions.builder()
+				.model(ChatModel.GEMINI_2_5_PRO)
+				.temperature(0.1)
+				.thinkingBudget(128)
+				.build())
+			.build();
+
+		ChatClient chatClient = ChatClient.builder(chatModelWithThinkingBudget).build();
+
+		// Time a plain prompt sent with thinkingBudget set to 128; no tool calling is
+		// involved.
+		long start = System.currentTimeMillis();
+		String response = chatClient.prompt()
+			.user("Explain to me briefly how I can start a SpringAI project")
+			.call()
+			.content();
+
+		assertThat(response).isNotEmpty();
+		logger.info("Response: {} in {} ms", response, System.currentTimeMillis() - start);
+	}
+
+	@Test
+	void testThinkingBudgetGeminiFlashDefaultBudget() {
+		GoogleGenAiChatModel chatModelWithThinkingBudget = GoogleGenAiChatModel.builder()
+			.genAiClient(genAiClient())
+			.defaultOptions(GoogleGenAiChatOptions.builder()
+				.model(ChatModel.GEMINI_2_5_FLASH)
+				.temperature(0.1)
+				.thinkingBudget(8192)
+				.build())
+			.build();
+
+		ChatClient chatClient = ChatClient.builder(chatModelWithThinkingBudget).build();
+
+		// Time a plain prompt sent with thinkingBudget set to 8192; no tool calling is
+		// involved.
+		long start = System.currentTimeMillis();
+		String response = chatClient.prompt()
+			.user("Explain to me briefly how I can start a SpringAI project")
+			.call()
+			.content();
+
+		assertThat(response).isNotEmpty();
+		logger.info("Response: {} in {} ms", response, System.currentTimeMillis() - start);
+	}
+
+	@Test
+	void testThinkingBudgetGeminiFlashThinkingTurnedOff() {
+		GoogleGenAiChatModel chatModelWithThinkingBudget = GoogleGenAiChatModel.builder()
+			.genAiClient(genAiClient())
+			.defaultOptions(GoogleGenAiChatOptions.builder()
+				.model(ChatModel.GEMINI_2_5_FLASH)
+				.temperature(0.1)
+				.thinkingBudget(0)
+				.build())
+			.build();
+
+		ChatClient chatClient = ChatClient.builder(chatModelWithThinkingBudget).build();
+
+		// Time a plain prompt sent with thinkingBudget set to 0 (per the test name,
+		// thinking turned off); no tool calling is involved.
+		long start = System.currentTimeMillis();
+		String response = chatClient.prompt()
+			.user("Explain to me briefly how I can start a SpringAI project")
+			.call()
+			.content();
+
+		assertThat(response).isNotEmpty();
+		logger.info("Response: {} in {} ms", response, System.currentTimeMillis() - start);
+	}
+
 	/**
 	 * Tool class that returns a JSON array to test the jsonToStruct method's ability to
 	 * handle JSON arrays. This specifically tests the PR changes that improve the
diff --git a/models/spring-ai-google-genai/src/test/java/org/springframework/ai/google/genai/GoogleGenAiChatOptionsTest.java b/models/spring-ai-google-genai/src/test/java/org/springframework/ai/google/genai/GoogleGenAiChatOptionsTest.java