spring-projects
diff --git a/‎models/spring-ai-vertex-ai/src/main/java/org/springframework/ai/vertex/VertexAiChatClient.java
Lines changed: 44 additions & 34 deletions b/‎models/spring-ai-vertex-ai/src/main/java/org/springframework/ai/vertex/VertexAiChatClient.java
Lines changed: 44 additions & 34 deletions
diff --git a/‎models/spring-ai-vertex-ai/src/main/java/org/springframework/ai/vertex/VertexAiChatOptions.java
Lines changed: 134 additions & 0 deletions b/‎models/spring-ai-vertex-ai/src/main/java/org/springframework/ai/vertex/VertexAiChatOptions.java
Lines changed: 134 additions & 0 deletions
diff --git a/‎models/spring-ai-vertex-ai/src/main/java/org/springframework/ai/vertex/api/VertexAiApi.java
Lines changed: 5 additions & 4 deletions b/‎models/spring-ai-vertex-ai/src/main/java/org/springframework/ai/vertex/api/VertexAiApi.java
Lines changed: 5 additions & 4 deletions
diff --git a/‎models/spring-ai-vertex-ai/src/test/java/org/springframework/ai/vertex/generation/VertexAiChatGenerationClientIT.java renamed to ‎models/spring-ai-vertex-ai/src/test/java/org/springframework/ai/vertex/VertexAiChatGenerationClientIT.java
Lines changed: 6 additions & 7 deletions b/‎models/spring-ai-vertex-ai/src/test/java/org/springframework/ai/vertex/generation/VertexAiChatGenerationClientIT.java renamed to ‎models/spring-ai-vertex-ai/src/test/java/org/springframework/ai/vertex/VertexAiChatGenerationClientIT.java
Lines changed: 6 additions & 7 deletions
@@ -20,9 +20,11 @@
 import java.util.stream.Collectors;
 
 import org.springframework.ai.chat.ChatClient;
+import org.springframework.ai.chat.ChatOptions;
 import org.springframework.ai.chat.ChatResponse;
 import org.springframework.ai.chat.Generation;
 import org.springframework.ai.chat.prompt.Prompt;
+import org.springframework.ai.model.ModelOptionsUtils;
 import org.springframework.ai.chat.messages.MessageType;
 import org.springframework.ai.vertex.api.VertexAiApi;
 import org.springframework.ai.vertex.api.VertexAiApi.GenerateMessageRequest;
@@ -38,40 +40,40 @@ public class VertexAiChatClient implements ChatClient {
 
 	private final VertexAiApi vertexAiApi;
 
-	private Float temperature;
+	private final VertexAiChatOptions defaultOptions;
 
-	private Float topP;
-
-	private Integer topK;
+	/**
+	 * Creates a chat client that uses built-in default options: temperature 0.7,
+	 * candidate count 1 and top-k 20.
+	 * @param vertexAiApi the Vertex AI API used to send requests
+	 */
+	public VertexAiChatClient(VertexAiApi vertexAiApi) {
+		this(vertexAiApi,
+				VertexAiChatOptions.builder().withTemperature(0.7f).withCandidateCount(1).withTopK(20).build());
+	}
 
-	private Integer candidateCount;
+	/**
+	 * Creates a chat client with explicit default options.
+	 * @param vertexAiApi the Vertex AI API used to send requests; checked with
+	 * {@code Assert.notNull}
+	 * @param defaultOptions options kept as this client's defaults; checked with
+	 * {@code Assert.notNull}
+	 */
+	public VertexAiChatClient(VertexAiApi vertexAiApi, VertexAiChatOptions defaultOptions) {
+		Assert.notNull(defaultOptions, "Default options must not be null!");
+		Assert.notNull(vertexAiApi, "VertexAiApi must not be null!");
 
-	public VertexAiChatClient(VertexAiApi vertexAiApi) {
 		this.vertexAiApi = vertexAiApi;
+		this.defaultOptions = defaultOptions;
 	}
 
-	public VertexAiChatClient withTemperature(Float temperature) {
-		this.temperature = temperature;
-		return this;
-	}
+	/**
+	 * Sends the prompt to Vertex AI and wraps the answer in a {@link ChatResponse}.
+	 * The request is built by {@code createRequest(prompt)}, sent through
+	 * {@code vertexAiApi.generateMessage}, and every returned candidate becomes one
+	 * {@link Generation} holding that candidate's content.
+	 * @param prompt the prompt to send
+	 * @return a response with one generation per returned candidate
+	 */
+	@Override
+	public ChatResponse call(Prompt prompt) {
 
-	public VertexAiChatClient withTopP(Float topP) {
-		this.topP = topP;
-		return this;
-	}
+		GenerateMessageRequest request = createRequest(prompt);
 
-	public VertexAiChatClient withTopK(Integer topK) {
-		this.topK = topK;
-		return this;
-	}
+		GenerateMessageResponse response = this.vertexAiApi.generateMessage(request);
 
-	public VertexAiChatClient withCandidateCount(Integer maxTokens) {
-		this.candidateCount = maxTokens;
-		return this;
+		List<Generation> generations = response.candidates()
+			.stream()
+			.map(vmsg -> new Generation(vmsg.content()))
+			.toList();
+
+		return new ChatResponse(generations);
 	}
 
-	@Override
-	public ChatResponse call(Prompt prompt) {
+	/**
+	 * Builds the {@link GenerateMessageRequest} for a prompt: the prompt's instructions
+	 * are turned into a {@code MessagePrompt} (context plus messages), then this client's
+	 * default options and any options carried by the prompt are merged into the request.
+	 * Package-private so that tests can call it.
+	 * @param prompt the prompt to convert
+	 * @return the request to send to the API
+	 * @throws IllegalArgumentException if the prompt carries options that are not a
+	 * {@link ChatOptions}
+	 */
+	GenerateMessageRequest createRequest(Prompt prompt) {
 
 		String vertexContext = prompt.getInstructions()
 			.stream()
@@ -89,17 +91,25 @@ public ChatResponse call(Prompt prompt) {
 
 		var vertexPrompt = new MessagePrompt(vertexContext, vertexMessages);
 
-		GenerateMessageRequest request = new GenerateMessageRequest(vertexPrompt, this.temperature, this.candidateCount,
-				this.topP, this.topK);
-
-		GenerateMessageResponse response = this.vertexAiApi.generateMessage(request);
-
-		List<Generation> generations = response.candidates()
-			.stream()
-			.map(vmsg -> new Generation(vmsg.content()))
-			.toList();
-
-		return new ChatResponse(generations);
+		GenerateMessageRequest request = new GenerateMessageRequest(vertexPrompt);
+
+		// The constructor asserts that defaultOptions is non-null, so this guard is
+		// always true; it is kept as a defensive check.
+		if (this.defaultOptions != null) {
+			request = ModelOptionsUtils.merge(request, this.defaultOptions, GenerateMessageRequest.class);
+		}
+
+		if (prompt.getOptions() != null) {
+			if (prompt.getOptions() instanceof ChatOptions runtimeOptions) {
+				// Copy the ChatOptions view of the prompt options into a VertexAiChatOptions
+				// before merging it with the request.
+				VertexAiChatOptions updatedRuntimeOptions = ModelOptionsUtils.copyToTarget(runtimeOptions,
+						ChatOptions.class, VertexAiChatOptions.class);
+				// NOTE(review): the options are the first merge argument here, while the
+				// request is first in the defaults merge above - presumably the first
+				// argument's non-null values win; confirm against ModelOptionsUtils.merge.
+				request = ModelOptionsUtils.merge(updatedRuntimeOptions, request, GenerateMessageRequest.class);
+			}
+			else {
+				throw new IllegalArgumentException("Prompt options are not of type ChatOptions: "
+						+ prompt.getOptions().getClass().getSimpleName());
+			}
+		}
+
+		return request;
 	}
 
 }
@@ -0,0 +1,134 @@
+/*
+ * Copyright 2024-2024 the original author or authors.
+ *
+ * Licensed under the Apache License, Version 2.0 (the "License");
+ * you may not use this file except in compliance with the License.
+ * You may obtain a copy of the License at
+ *
+ *      https://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+
+package org.springframework.ai.vertex;
+
+import com.fasterxml.jackson.annotation.JsonInclude;
+import com.fasterxml.jackson.annotation.JsonInclude.Include;
+import com.fasterxml.jackson.annotation.JsonProperty;
+
+import org.springframework.ai.chat.ChatOptions;
+
+/**
+ * Options for the Vertex AI chat client. Properties that are left {@code null} are
+ * omitted when the options are written as JSON.
+ *
+ * @author Christian Tzolov
+ */
+@JsonInclude(Include.NON_NULL)
+public class VertexAiChatOptions implements ChatOptions {
+
+	/**
+	 * Controls the randomness of the output. Values can range over [0.0,1.0], inclusive.
+	 * A value closer to 1.0 produces more varied responses, while a value closer to 0.0
+	 * typically results in less surprising responses from the generative model. This
+	 * value specifies the default used by the backend when calling the generative model.
+	 */
+	@JsonProperty("temperature")
+	private Float temperature;
+
+	/**
+	 * The number of generated response messages to return. This value must be between
+	 * [1, 8], inclusive. Defaults to 1.
+	 */
+	@JsonProperty("candidateCount")
+	private Integer candidateCount;
+
+	/**
+	 * The maximum cumulative probability of tokens to consider when sampling. The
+	 * generative model uses combined Top-k and nucleus sampling. Nucleus sampling
+	 * considers the smallest set of tokens whose probability sum is at least topP.
+	 */
+	@JsonProperty("topP")
+	private Float topP;
+
+	/**
+	 * The maximum number of tokens to consider when sampling. The generative model uses
+	 * combined Top-k and nucleus sampling. Top-k sampling considers the set of topK most
+	 * probable tokens.
+	 */
+	@JsonProperty("topK")
+	private Integer topK;
+
+	/**
+	 * @return the sampling temperature, or {@code null} if unset
+	 */
+	@Override
+	public Float getTemperature() {
+		return this.temperature;
+	}
+
+	/**
+	 * @param temperature the sampling temperature; {@code null} unsets it
+	 */
+	@Override
+	public void setTemperature(Float temperature) {
+		this.temperature = temperature;
+	}
+
+	/**
+	 * @return the number of response candidates to request, or {@code null} if unset
+	 */
+	public Integer getCandidateCount() {
+		return this.candidateCount;
+	}
+
+	/**
+	 * @param candidateCount the number of response candidates to request; {@code null}
+	 * unsets it
+	 */
+	public void setCandidateCount(Integer candidateCount) {
+		this.candidateCount = candidateCount;
+	}
+
+	/**
+	 * @return the nucleus-sampling probability mass, or {@code null} if unset
+	 */
+	@Override
+	public Float getTopP() {
+		return this.topP;
+	}
+
+	/**
+	 * @param topP the nucleus-sampling probability mass; {@code null} unsets it
+	 */
+	@Override
+	public void setTopP(Float topP) {
+		this.topP = topP;
+	}
+
+	/**
+	 * @return the top-k token limit, or {@code null} if unset
+	 */
+	@Override
+	public Integer getTopK() {
+		return this.topK;
+	}
+
+	/**
+	 * @param topK the top-k token limit; {@code null} unsets it
+	 */
+	@Override
+	public void setTopK(Integer topK) {
+		this.topK = topK;
+	}
+
+	/**
+	 * Starts a fluent builder for {@link VertexAiChatOptions}.
+	 * @return a new builder whose options are all unset
+	 */
+	public static Builder builder() {
+		return new Builder();
+	}
+
+	/**
+	 * Fluent builder. It configures one {@link VertexAiChatOptions} instance and
+	 * {@link #build()} returns that same instance, so calling a {@code with...} method
+	 * after {@code build()} also changes the object that was already returned.
+	 */
+	public static class Builder {
+
+		private final VertexAiChatOptions target = new VertexAiChatOptions();
+
+		public Builder withTemperature(Float temperature) {
+			this.target.setTemperature(temperature);
+			return this;
+		}
+
+		public Builder withCandidateCount(Integer candidateCount) {
+			this.target.setCandidateCount(candidateCount);
+			return this;
+		}
+
+		public Builder withTopP(Float topP) {
+			this.target.setTopP(topP);
+			return this;
+		}
+
+		public Builder withTopK(Integer topK) {
+			this.target.setTopK(topK);
+			return this;
+		}
+
+		public VertexAiChatOptions build() {
+			return this.target;
+		}
+
+	}
+
+}
@@ -107,7 +107,7 @@ public class VertexAiApi {
 
 	private final String apiKey;
 
-	private final String generateModel;
+	private final String chatModel;
 
 	private final String embeddingModel;
 
@@ -130,7 +130,7 @@ public VertexAiApi(String apiKey) {
 	public VertexAiApi(String baseUrl, String apiKey, String model, String embeddingModel,
 			RestClient.Builder restClientBuilder) {
 
-		this.generateModel = model;
+		this.chatModel = model;
 		this.embeddingModel = embeddingModel;
 		this.apiKey = apiKey;
 
@@ -165,11 +165,12 @@ public void handleError(ClientHttpResponse response) throws IOException {
 	 * @param request Request body.
 	 * @return Response body.
 	 */
+	// NOTE(review): presumably silences null-analysis warnings raised on the RestClient
+	// call chain below - confirm which expression triggers them.
+	@SuppressWarnings("null")
 	public GenerateMessageResponse generateMessage(GenerateMessageRequest request) {
 		Assert.notNull(request, "The request body can not be null.");
 
+		// POST the request to the generateMessage endpoint; the configured chat model name
+		// and the API key fill the {model} and {apiKey} URI template variables.
 		return this.restClient.post()
-			.uri("/models/{model}:generateMessage?key={apiKey}", this.generateModel, this.apiKey)
+			.uri("/models/{model}:generateMessage?key={apiKey}", this.chatModel, this.apiKey)
 			.body(request)
 			.retrieve()
 			.body(GenerateMessageResponse.class);
@@ -231,7 +232,7 @@ record TokenCount(@JsonProperty("tokenCount") Integer tokenCount) {
 		}
 
 		TokenCount tokenCountResponse = this.restClient.post()
-				.uri("/models/{model}:countMessageTokens?key={apiKey}", this.generateModel, this.apiKey)
+				.uri("/models/{model}:countMessageTokens?key={apiKey}", this.chatModel, this.apiKey)
 				.body(Map.of("prompt", prompt))
 				.retrieve()
 				.body(TokenCount.class);
 
@@ -1,4 +1,4 @@
-package org.springframework.ai.vertex.generation;
+package org.springframework.ai.vertex;
 
 import java.util.Arrays;
 import java.util.List;
@@ -9,15 +9,14 @@
 
 import org.springframework.ai.chat.ChatResponse;
 import org.springframework.ai.chat.Generation;
-import org.springframework.ai.parser.BeanOutputParser;
-import org.springframework.ai.parser.ListOutputParser;
-import org.springframework.ai.parser.MapOutputParser;
+import org.springframework.ai.chat.messages.Message;
+import org.springframework.ai.chat.messages.UserMessage;
 import org.springframework.ai.chat.prompt.Prompt;
 import org.springframework.ai.chat.prompt.PromptTemplate;
 import org.springframework.ai.chat.prompt.SystemPromptTemplate;
-import org.springframework.ai.chat.messages.Message;
-import org.springframework.ai.chat.messages.UserMessage;
-import org.springframework.ai.vertex.VertexAiChatClient;
+import org.springframework.ai.parser.BeanOutputParser;
+import org.springframework.ai.parser.ListOutputParser;
+import org.springframework.ai.parser.MapOutputParser;
 import org.springframework.ai.vertex.api.VertexAiApi;
 import org.springframework.beans.factory.annotation.Autowired;
 import org.springframework.beans.factory.annotation.Value;