Add taskSettings parameter to LlamaChatCompletionModel and LlamaEmbeddingsModel for enhanced customization

Jan-Kazlouski-elastic · Jan-Kazlouski-elastic · commit fe90810f838f · 2025-07-24T16:23:54.000+03:00
diff --git a/x-pack/plugin/inference/src/main/java/org/elasticsearch/xpack/inference/services/llama/completion/LlamaChatCompletionModel.java b/x-pack/plugin/inference/src/main/java/org/elasticsearch/xpack/inference/services/llama/completion/LlamaChatCompletionModel.java
@@ -33,6 +33,7 @@ public class LlamaChatCompletionModel extends LlamaModel {
      * @param taskType the type of task this model is designed for
      * @param service the name of the inference service
      * @param serviceSettings the settings for the inference service, specific to chat completion
+     * @param taskSettings the settings for the task, such as user or other parameters
      * @param secrets the secret settings for the model, such as API keys or tokens
      * @param context the context for parsing configuration settings
      */
@@ -61,6 +62,7 @@ public LlamaChatCompletionModel(
      * @param taskType the type of task this model is designed for
      * @param service the name of the inference service
      * @param serviceSettings the settings for the inference service, specific to chat completion
+     * @param taskSettings the settings for the task, such as user or other parameters
      * @param secrets the secret settings for the model, such as API keys or tokens
      */
     public LlamaChatCompletionModel(
@@ -75,6 +77,14 @@ public LlamaChatCompletionModel(
         setPropertiesFromServiceSettings(serviceSettings);
     }
 
+    /**
+     * Factory method to create a LlamaChatCompletionModel with overridden task settings based on the request.
+     * If the request does not specify task settings, the original model is returned.
+     *
+     * @param model the original LlamaChatCompletionModel
+     * @param taskSettings the overriding task settings from the request, such as user; may be {@code null} or empty
+     * @return a new LlamaChatCompletionModel with overridden task settings or the original model if no overrides are specified
+     */
     public static LlamaChatCompletionModel of(LlamaChatCompletionModel model, Map<String, Object> taskSettings) {
         if (taskSettings == null || taskSettings.isEmpty()) {
             return model;
diff --git a/x-pack/plugin/inference/src/main/java/org/elasticsearch/xpack/inference/services/llama/embeddings/LlamaEmbeddingsModel.java b/x-pack/plugin/inference/src/main/java/org/elasticsearch/xpack/inference/services/llama/embeddings/LlamaEmbeddingsModel.java
@@ -34,6 +34,8 @@ public class LlamaEmbeddingsModel extends LlamaModel {
      * @param taskType the type of task this model is designed for
      * @param service the name of the inference service
      * @param serviceSettings the settings for the inference service, specific to embeddings
+     * @param taskSettings the settings for the task, such as user or other parameters
+     * @param chunkingSettings the chunking settings for processing input data
      * @param secrets the secret settings for the model, such as API keys or tokens
      * @param context the context for parsing configuration settings
      */
@@ -86,6 +88,7 @@ private void setPropertiesFromServiceSettings(LlamaEmbeddingsServiceSettings ser
      * @param taskType the type of task this model is designed for
      * @param service the name of the inference service
      * @param serviceSettings the settings for the inference service, specific to embeddings
+     * @param taskSettings the settings for the task, such as user or other parameters
      * @param chunkingSettings the chunking settings for processing input data
      * @param secrets the secret settings for the model, such as API keys or tokens
      */
@@ -105,6 +108,14 @@ public LlamaEmbeddingsModel(
         setPropertiesFromServiceSettings(serviceSettings);
     }
 
+    /**
+     * Factory method to create a LlamaEmbeddingsModel with overridden task settings based on the request.
+     * If the request does not specify task settings, the original model is returned.
+     *
+     * @param model the original LlamaEmbeddingsModel
+     * @param taskSettings the overriding task settings from the request, such as user; may be {@code null} or empty
+     * @return a new LlamaEmbeddingsModel with overridden task settings or the original model if no overrides are specified
+     */
     public static LlamaEmbeddingsModel of(LlamaEmbeddingsModel model, Map<String, Object> taskSettings) {
         if (taskSettings == null || taskSettings.isEmpty()) {
             return model;