
Commit bea4d49

Merge branch 'refs/heads/main' into openapi-generator-orchestration
# Conflicts:
#   orchestration/src/main/java/com/sap/ai/sdk/orchestration/OrchestrationClient.java
#   orchestration/src/test/java/com/sap/ai/sdk/orchestration/OrchestrationUnitTest.java
#   sample-code/spring-app/src/main/java/com/sap/ai/sdk/app/controllers/OrchestrationController.java
#   sample-code/spring-app/src/test/java/com/sap/ai/sdk/app/controllers/OrchestrationTest.java
2 parents 4750bb8 + 0c4d933 commit bea4d49

20 files changed: +532 -327 lines changed


README.md

Lines changed: 10 additions & 2 deletions
```diff
@@ -251,7 +251,7 @@ For more detailed information and advanced usage, please refer to the following:
 
 ## FAQs
 
-### How to add a custom header to AI Core requests?
+### _"How to add a custom header to AI Core requests?"_
 
 To add a header to AI Core requests, use the following code:
 
@@ -262,7 +262,15 @@ DeploymentApi api = new DeploymentApi(client);
 
 For more customization, creating a [HeaderProvider](https://sap.github.io/cloud-sdk/docs/java/features/connectivity/http-destinations#about-headerproviders) is also possible.
 
-### More Examples
+
+### _"There's a vulnerability warning `CVE-2021-41251`?"_
+
+This is a known false-positive finding.
+Depending on the tooling, any product called "SAP Cloud SDK" or similar with a low version number may incorrectly be marked as vulnerable.
+Please consider suppressing the warning, [as we do](https://github.com/SAP/ai-sdk-java/blob/main/.pipeline/dependency-check-suppression.xml).
+
+
+### _"Are there any example projects?"_
 
 Explore example applications and code snippets:
 
```
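
The code this FAQ refers to sits outside the changed lines; only the second hunk header hints at it (`DeploymentApi api = new DeploymentApi(client);`). As a rough, hedged sketch of the approach, assuming the Cloud SDK's `DefaultHttpDestination` builder and an `ApiClient` that accepts such a destination (the wiring in the actual README may differ):

```java
import com.sap.cloud.sdk.cloudplatform.connectivity.DefaultHttpDestination;
import com.sap.cloud.sdk.cloudplatform.connectivity.Header;

// Placeholder host; in practice the AI Core URL and credentials come from the service binding.
var destination =
    DefaultHttpDestination.builder("https://<ai-core-host>/v2")
        // this header is attached to every request sent via the destination
        .header(new Header("my-custom-header", "my-value"))
        .build();

// Assumption: the generated ApiClient can be constructed from the destination and then
// handed to the API class, mirroring the `new DeploymentApi(client)` call above.
var client = new ApiClient(destination);
DeploymentApi api = new DeploymentApi(client);
```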

core/src/main/java/com/sap/ai/sdk/core/DeploymentCache.java

Lines changed: 2 additions & 6 deletions
```diff
@@ -135,13 +135,9 @@ protected static boolean isDeploymentOfModel(
     if (resources == null) {
       return false;
     }
-    Object detailsObject = resources.getBackendDetails();
-    // workaround for AIWDF-2124
+    final Object detailsObject = resources.getBackendDetails();
     if (detailsObject == null) {
-      if (!resources.getCustomFieldNames().contains("backend_details")) {
-        return false;
-      }
-      detailsObject = resources.getCustomField("backend_details");
+      return false;
     }
 
     if (detailsObject instanceof Map<?, ?> details
```
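
With the AIWDF-2124 workaround removed, the check reads the typed `backendDetails` value only and treats `null` as "not a match". A paraphrased sketch of the resulting logic (illustrative only; the real method also compares the model version and operates on the generated resource types):

```java
import java.util.Map;

// Stand-in for the simplified check: backend details now come solely from the typed
// getter, so a missing value simply means the deployment cannot be matched.
static boolean matchesModel(final String targetModelName, final Object backendDetails) {
  if (backendDetails == null) {
    return false;
  }
  return backendDetails instanceof Map<?, ?> details
      && details.get("model") instanceof Map<?, ?> model
      && targetModelName.equals(model.get("name"));
}
```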

core/src/test/java/com/sap/ai/sdk/core/CacheTest.java

Lines changed: 1 addition & 1 deletion
```diff
@@ -161,7 +161,7 @@ public void isDeploymentOfModel() {
             .createdAt(OffsetDateTime.parse("2024-01-22T17:57:23+00:00"))
             .modifiedAt(OffsetDateTime.parse("2024-02-08T08:41:23+00:00"));
     deployment.setDetails(AiDeploymentDetails.create().resources(AiResourcesDetails.create()));
-    deployment.getDetails().getResources().setCustomField("backend_details", model);
+    deployment.getDetails().getResources().setBackendDetails(model);
 
     // Check if the deployment is of the target model
     assertThat(DeploymentCache.isDeploymentOfModel(gpt4AnyVersion, deployment)).isTrue();
```

core/src/test/java/com/sap/ai/sdk/core/client/DeploymentUnitTest.java

Lines changed: 11 additions & 9 deletions
```diff
@@ -62,8 +62,7 @@ void getDeployments() {
               "ttl": null,
               "details": {
                 "scaling": {
-                  "backendDetails": {},
-                  "backend_details": {}
+                  "backendDetails": {}
                 },
                 "resources": {
                   "backendDetails": {
@@ -104,7 +103,6 @@ void getDeployments() {
     assertThat(deployment.getDeploymentUrl())
         .isEqualTo(
            "https://api.ai.intprod-eu12.eu-central-1.aws.ml.hana.ondemand.com/v2/inference/deployments/d889e3a61050c085");
-    // Response contains key "backend_details" while spec (mistakenly) defines key "backendDetails".
     val expected = Map.of("model", Map.of("name", "gpt-4-32k", "version", "latest"));
     assertThat(deployment.getDetails().getResources().getBackendDetails()).isEqualTo(expected);
     assertThat(deployment.getDetails().getScaling().getBackendDetails()).isEqualTo(Map.of());
@@ -243,12 +241,12 @@ void getDeploymentById() {
               "deploymentUrl": "https://api.ai.intprod-eu12.eu-central-1.aws.ml.hana.ondemand.com/v2/inference/deployments/db1d64d9f06be467",
               "details": {
                 "resources": {
-                  "backend_details": {},
-                  "backendDetails": {}
+                  "backendDetails": {},
+                  "backend_details": {}
                 },
                 "scaling": {
-                  "backend_details": {},
-                  "backendDetails": {}
+                  "backendDetails": {},
+                  "backend_details": {}
                 }
               },
               "id": "db1d64d9f06be467",
@@ -272,8 +270,12 @@ void getDeploymentById() {
     assertThat(deployment.getDeploymentUrl())
         .isEqualTo(
            "https://api.ai.intprod-eu12.eu-central-1.aws.ml.hana.ondemand.com/v2/inference/deployments/db1d64d9f06be467");
-    assertThat(deployment.getDetails().getResources().getBackendDetails()).isNotNull();
-    assertThat(deployment.getDetails().getScaling().getBackendDetails()).isNotNull();
+    assertThat(deployment.getDetails().getResources().getBackendDetails()).isEqualTo(Map.of());
+    assertThat(deployment.getDetails().getResources().getCustomField("backend_details"))
+        .isEqualTo(Map.of());
+    assertThat(deployment.getDetails().getScaling().getBackendDetails()).isEqualTo(Map.of());
+    assertThat(deployment.getDetails().getScaling().getCustomField("backend_details"))
+        .isEqualTo(Map.of());
     assertThat(deployment.getId()).isEqualTo("db1d64d9f06be467");
     assertThat(deployment.getLastOperation())
         .isEqualTo(AiDeploymentResponseWithDetails.LastOperationEnum.CREATE);
```
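
The new assertions pin down how a payload carrying both spellings is surfaced: the spec-defined `backendDetails` key feeds the typed getter, while the snake_case `backend_details` key stays reachable as an untyped custom field. Condensed to its essence (same getters as in the test above):

```java
// typed field, populated from the "backendDetails" key of the stubbed JSON
assertThat(deployment.getDetails().getResources().getBackendDetails()).isEqualTo(Map.of());
// raw snake_case key, preserved as a custom field
assertThat(deployment.getDetails().getResources().getCustomField("backend_details"))
    .isEqualTo(Map.of());
```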

core/src/test/resources/__files/GPT4DeploymentResponse.json

Lines changed: 2 additions & 2 deletions
```diff
@@ -8,15 +8,15 @@
   "deploymentUrl": "https://api.ai.intprod-eu12.eu-central-1.aws.ml.hana.ondemand.com/v2/inference/deployments/d19b998f347341aa",
   "details": {
     "resources": {
-      "backend_details": {
+      "backendDetails": {
         "model": {
           "name": "gpt-4-32k",
           "version": "latest"
         }
       }
     },
     "scaling": {
-      "backend_details": {}
+      "backendDetails": {}
     }
   },
   "id": "d19b998f347341aa",
```

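This fixture lives under `src/test/resources/__files/`, the directory WireMock serves response bodies from. A hedged sketch of how such a file is typically wired into a stub (the path and headers here are hypothetical; the project's actual test setup may differ):

```java
import static com.github.tomakehurst.wiremock.client.WireMock.aResponse;
import static com.github.tomakehurst.wiremock.client.WireMock.get;
import static com.github.tomakehurst.wiremock.client.WireMock.stubFor;
import static com.github.tomakehurst.wiremock.client.WireMock.urlPathEqualTo;

// Serve the fixture for a deployment request; WireMock resolves the file name
// relative to the __files/ directory.
stubFor(
    get(urlPathEqualTo("/v2/lm/deployments"))
        .willReturn(
            aResponse()
                .withHeader("Content-Type", "application/json")
                .withBodyFile("GPT4DeploymentResponse.json")));
```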
docs/guides/OPENAI_CHAT_COMPLETION.md

Lines changed: 2 additions & 4 deletions
```diff
@@ -65,12 +65,10 @@ In addition to the prerequisites above, we assume you have already set up the fo
       "ttl": null,
       "details": {
         "scaling": {
-          "backendDetails": null,
-          "backend_details": {}
+          "backendDetails": {}
         },
         "resources": {
-          "backendDetails": null,
-          "backend_details": {
+          "backendDetails": {
             "model": {
               "name": "gpt-35-turbo",
               "version": "latest"
```

docs/guides/ORCHESTRATION_CHAT_COMPLETION.md

Lines changed: 72 additions & 100 deletions
````diff
@@ -68,90 +68,84 @@ In addition to the prerequisites above, we assume you have already set up the fo
 ```
 
 </details>
-
-### Chat completion with Templates
 
-Use a chat completion template to generate a response in German:
+### Create a Client
+
+To use the Orchestration service, create a client and a configuration object:
 
 ```java
-var llmConfig = LLMModuleConfig.create().modelName("gpt-35-turbo").modelParams(Map.of());
+var client = new OrchestrationClient();
 
-var inputParams =
-    Map.of("input", "Reply with 'Orchestration Service is working!' in German");
-var template = ChatMessage.create().role("user").content("{{?input}}");
-var templatingConfig = TemplatingModuleConfig.create().template(template);
+var config = new OrchestrationModuleConfig()
+    .withLlmConfig(LLMModuleConfig.create().modelName("gpt-35-turbo").modelParams(Map.of()));
+```
+
+Please also refer to [our sample code](../../sample-code/spring-app/src/main/java/com/sap/ai/sdk/app/controllers/OrchestrationController.java) for this and all following code examples.
+
+### Chat Completion
 
-var config =
-    CompletionPostRequest.create()
-        .orchestrationConfig(
-            OrchestrationConfig.create()
-                .moduleConfigurations(
-                    ModuleConfigs.create()
-                        .llmModuleConfig(llmConfig)
-                        .templatingModuleConfig(templatingConfig)))
-        .inputParams(inputParams);
+Use the Orchestration service to generate a response to a user message:
 
-CompletionPostResponse result =
-    new OrchestrationClient().chatCompletion(config);
+```java
+var prompt = new OrchestrationPrompt("Hello world! Why is this phrase so famous?");
+
+var result = client.chatCompletion(prompt, config);
 
 String messageResult =
-      result.getOrchestrationResult().getChoices().get(0).getMessage().getContent();
+    result.getOrchestrationResult().getChoices().get(0).getMessage().getContent();
 ```
 
-See [an example in our Spring Boot application](../../sample-code/spring-app/src/main/java/com/sap/ai/sdk/app/controllers/OrchestrationController.java)
+In this example, the Orchestration service generates a response to the user message "Hello world! Why is this phrase so famous?".
+The LLM response is available as the first choice under the `result.getOrchestrationResult()` object.
 
-### Message history
+### Chat completion with Templates
 
-Include a message history to maintain context in the conversation:
+Use a prepared template and execute requests by passing only the input parameters:
 
 ```java
-var llmConfig = LLMModuleConfig.create().modelName("gpt-35-turbo").modelParams(Map.of());
+var template =
+    ChatMessage.create()
+        .role("user")
+        .content("Reply with 'Orchestration Service is working!' in {{?language}}");
+var templatingConfig = TemplatingModuleConfig.create().template(template);
+var configWithTemplate = config.withTemplateConfig(templatingConfig);
+
+var inputParams = Map.of("language", "German");
+var prompt = new OrchestrationPrompt(inputParams);
+
+var result = client.chatCompletion(prompt, configWithTemplate);
+```
+
+In this case, the template is defined with the placeholder `{{?language}}`, which is replaced by the value `German` from the input parameters.
+
+### Message history
 
-List<ChatMessage> messagesHistory =
-    List.of(
-        ChatMessage.create().role("user").content("What is the capital of France?"),
-        ChatMessage.create().role("assistant").content("The capital of France is Paris."));
+Include a message history to maintain context in the conversation:
 
+```java
+var messagesHistory =
+    List.of(
+        ChatMessage.create().role("user").content("What is the capital of France?"),
+        ChatMessage.create().role("assistant").content("The capital of France is Paris."));
 var message =
-    ChatMessage.create().role("user").content("What is the typical food there?");
-var templatingConfig = TemplatingModuleConfig.create().template(message);
-
-var config =
-    CompletionPostRequest.create()
-        .orchestrationConfig(
-            OrchestrationConfig.create()
-                .moduleConfigurations(
-                    ModuleConfigs.create()
-                        .llmModuleConfig(llmConfig)
-                        .templatingModuleConfig(templatingConfig)))
-        .messagesHistory(messagesHistory);
-
-CompletionPostResponse result =
-    new OrchestrationClient().chatCompletion(config);
+    ChatMessage.create().role("user").content("What is the typical food there?");
 
-String messageResult =
-    result.getOrchestrationResult().getChoices().get(0).getMessage().getContent();
-```
+var prompt = new OrchestrationPrompt(message).messageHistory(messagesHistory);
 
-See [an example in our Spring Boot application](../../sample-code/spring-app/src/main/java/com/sap/ai/sdk/app/controllers/OrchestrationController.java)
+var result = new OrchestrationClient().chatCompletion(prompt, config);
+```
 
 ### Chat completion filter
 
 Apply content filtering to the chat completion:
 
 ```java
-var llmConfig = LLMModuleConfig.create().modelName("gpt-35-turbo").modelParams(Map.of());
-
-var inputParams =
-    Map.of(
-        "disclaimer",
-        "```DISCLAIMER: The area surrounding the apartment is known for prostitutes and gang violence including armed conflicts, gun violence is frequent.");
-var template =
-    ChatMessage.create()
-        .role("user")
-        .content(
-            "Create a rental posting for subletting my apartment in the downtown area. Keep it short. Make sure to add the following disclaimer to the end. Do not change it! {{?disclaimer}}");
-var templatingConfig = TemplatingModuleConfig.create().template(template);
+var prompt = new OrchestrationPrompt(
+    """
+    Create a rental posting for subletting my apartment in the downtown area. Keep it short. Make sure to add the following disclaimer to the end. Do not change it!
+
+    ```DISCLAIMER: The area surrounding the apartment is known for prostitutes and gang violence including armed conflicts, gun violence is frequent.
+    """);
 
 var filterStrict =
     FilterConfig.create()
@@ -176,40 +170,21 @@ var filterLoose =
 var filteringConfig =
     FilteringModuleConfig.create()
         // changing the input to filterLoose will allow the message to pass
-        .input(FilteringConfig.create().filters(filterStrict))
-        .output(FilteringConfig.create().filters(filterStrict));
-
-var config =
-    CompletionPostRequest.create()
-        .orchestrationConfig(
-            OrchestrationConfig.create()
-                .moduleConfigurations(
-                    ModuleConfigs.create()
-                        .llmModuleConfig(llmConfig)
-                        .templatingModuleConfig(templatingConfig)
-                        .filteringModuleConfig(filteringConfig)))
-        .inputParams(inputParams);
+        .input(InputFilteringConfig.create().filters(filterStrict))
+        .output(OutputFilteringConfig.create().filters(filterStrict));
 
-// this fails with Bad Request because the strict filter prohibits the input message
-CompletionPostResponse result =
-    new OrchestrationClient().chatCompletion(config);
+var configWithFilter = config.withFilteringConfig(filteringConfig);
 
-String messageResult =
-    result.getOrchestrationResult().getChoices().get(0).getMessage().getContent();
+// this fails with Bad Request because the strict filter prohibits the input message
+var result =
+    new OrchestrationClient().chatCompletion(prompt, configWithFilter);
 ```
 
-See [an example in our Spring Boot application](../../sample-code/spring-app/src/main/java/com/sap/ai/sdk/app/controllers/OrchestrationController.java)
-
 ### Data masking
 
 Use the data masking module to anonymize personal information in the input:
 
 ```java
-var inputParams = Map.of("privateInfo", "Patrick Morgan +49 (970) 333-3833");
-var template =
-    ChatMessage.create().role("user").content("What is the nationality of {{?privateInfo}}");
-var templatingConfig = TemplatingModuleConfig.create().template(template);
-
 var maskingProvider =
     MaskingProviderConfig.create()
         .type(MaskingProviderConfig.TypeEnum.SAP_DATA_PRIVACY_INTEGRATION)
@@ -218,29 +193,26 @@ var maskingProvider =
             DPIEntityConfig.create().type(DPIEntities.PHONE),
             DPIEntityConfig.create().type(DPIEntities.PERSON));
 var maskingConfig = MaskingModuleConfig.create().maskingProviders(maskingProvider);
+var configWithMasking = config.withMaskingConfig(maskingConfig);
 
-CompletionPostRequest config =
-    CompletionPostRequest.create()
-        .orchestrationConfig(
-            OrchestrationConfig.create()
-                .moduleConfigurations(
-                    ModuleConfigs.create()
-                        .llmModuleConfig(LLM_CONFIG)
-                        .templatingModuleConfig(templatingConfig)
-                        .maskingModuleConfig(maskingConfig)))
-        .inputParams(inputParams);
+var systemMessage = ChatMessage.create()
+    .role("system")
+    .content("Please evaluate the following user feedback and judge if the sentiment is positive or negative.");
+var userMessage = ChatMessage.create()
+    .role("user")
+    .content("""
+        I think the SDK is good, but could use some further enhancements.
+        My architect Alice and manager Bob pointed out that we need the grounding capabilities, which aren't supported yet.
+        """);
 
-CompletionPostResponse result =
-    new OrchestrationClient().chatCompletion(config);
+var prompt = new OrchestrationPrompt(systemMessage, userMessage);
 
-String messageResult =
-    result.getOrchestrationResult().getChoices().get(0).getMessage().getContent();
+var result =
+    new OrchestrationClient().chatCompletion(prompt, configWithMasking);
 ```
 
 In this example, the input will be masked before the call to the LLM. Note that data cannot be unmasked in the LLM output.
 
-See [an example in our Spring Boot application](../../sample-code/spring-app/src/main/java/com/sap/ai/sdk/app/controllers/OrchestrationController.java)
-
 ### Set model parameters
 
 Change your LLM module configuration to add model parameters:
````
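
Taken together, the new surface in this guide boils down to one client, one reusable `OrchestrationModuleConfig`, and an `OrchestrationPrompt` per request. Below is a condensed sketch assembled from the calls shown in the hunks above; the import statements and the package of the generated model classes are assumptions, since they are not part of this diff:

```java
import com.sap.ai.sdk.orchestration.OrchestrationClient;
import com.sap.ai.sdk.orchestration.OrchestrationModuleConfig;           // assumed package
import com.sap.ai.sdk.orchestration.OrchestrationPrompt;                 // assumed package
import com.sap.ai.sdk.orchestration.client.model.ChatMessage;            // assumed package
import com.sap.ai.sdk.orchestration.client.model.LLMModuleConfig;        // assumed package
import com.sap.ai.sdk.orchestration.client.model.TemplatingModuleConfig; // assumed package
import java.util.Map;

class OrchestrationSketch {
  public static void main(String[] args) {
    // one client and one base configuration, reused across requests
    var client = new OrchestrationClient();
    var config =
        new OrchestrationModuleConfig()
            .withLlmConfig(LLMModuleConfig.create().modelName("gpt-35-turbo").modelParams(Map.of()));

    // a templated request: {{?language}} is filled from the prompt's input parameters
    var template =
        ChatMessage.create()
            .role("user")
            .content("Reply with 'Orchestration Service is working!' in {{?language}}");
    var configWithTemplate =
        config.withTemplateConfig(TemplatingModuleConfig.create().template(template));

    var prompt = new OrchestrationPrompt(Map.of("language", "German"));
    var result = client.chatCompletion(prompt, configWithTemplate);

    // the answer is the first choice of the orchestration result
    String answer =
        result.getOrchestrationResult().getChoices().get(0).getMessage().getContent();
    System.out.println(answer);
  }
}
```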
