SAP
diff --git a/‎docs/guides/ORCHESTRATION_CHAT_COMPLETION.md‎
Lines changed: 69 additions & 0 deletions b/‎docs/guides/ORCHESTRATION_CHAT_COMPLETION.md‎
Lines changed: 69 additions & 0 deletions
diff --git a/‎docs/release-notes/release_notes.md‎
Lines changed: 1 addition & 0 deletions b/‎docs/release-notes/release_notes.md‎
Lines changed: 1 addition & 0 deletions
diff --git a/‎orchestration/src/main/java/com/sap/ai/sdk/orchestration/ConfigToRequestTransformer.java‎
Lines changed: 2 additions & 1 deletion b/‎orchestration/src/main/java/com/sap/ai/sdk/orchestration/ConfigToRequestTransformer.java‎
Lines changed: 2 additions & 1 deletion
diff --git a/‎orchestration/src/test/java/com/sap/ai/sdk/orchestration/OrchestrationUnitTest.java‎
Lines changed: 123 additions & 24 deletions b/‎orchestration/src/test/java/com/sap/ai/sdk/orchestration/OrchestrationUnitTest.java‎
Lines changed: 123 additions & 24 deletions
diff --git a/‎orchestration/src/test/resources/__files/jsonObjectResponse.json‎
Lines changed: 59 additions & 0 deletions b/‎orchestration/src/test/resources/__files/jsonObjectResponse.json‎
Lines changed: 59 additions & 0 deletions
@@ -12,6 +12,8 @@
     - [Data Masking](#data-masking)
     - [Grounding](#grounding)
     - [Stream chat completion](#stream-chat-completion)
+    - [Add images and multiple text inputs to a message](#add-images-and-multiple-text-inputs-to-a-message)
+    - [Set a Response Format](#set-a-response-format)
     - [Set Model Parameters](#set-model-parameters)
     - [Using a Configuration from AI Launchpad](#using-a-configuration-from-ai-launchpad)
 
@@ -300,6 +302,73 @@ Note, that only user and system messages are supported for multiple text inputs.
 Please find [an example in our Spring Boot application](../../sample-code/spring-app/src/main/java/com/sap/ai/sdk/app/services/OrchestrationService.java).
 
 
+## Set a Response Format
+
+It is possible to set the response format for the chat completion. Available options are `JSON_OBJECT`, `JSON_SCHEMA`, and `TEXT`, where `TEXT` is the default behavior.
+
+### JSON_OBJECT
+
+Setting the response format to `JSON_OBJECT` tells the AI to respond with JSON, i.e., the response from the AI will be a string consisting of valid JSON. This does not, however, guarantee that the response adheres to a specific structure (other than being valid JSON).
+
+```java
+var template = Message.user("What is 'apple' in German?");
+var templatingConfig =
+        Template.create()
+                .template(List.of(template.createChatMessage()))
+                .responseFormat(
+                        ResponseFormatJsonObject.create()
+                                .type(ResponseFormatJsonObject.TypeEnum.JSON_OBJECT));
+var configWithTemplate = llmWithImageSupportConfig.withTemplateConfig(templatingConfig);
+
+var prompt =
+        new OrchestrationPrompt(
+                Message.system(
+                        "You are a language translator. Answer using the following JSON format: {\"language\": ..., \"translation\": ...}"));
+var response = client.chatCompletion(prompt, configWithTemplate).getContent();
+```
+Note that it is necessary to instruct the AI model in the prompt to actually return a JSON object. The result might not adhere exactly to the given JSON format, but it will be a JSON object.
+
+
+### JSON_SCHEMA
+
+If you want the response to not only consist of valid JSON but additionally adhere to a specific JSON schema, you can use `JSON_SCHEMA`. In order to do that, add a JSON schema to the configuration as shown below and the response will adhere to the given schema.
+
+```java
+var template = Message.user("Whats '%s' in German?".formatted(word));
+var schema =
+        Map.of(
+                "type",
+                "object",
+                "properties",
+                Map.of(
+                        "language", Map.of("type", "string"),
+                        "translation", Map.of("type", "string")),
+                "required",
+                List.of("language", "translation"),
+                "additionalProperties",
+                false);
+
+// Note, that we plan to add more convenient ways to add a JSON schema in the future.
+var templatingConfig =
+        Template.create()
+                .template(List.of(template.createChatMessage()))
+                .responseFormat(
+                        ResponseFormatJsonSchema.create()
+                                .type(ResponseFormatJsonSchema.TypeEnum.JSON_SCHEMA)
+                                .jsonSchema(
+                                        ResponseFormatJsonSchemaJsonSchema.create()
+                                                .name("translation_response")
+                                                .schema(schema)
+                                                .strict(true)
+                                                .description("Output schema for language translation.")));
+var configWithTemplate = llmWithImageSupportConfig.withTemplateConfig(templatingConfig);
+
+var prompt = new OrchestrationPrompt(Message.system("You are a language translator."));
+var response = client.chatCompletion(prompt, configWithTemplate).getContent();
+```
+
+Please find [an example in our Spring Boot application](../../sample-code/spring-app/src/main/java/com/sap/ai/sdk/app/services/OrchestrationService.java).
+
 ## Set model parameters
 
 Change your LLM configuration to add model parameters:
 
@@ -16,6 +16,7 @@
 - Orchestration:
   - [Add `LlamaGuardFilter`](https://github.com/SAP/ai-sdk-java/tree/main/docs/guides/ORCHESTRATION_CHAT_COMPLETION.md#chat-completion-filter).
   - [Convenient methods to create messages containing images and multiple text inputs](https://github.com/SAP/ai-sdk-java/tree/main/docs/guides/ORCHESTRATION_CHAT_COMPLETION.md#add-images-and-multiple-text-inputs-to-a-message)
+  - [Enable setting the response format](https://github.com/SAP/ai-sdk-java/tree/main/docs/guides/ORCHESTRATION_CHAT_COMPLETION.md#set-a-response-format)
 
 ### 📈 Improvements
 
 
@@ -49,14 +49,15 @@ static TemplatingModuleConfig toTemplateModuleConfig(
      * To be fixed with https://github.tools.sap/AI/llm-orchestration/issues/662
      */
     val messages = template instanceof Template t ? t.getTemplate() : List.<ChatMessage>of();
+    val responseFormat = template instanceof Template t ? t.getResponseFormat() : null;
     val messagesWithPrompt = new ArrayList<>(messages);
     messagesWithPrompt.addAll(
         prompt.getMessages().stream().map(Message::createChatMessage).toList());
     if (messagesWithPrompt.isEmpty()) {
       throw new IllegalStateException(
           "A prompt is required. Pass at least one message or configure a template with messages or a template reference.");
     }
-    return Template.create().template(messagesWithPrompt);
+    return Template.create().template(messagesWithPrompt).responseFormat(responseFormat);
   }
 
   @Nonnull
 
@@ -44,9 +44,14 @@
 import com.sap.ai.sdk.orchestration.model.KeyValueListPair;
 import com.sap.ai.sdk.orchestration.model.LLMModuleResultSynchronous;
 import com.sap.ai.sdk.orchestration.model.LlamaGuard38b;
+import com.sap.ai.sdk.orchestration.model.ResponseFormatJsonObject;
+import com.sap.ai.sdk.orchestration.model.ResponseFormatJsonSchema;
+import com.sap.ai.sdk.orchestration.model.ResponseFormatJsonSchemaJsonSchema;
+import com.sap.ai.sdk.orchestration.model.ResponseFormatText;
 import com.sap.ai.sdk.orchestration.model.SearchDocumentKeyValueListPair;
 import com.sap.ai.sdk.orchestration.model.SearchSelectOptionEnum;
 import com.sap.ai.sdk.orchestration.model.SingleChatMessage;
+import com.sap.ai.sdk.orchestration.model.Template;
 import com.sap.cloud.sdk.cloudplatform.connectivity.ApacheHttpClient5Accessor;
 import com.sap.cloud.sdk.cloudplatform.connectivity.ApacheHttpClient5Cache;
 import com.sap.cloud.sdk.cloudplatform.connectivity.DefaultHttpDestination;
@@ -58,6 +63,7 @@
 import java.util.function.Function;
 import java.util.stream.Stream;
 import javax.annotation.Nonnull;
+import lombok.val;
 import org.apache.hc.client5.http.classic.HttpClient;
 import org.apache.hc.core5.http.ContentType;
 import org.apache.hc.core5.http.io.entity.InputStreamEntity;
@@ -734,46 +740,22 @@ void testMultiMessage() throws IOException {
             "Well, this image features the logo of SAP, a software company, set against a gradient blue background transitioning from light to dark. The main color in the image is blue.");
 
     assertThat(response).isNotNull();
-    assertThat(response.getRequestId()).isEqualTo("8d973a0d-c2cf-437b-a765-08d66bf446d8");
-    assertThat(response.getModuleResults()).isNotNull();
-    assertThat(response.getModuleResults().getTemplating()).hasSize(2);
-
     var llmResults = (LLMModuleResultSynchronous) response.getModuleResults().getLlm();
     assertThat(llmResults).isNotNull();
-    assertThat(llmResults.getId()).isEqualTo("chatcmpl-AyGx4yLYUH79TK81i21BaABoUpf4v");
-    assertThat(llmResults.getObject()).isEqualTo("chat.completion");
-    assertThat(llmResults.getCreated()).isEqualTo(1738928206);
-    assertThat(llmResults.getModel()).isEqualTo("gpt-4o-mini-2024-07-18");
-    assertThat(llmResults.getSystemFingerprint()).isEqualTo("fp_f3927aa00d");
     assertThat(llmResults.getChoices()).hasSize(1);
     assertThat(llmResults.getChoices().get(0).getMessage().getContent())
         .isEqualTo(
             "Well, this image features the logo of SAP, a software company, set against a gradient blue background transitioning from light to dark. The main color in the image is blue.");
     assertThat(llmResults.getChoices().get(0).getFinishReason()).isEqualTo("stop");
     assertThat(llmResults.getChoices().get(0).getMessage().getRole()).isEqualTo("assistant");
-    assertThat(llmResults.getChoices().get(0).getIndex()).isZero();
-    assertThat(llmResults.getUsage().getCompletionTokens()).isEqualTo(35);
-    assertThat(llmResults.getUsage().getPromptTokens()).isEqualTo(250);
-    assertThat(llmResults.getUsage().getTotalTokens()).isEqualTo(285);
-
     var orchestrationResult = (LLMModuleResultSynchronous) response.getOrchestrationResult();
-    assertThat(orchestrationResult).isNotNull();
-    assertThat(orchestrationResult.getId()).isEqualTo("chatcmpl-AyGx4yLYUH79TK81i21BaABoUpf4v");
-    assertThat(orchestrationResult.getObject()).isEqualTo("chat.completion");
-    assertThat(orchestrationResult.getCreated()).isEqualTo(1738928206);
-    assertThat(orchestrationResult.getModel()).isEqualTo("gpt-4o-mini-2024-07-18");
-    assertThat(orchestrationResult.getSystemFingerprint()).isEqualTo("fp_f3927aa00d");
     assertThat(orchestrationResult.getChoices()).hasSize(1);
     assertThat(orchestrationResult.getChoices().get(0).getMessage().getContent())
         .isEqualTo(
             "Well, this image features the logo of SAP, a software company, set against a gradient blue background transitioning from light to dark. The main color in the image is blue.");
     assertThat(orchestrationResult.getChoices().get(0).getFinishReason()).isEqualTo("stop");
     assertThat(orchestrationResult.getChoices().get(0).getMessage().getRole())
         .isEqualTo("assistant");
-    assertThat(orchestrationResult.getChoices().get(0).getIndex()).isZero();
-    assertThat(orchestrationResult.getUsage().getCompletionTokens()).isEqualTo(35);
-    assertThat(orchestrationResult.getUsage().getPromptTokens()).isEqualTo(250);
-    assertThat(orchestrationResult.getUsage().getTotalTokens()).isEqualTo(285);
 
     try (var requestInputStream = fileLoader.apply("multiMessageRequest.json")) {
       final String requestBody = new String(requestInputStream.readAllBytes());
@@ -782,4 +764,121 @@ void testMultiMessage() throws IOException {
               .withRequestBody(equalToJson(requestBody)));
     }
   }
+
+  /**
+   * Sends a chat completion request whose template carries a {@code JSON_SCHEMA} response format
+   * and checks the outcome against the stubbed server.
+   *
+   * <p>The content of the stubbed {@code jsonSchemaResponse.json} must be returned as the message
+   * content, and the request body that was sent must match the {@code jsonSchemaRequest.json}
+   * fixture.
+   *
+   * @throws IOException if the expected request fixture cannot be read
+   */
+  @Test
+  void testResponseObjectJsonSchema() throws IOException {
+    stubFor(
+        post(anyUrl())
+            .willReturn(
+                aResponse()
+                    .withBodyFile("jsonSchemaResponse.json")
+                    .withHeader("Content-Type", "application/json")));
+
+    val llmConfig = new OrchestrationModuleConfig().withLlmConfig(GPT_4O_MINI);
+
+    val template = Message.user("Whats 'apple' in German?");
+    // JSON schema of the expected answer, expressed as nested maps.
+    val schema =
+        Map.of(
+            "type",
+            "object",
+            "properties",
+            Map.of(
+                "language", Map.of("type", "string"),
+                "translation", Map.of("type", "string")),
+            "required",
+            List.of("language", "translation"),
+            "additionalProperties",
+            false);
+
+    val templatingConfig =
+        Template.create()
+            .template(List.of(template.createChatMessage()))
+            .responseFormat(
+                ResponseFormatJsonSchema.create()
+                    .type(ResponseFormatJsonSchema.TypeEnum.JSON_SCHEMA)
+                    .jsonSchema(
+                        ResponseFormatJsonSchemaJsonSchema.create()
+                            .name("translation_response")
+                            .schema(schema)
+                            .strict(true)
+                            .description("Output schema for language translation.")));
+    val configWithTemplate = llmConfig.withTemplateConfig(templatingConfig);
+
+    val prompt = new OrchestrationPrompt(Message.system("You are a language translator."));
+
+    final var message = client.chatCompletion(prompt, configWithTemplate).getContent();
+    assertThat(message).isEqualTo("{\"translation\":\"Apfel\",\"language\":\"German\"}");
+
+    // The serialized request must equal the recorded fixture.
+    try (var requestInputStream = fileLoader.apply("jsonSchemaRequest.json")) {
+      final String request = new String(requestInputStream.readAllBytes());
+      verify(postRequestedFor(anyUrl()).withRequestBody(equalToJson(request)));
+    }
+  }
+
+  /**
+   * Requests a chat completion with the {@code JSON_OBJECT} response format set on the template,
+   * then checks the returned content and the request body that was sent.
+   *
+   * @throws IOException if the expected request fixture cannot be read
+   */
+  @Test
+  void testResponseObjectJsonObject() throws IOException {
+    val stubbedResponse =
+        aResponse()
+            .withBodyFile("jsonObjectResponse.json")
+            .withHeader("Content-Type", "application/json");
+    stubFor(post(anyUrl()).willReturn(stubbedResponse));
+
+    val jsonObjectFormat =
+        ResponseFormatJsonObject.create().type(ResponseFormatJsonObject.TypeEnum.JSON_OBJECT);
+    val userMessage = Message.user("What is 'apple' in German?");
+    val templateWithFormat =
+        Template.create()
+            .template(List.of(userMessage.createChatMessage()))
+            .responseFormat(jsonObjectFormat);
+    val config =
+        new OrchestrationModuleConfig()
+            .withLlmConfig(GPT_4O_MINI)
+            .withTemplateConfig(templateWithFormat);
+
+    val systemMessage =
+        Message.system(
+            "You are a language translator. Answer using the following JSON format: {\"language\": ..., \"translation\": ...}");
+    val systemPrompt = new OrchestrationPrompt(systemMessage);
+
+    val content = client.chatCompletion(systemPrompt, config).getContent();
+    assertThat(content).isEqualTo("{\"language\": \"German\", \"translation\": \"Apfel\"}");
+
+    // Compare the request that was actually sent with the recorded fixture.
+    try (var expectedRequestStream = fileLoader.apply("jsonObjectRequest.json")) {
+      val expectedRequest = new String(expectedRequestStream.readAllBytes());
+      verify(postRequestedFor(anyUrl()).withRequestBody(equalToJson(expectedRequest)));
+    }
+  }
+
+  /**
+   * Requests a chat completion with the {@code TEXT} response format set explicitly on the
+   * template, then checks the returned content and the request body that was sent.
+   *
+   * @throws IOException if the expected request fixture cannot be read
+   */
+  @Test
+  void testResponseObjectText() throws IOException {
+    val stubbedResponse =
+        aResponse()
+            .withBodyFile("responseFormatTextResponse.json")
+            .withHeader("Content-Type", "application/json");
+    stubFor(post(anyUrl()).willReturn(stubbedResponse));
+
+    val textFormat = ResponseFormatText.create().type(ResponseFormatText.TypeEnum.TEXT);
+    val userMessage = Message.user("What is 'apple' in German?");
+    val templateWithFormat =
+        Template.create()
+            .template(List.of(userMessage.createChatMessage()))
+            .responseFormat(textFormat);
+    val config =
+        new OrchestrationModuleConfig()
+            .withLlmConfig(GPT_4O_MINI)
+            .withTemplateConfig(templateWithFormat);
+
+    val systemMessage = Message.system("You are a language translator. Answer using JSON.");
+    val systemPrompt = new OrchestrationPrompt(systemMessage);
+
+    val expectedContent =
+        "```json\n{\n  \"word\": \"apple\",\n  \"translation\": \"Apfel\",\n  \"language\": \"German\"\n}\n```";
+    val content = client.chatCompletion(systemPrompt, config).getContent();
+    assertThat(content).isEqualTo(expectedContent);
+
+    // Compare the request that was actually sent with the recorded fixture.
+    try (var expectedRequestStream = fileLoader.apply("responseFormatTextRequest.json")) {
+      val expectedRequest = new String(expectedRequestStream.readAllBytes());
+      verify(postRequestedFor(anyUrl()).withRequestBody(equalToJson(expectedRequest)));
+    }
+  }
 }
@@ -0,0 +1,59 @@
+{
+  "request_id": "f353a729-3391-4cec-bbf9-7ab39d34ebc1",
+  "module_results": {
+    "templating": [
+      {
+        "role": "user",
+        "content": "What is 'apple' in German?"
+      },
+      {
+        "role": "system",
+        "content": "You are a language translator. Answer using the following JSON format: {\"language\": ..., \"translation\": ...}"
+      }
+    ],
+    "llm": {
+      "id": "chatcmpl-Azm2iclgMiLcQHP3cGQANArkxoiGx",
+      "object": "chat.completion",
+      "created": 1739286048,
+      "model": "gpt-4o-mini-2024-07-18",
+      "system_fingerprint": "fp_f3927aa00d",
+      "choices": [
+        {
+          "index": 0,
+          "message": {
+            "role": "assistant",
+            "content": "{\"language\": \"German\", \"translation\": \"Apfel\"}"
+          },
+          "finish_reason": "stop"
+        }
+      ],
+      "usage": {
+        "completion_tokens": 13,
+        "prompt_tokens": 41,
+        "total_tokens": 54
+      }
+    }
+  },
+  "orchestration_result": {
+    "id": "chatcmpl-Azm2iclgMiLcQHP3cGQANArkxoiGx",
+    "object": "chat.completion",
+    "created": 1739286048,
+    "model": "gpt-4o-mini-2024-07-18",
+    "system_fingerprint": "fp_f3927aa00d",
+    "choices": [
+      {
+        "index": 0,
+        "message": {
+          "role": "assistant",
+          "content": "{\"language\": \"German\", \"translation\": \"Apfel\"}"
+        },
+        "finish_reason": "stop"
+      }
+    ],
+    "usage": {
+      "completion_tokens": 13,
+      "prompt_tokens": 41,
+      "total_tokens": 54
+    }
+  }
+}