feat: 🖼️ SDXL prompt optimizer feature (#101)

philippart-s · web-flow · commit 0917ef2867ed · 2025-06-24T09:07:15.000+02:00
* feat: 🖼️ SDXL prompt optimizer feature

* fix: 🐛 Typo on class name

* fix: 🐛 Typo on user prompt
diff --git a/ai/ai-endpoints/README.md b/ai/ai-endpoints/README.md
@@ -15,6 +15,7 @@ Don't hesitate to use the source code and give us feedback.
 
 ### ☕️ Java demos ☕️
 
+  - [Function calling with LangChain4J](./function-calling-langchain4j)
   - [Simple Structured Output](./structured-output-langchain4j/)
   - [Natural Language Processing](./java-nlp)
   - [Chatbot with LangChain4j](./java-langchain4j-chatbot/): blocking mode, streaming mode and RAG mode.
diff --git a/ai/ai-endpoints/function-calling-langchain4j/ImageGeneration.java b/ai/ai-endpoints/function-calling-langchain4j/ImageGeneration.java
@@ -0,0 +1,103 @@
+///usr/bin/env jbang "$0" "$@" ; exit $?
+//JAVA 24+
+//PREVIEW
+//DEPS dev.langchain4j:langchain4j:1.0.1 dev.langchain4j:langchain4j-mistral-ai:1.0.1-beta6
+
+import dev.langchain4j.agent.tool.P;
+import dev.langchain4j.agent.tool.Tool;
+import dev.langchain4j.memory.ChatMemory;
+import dev.langchain4j.memory.chat.MessageWindowChatMemory;
+import dev.langchain4j.model.chat.ChatModel;
+import dev.langchain4j.model.mistralai.MistralAiChatModel;
+import dev.langchain4j.service.AiServices;
+import dev.langchain4j.service.SystemMessage;
+import dev.langchain4j.service.UserMessage;
+
+import java.io.IOException;
+import java.net.URI;
+import java.net.http.HttpClient;
+import java.net.http.HttpRequest;
+import java.net.http.HttpResponse;
+import java.nio.file.Files;
+import java.nio.file.Path;
+import java.util.Scanner;
+
+class ImageGenTools {
+
+    @Tool("""
+    Tool to create an image with Stable Diffusion XL given a prompt and a negative prompt.
+    """)
+    void generateImage(@P("Prompt that explains the image") String prompt, @P("Negative prompt that explains what the image must not contains") String negativePrompt) throws IOException, InterruptedException {
+        System.out.println("Prompt: " + prompt);
+        System.out.println("Negative prompt: " + negativePrompt);
+
+        HttpRequest httpRequest = HttpRequest.newBuilder()
+                .uri(URI.create(System.getenv("OVH_AI_ENDPOINTS_SD_URL")))
+                .POST(HttpRequest.BodyPublishers.ofString("""
+                        {"prompt": "%s", 
+                         "negative_prompt": "%s"}
+                        """.formatted(prompt, negativePrompt)))
+                .header("accept", "application/octet-stream")
+                .header("Content-Type", "application/json")
+                .header("Authorization", "Bearer " + System.getenv("OVH_AI_ENDPOINTS_SDXL_ACCESS_TOKEN"))
+                .build();
+
+        HttpResponse<byte[]> response = HttpClient.newHttpClient()
+                .send(httpRequest, HttpResponse.BodyHandlers.ofByteArray());
+
+        System.out.println("SDXL status code: " + response.statusCode());
+        Files.write(Path.of("generated-image.jpeg"), response.body());
+    }
+}
+
+/// Chatbot definition: the system prompt asks the model to turn the user's description into a Stable Diffusion XL
+/// prompt and negative prompt, then call the `generateImage` tool; `chat` wraps the user's text in the user-message template.
+interface ChatBot {
+    @SystemMessage("""
+            Your are an expert of using the Stable Diffusion XL model.
+            The user explains in natural language what kind of image he wants.
+            You must do the following steps:
+              - Understand the user's request.
+              - Generate the two kinds of prompts for stable diffusion: the prompt and the negative prompt
+              - the prompts must be in english and detailed and optimized for the Stable Diffusion XL model. 
+              - once and only once you have this two prompts call the tool with the two prompts.
+            If asked about to create an image, you MUST call the `generateImage` function.
+            """)
+    @UserMessage("Create an image with stable diffusion XL following this description: {{userMessage}}")
+    String chat(String userMessage);
+}
+
+/// Entry point: builds the chat model, memory and image tool into a `ChatBot`, then runs a console loop until "exit" or end of input.
+void main() throws Exception {
+    // Main chatbot configuration, choose one of the available models on the AI Endpoints catalog (https://endpoints.ai.cloud.ovh.net/catalog)
+    ChatModel chatModel = MistralAiChatModel.builder()
+            .apiKey(System.getenv("OVH_AI_ENDPOINTS_ACCESS_TOKEN"))
+            .baseUrl(System.getenv("OVH_AI_ENDPOINTS_MODEL_URL"))
+            .modelName(System.getenv("OVH_AI_ENDPOINTS_MODEL_NAME"))
+            .logRequests(false)
+            .logResponses(false)
+            // To have more deterministic outputs, set temperature to 0.
+            .temperature(0.0)
+            .build();
+
+    // Keep the last 10 messages in memory so follow-up inputs can fine tune the SDXL prompt.
+    ChatMemory chatMemory = MessageWindowChatMemory.withMaxMessages(10);
+
+    // Build the chatbot thanks to LangChain4J AI Services mode
+    ChatBot chatBot = AiServices.builder(ChatBot.class)
+            .chatModel(chatModel)
+            .tools(new ImageGenTools())
+            .chatMemory(chatMemory)
+            .build();
+
+    // Conversation loop (enter "exit" to quit); hasNextLine() is false at end of input, so Ctrl-D or piped stdin ends the loop instead of throwing.
+    try (Scanner scanner = new Scanner(System.in)) {
+        while (true) {
+            System.out.print("Enter your message: ");
+            if (!scanner.hasNextLine()) break;
+            String userInput = scanner.nextLine();
+            if (userInput.equalsIgnoreCase("exit")) break;
+            System.out.println("Response: " + chatBot.chat(userInput));
+        }
+    }
+}
diff --git a/ai/ai-endpoints/function-calling-langchain4j/README.md b/ai/ai-endpoints/function-calling-langchain4j/README.md
@@ -0,0 +1,42 @@
+# Function Calling with LangChain4j and AI Endpoints
+
+## 🧰 Prerequisites 🧰
+
+  - Java 24+ installed (with preview mode enabled)
+  - AI Endpoints API token
+  - model to use: any of the LLM instruct models
+  - have the following environment variables created:
+    - OVH_AI_ENDPOINTS_ACCESS_TOKEN: the API token, see [documentation](https://help.ovhcloud.com/csm/en-gb-public-cloud-ai-endpoints-getting-started?id=kb_article_view&sysparm_article=KB0065401#generating-your-first-api-access-key) to know how to generate it
+    - OVH_AI_ENDPOINTS_MODEL_URL: URL of the model, see [AI Endpoints website](https://endpoints.ai.cloud.ovh.net/) to know how to get it.
+    - OVH_AI_ENDPOINTS_MODEL_NAME: model name, see [AI Endpoints website](https://endpoints.ai.cloud.ovh.net/) to know how to get it.
+    - OVH_AI_ENDPOINTS_SD_URL: URL of the Stable Diffusion XL endpoint that `ImageGeneration.java` calls to generate the image.
+    - OVH_AI_ENDPOINTS_SDXL_ACCESS_TOKEN: the API token sent as a bearer token to the Stable Diffusion XL endpoint.
+  - [JBang](https://www.jbang.dev/documentation/guide/latest/index.html) installed
+
+## ⚡️ How to use the project ⚡️
+
+  - run `jbang ImageGeneration.java` command
+  - explain your image with natural language
+  - see the result in the `generated-image.jpeg` file
+  - fine tune your prompt to get better results
+  - enter `exit` to quit the application
+
+## 🗺️ Architecture  🗺️
+
+```mermaid
+graph RL
+    subgraph User app
+        A[Chatbot]
+        D[ImageGenTools]
+   end
+   subgraph AI Endpoints
+        E[Stable Diffusion XL]
+        B[LLM Model]
+    end
+    A[Chatbot] -->| 1-Ask to create an image in natural language | B[LLM Model]
+    B -->| 2-Create a SDXL prompt + tool name | A
+    A -->| 3-Call generateImage | D[ImageGenTools] 
+    D -->| 4-Call SDXL with generated prompts | E[Stable Diffusion XL]
+    E -->| 5-Generated image | D
+    B -->| 6-Final response | A
+```