Azure-Samples
diff --git a/app/backend/src/main/java/com/microsoft/openai/samples/rag/Application.java b/app/backend/src/main/java/com/microsoft/openai/samples/rag/Application.java
Lines changed: 15 additions & 0 deletions
diff --git a/app/backend/src/main/java/com/microsoft/openai/samples/rag/approaches/RAGApproachFactorySpringBootImpl.java b/app/backend/src/main/java/com/microsoft/openai/samples/rag/approaches/RAGApproachFactorySpringBootImpl.java
Lines changed: 18 additions & 7 deletions
diff --git a/app/backend/src/main/java/com/microsoft/openai/samples/rag/ask/approaches/semantickernel/JavaSemanticKernelChainsApproach.java b/app/backend/src/main/java/com/microsoft/openai/samples/rag/ask/approaches/semantickernel/JavaSemanticKernelChainsApproach.java
Lines changed: 0 additions & 3 deletions
diff --git a/app/backend/src/main/java/com/microsoft/openai/samples/rag/chat/approaches/semantickernel/JavaSemanticKernelChainsChatApproach.java b/app/backend/src/main/java/com/microsoft/openai/samples/rag/chat/approaches/semantickernel/JavaSemanticKernelChainsChatApproach.java
Lines changed: 140 additions & 0 deletions
diff --git a/app/backend/src/main/java/com/microsoft/openai/samples/rag/chat/approaches/semantickernel/JavaSemanticKernelWithMemoryChatApproach.java b/app/backend/src/main/java/com/microsoft/openai/samples/rag/chat/approaches/semantickernel/JavaSemanticKernelWithMemoryChatApproach.java
Lines changed: 168 additions & 0 deletions
@@ -4,6 +4,9 @@
 import org.slf4j.LoggerFactory;
 import org.springframework.boot.SpringApplication;
 import org.springframework.boot.autoconfigure.SpringBootApplication;
+import org.springframework.context.annotation.Bean;
+import org.springframework.web.servlet.config.annotation.CorsRegistry;
+import org.springframework.web.servlet.config.annotation.WebMvcConfigurer;
 
 @SpringBootApplication
 public class Application {
@@ -14,4 +17,16 @@ public static void main(String[] args) {
         LOG.info("Application profile from system property is [{}]", System.getProperty("spring.profiles.active"));
         new SpringApplication(Application.class).run(args);
     }
+
+    @Bean
+    public WebMvcConfigurer corsConfigurer() {
+        return new WebMvcConfigurer() {
+            @Override
+            public void addCorsMappings(CorsRegistry registry) {
+                registry
+                        .addMapping("/api/**")
+                        .allowedOrigins("http://localhost:8080");
+            }
+        };
+    }
 }
@@ -2,9 +2,11 @@
 
 import com.microsoft.openai.samples.rag.ask.approaches.PlainJavaAskApproach;
 import com.microsoft.openai.samples.rag.ask.approaches.semantickernel.JavaSemanticKernelChainsApproach;
-import com.microsoft.openai.samples.rag.ask.approaches.semantickernel.JavaSemanticKernelWithMemoryApproach;
 import com.microsoft.openai.samples.rag.ask.approaches.semantickernel.JavaSemanticKernelPlannerApproach;
+import com.microsoft.openai.samples.rag.ask.approaches.semantickernel.JavaSemanticKernelWithMemoryApproach;
 import com.microsoft.openai.samples.rag.chat.approaches.PlainJavaChatApproach;
+import com.microsoft.openai.samples.rag.chat.approaches.semantickernel.JavaSemanticKernelChainsChatApproach;
+import com.microsoft.openai.samples.rag.chat.approaches.semantickernel.JavaSemanticKernelWithMemoryChatApproach;
 import org.springframework.context.ApplicationContext;
 import org.springframework.context.ApplicationContextAware;
 import org.springframework.stereotype.Component;
@@ -27,18 +29,27 @@ public class RAGApproachFactorySpringBootImpl implements RAGApproachFactory, App
     @Override
     public RAGApproach createApproach(String approachName, RAGType ragType, RAGOptions ragOptions) {
 
-        if (ragType.equals(RAGType.CHAT) && JAVA_OPENAI_SDK.equals(approachName)) {
-            return applicationContext.getBean(PlainJavaChatApproach.class);
-
+        if (ragType.equals(RAGType.CHAT)) {
+            if (JAVA_SEMANTIC_KERNEL.equals(approachName)) {
+                return applicationContext.getBean(JavaSemanticKernelWithMemoryChatApproach.class);
+            } else if (
+                    JAVA_SEMANTIC_KERNEL_PLANNER.equals(approachName) &&
+                            ragOptions != null &&
+                            ragOptions.getSemantickKernelMode() != null &&
+                            ragOptions.getSemantickKernelMode() == SemanticKernelMode.chains) {
+                return applicationContext.getBean(JavaSemanticKernelChainsChatApproach.class);
+            } else {
+                return applicationContext.getBean(PlainJavaChatApproach.class);
+            }
         } else if (ragType.equals(RAGType.ASK)) {
             if (JAVA_OPENAI_SDK.equals(approachName))
                 return applicationContext.getBean(PlainJavaAskApproach.class);
             else if (JAVA_SEMANTIC_KERNEL.equals(approachName))
                 return applicationContext.getBean(JavaSemanticKernelWithMemoryApproach.class);
             else if (JAVA_SEMANTIC_KERNEL_PLANNER.equals(approachName) && ragOptions.getSemantickKernelMode() != null && ragOptions.getSemantickKernelMode() == SemanticKernelMode.planner)
-                      return  applicationContext.getBean(JavaSemanticKernelPlannerApproach.class);
-                    else if(JAVA_SEMANTIC_KERNEL_PLANNER.equals(approachName) && ragOptions != null && ragOptions.getSemantickKernelMode() != null && ragOptions.getSemantickKernelMode() == SemanticKernelMode.chains)
-                        return applicationContext.getBean(JavaSemanticKernelChainsApproach.class);
+                return applicationContext.getBean(JavaSemanticKernelPlannerApproach.class);
+            else if (JAVA_SEMANTIC_KERNEL_PLANNER.equals(approachName) && ragOptions != null && ragOptions.getSemantickKernelMode() != null && ragOptions.getSemantickKernelMode() == SemanticKernelMode.chains)
+                return applicationContext.getBean(JavaSemanticKernelChainsApproach.class);
 
         }
         //if this point is reached then the combination of approach and rag type is not supported
 
@@ -127,7 +127,4 @@ private Kernel buildSemanticKernel( RAGOptions options) {
 
         return kernel;
     }
-
-
-
 }
@@ -0,0 +1,140 @@
+package com.microsoft.openai.samples.rag.chat.approaches.semantickernel;
+
+import com.azure.ai.openai.OpenAIAsyncClient;
+import com.microsoft.openai.samples.rag.approaches.ContentSource;
+import com.microsoft.openai.samples.rag.approaches.RAGApproach;
+import com.microsoft.openai.samples.rag.approaches.RAGOptions;
+import com.microsoft.openai.samples.rag.approaches.RAGResponse;
+import com.microsoft.openai.samples.rag.ask.approaches.semantickernel.CognitiveSearchPlugin;
+import com.microsoft.openai.samples.rag.common.ChatGPTConversation;
+import com.microsoft.openai.samples.rag.common.ChatGPTUtils;
+import com.microsoft.openai.samples.rag.proxy.CognitiveSearchProxy;
+import com.microsoft.openai.samples.rag.proxy.OpenAIProxy;
+import com.microsoft.semantickernel.Kernel;
+import com.microsoft.semantickernel.SKBuilders;
+import com.microsoft.semantickernel.chatcompletion.ChatCompletion;
+import com.microsoft.semantickernel.orchestration.SKContext;
+import org.slf4j.Logger;
+import org.slf4j.LoggerFactory;
+import org.springframework.beans.factory.annotation.Value;
+import org.springframework.stereotype.Component;
+
+import java.io.OutputStream;
+import java.util.Arrays;
+import java.util.Collections;
+import java.util.List;
+import java.util.Objects;
+import java.util.stream.Collectors;
+
+/**
+ * Chat retrieve-then-read implementation built on the Semantic Kernel framework, chaining two kernel functions.
+ * It extracts the last user question from the conversation and passes it to the "Search" function of the "InformationFinder" skill (CognitiveSearchPlugin).
+ * It then passes the search result as "sources" and the question as "input" to the "AnswerQuestion" function of the "RAG" skill.
+ * Only the last user question is used; earlier messages of the conversation are not passed to either function. Streaming is not implemented (runStreaming is a no-op).
+ */
+@Component
+public class JavaSemanticKernelChainsChatApproach implements RAGApproach<ChatGPTConversation, RAGResponse> {
+
+    private static final Logger LOGGER = LoggerFactory.getLogger(JavaSemanticKernelChainsChatApproach.class);
+    private static final String PLAN_PROMPT = """
+            Take the input as a question and answer it finding any information needed
+            """;
+    private final CognitiveSearchProxy cognitiveSearchProxy;
+
+    private final OpenAIProxy openAIProxy;
+
+    private final OpenAIAsyncClient openAIAsyncClient;
+
+    @Value("${openai.chatgpt.deployment}")
+    private String gptChatDeploymentModelId;
+
+    public JavaSemanticKernelChainsChatApproach(CognitiveSearchProxy cognitiveSearchProxy, OpenAIAsyncClient openAIAsyncClient, OpenAIProxy openAIProxy) {
+        this.cognitiveSearchProxy = cognitiveSearchProxy;
+        this.openAIAsyncClient = openAIAsyncClient;
+        this.openAIProxy = openAIProxy;
+    }
+
+    /**
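+     * @param questionOrConversation the chat conversation; only its last user question is used
+     * @param options RAG options handed to the CognitiveSearchPlugin when the kernel is built
+     * @return the answer produced by the "AnswerQuestion" function, together with the sources parsed from the search result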
+     */
+    @Override
+    public RAGResponse run(ChatGPTConversation questionOrConversation, RAGOptions options) {
+
+        String question = ChatGPTUtils.getLastUserQuestion(questionOrConversation.getMessages());
+
+        Kernel semanticKernel = buildSemanticKernel(options);
+
+        SKContext searchContext =
+                semanticKernel.runAsync(
+                        question,
+                        semanticKernel.getSkill("InformationFinder").getFunction("Search", null)).block();
+
+        var sources = formSourcesList(searchContext.getResult());
+
+        var answerVariables = SKBuilders.variables()
+                .withVariable("sources", searchContext.getResult())
+                .withVariable("input", question)
+                .build();
+
+        SKContext answerExecutionContext =
+                semanticKernel.runAsync(answerVariables,
+                        semanticKernel.getSkill("RAG").getFunction("AnswerQuestion", null)).block();
+        return new RAGResponse.Builder()
+                .prompt("Prompt is managed by Semantic Kernel")
+                .answer(answerExecutionContext.getResult())
+                .sources(sources)
+                .sourcesAsText(searchContext.getResult())
+                .question(question)
+                .build();
+    }
+
+    @Override
+    public void runStreaming(
+            ChatGPTConversation questionOrConversation,
+            RAGOptions options,
+            OutputStream outputStream) {
+    }
+
+    private List<ContentSource> formSourcesList(String result) {
+        if (result == null) {
+            return Collections.emptyList();
+        }
+        return Arrays.stream(result
+                        .split("\n"))
+                .map(source -> {
+                    String[] split = source.split(":", 2);
+                    if (split.length >= 2) {
+                        var sourceName = split[0].trim();
+                        var sourceContent = split[1].trim();
+                        return new ContentSource(sourceName, sourceContent);
+                    } else {
+                        return null;
+                    }
+                })
+                .filter(Objects::nonNull)
+                .collect(Collectors.toList());
+    }
+
+    private Kernel buildSemanticKernel(RAGOptions options) {
+        Kernel kernel = SKBuilders.kernel()
+                .withDefaultAIService(SKBuilders.chatCompletion()
+                        .withModelId(gptChatDeploymentModelId)
+                        .withOpenAIClient(this.openAIAsyncClient)
+                        .build())
+                .build();
+
+        kernel.importSkill(new CognitiveSearchPlugin(this.cognitiveSearchProxy, this.openAIProxy, options), "InformationFinder");
+
+        kernel.importSkillFromResources(
+                "semantickernel/Plugins",
+                "RAG",
+                "AnswerQuestion",
+                null
+        );
+
+        return kernel;
+    }
+
+}
@@ -0,0 +1,168 @@
+package com.microsoft.openai.samples.rag.chat.approaches.semantickernel;
+
+import com.azure.ai.openai.OpenAIAsyncClient;
+import com.azure.core.credential.TokenCredential;
+import com.azure.search.documents.SearchAsyncClient;
+import com.azure.search.documents.SearchDocument;
+import com.microsoft.openai.samples.rag.approaches.ContentSource;
+import com.microsoft.openai.samples.rag.approaches.RAGApproach;
+import com.microsoft.openai.samples.rag.approaches.RAGOptions;
+import com.microsoft.openai.samples.rag.approaches.RAGResponse;
+import com.microsoft.openai.samples.rag.ask.approaches.semantickernel.memory.CustomAzureCognitiveSearchMemoryStore;
+import com.microsoft.openai.samples.rag.common.ChatGPTConversation;
+import com.microsoft.openai.samples.rag.common.ChatGPTUtils;
+import com.microsoft.semantickernel.Kernel;
+import com.microsoft.semantickernel.SKBuilders;
+import com.microsoft.semantickernel.ai.embeddings.Embedding;
+import com.microsoft.semantickernel.memory.MemoryQueryResult;
+import com.microsoft.semantickernel.memory.MemoryRecord;
+import com.microsoft.semantickernel.orchestration.SKContext;
+import org.slf4j.Logger;
+import org.slf4j.LoggerFactory;
+import org.springframework.beans.factory.annotation.Value;
+import org.springframework.stereotype.Component;
+import reactor.core.publisher.Mono;
+
+import java.io.OutputStream;
+import java.util.List;
+import java.util.function.Function;
+import java.util.stream.Collectors;
+
+/**
+ * Answers the last user question of a chat conversation using the Semantic Kernel framework (chat counterpart of JavaSemanticKernelWithMemoryApproach):
+ * 1. The memory abstraction is used for vector search. It uses Azure Cognitive Search as the memory store.
+ * 2. A semantic function (RAG / AnswerQuestion) answers the question using the sources returned by the memory search.
+ */
+@Component
+public class JavaSemanticKernelWithMemoryChatApproach implements RAGApproach<ChatGPTConversation, RAGResponse> {
+    private static final Logger LOGGER = LoggerFactory.getLogger(JavaSemanticKernelWithMemoryChatApproach.class);
+    private final TokenCredential tokenCredential;
+    private final OpenAIAsyncClient openAIAsyncClient;
+
+    private final SearchAsyncClient searchAsyncClient;
+
+    private final String EMBEDDING_FIELD_NAME = "embedding";
+
+    @Value("${cognitive.search.service}")
+    String searchServiceName;
+    @Value("${cognitive.search.index}")
+    String indexName;
+    @Value("${openai.chatgpt.deployment}")
+    private String gptChatDeploymentModelId;
+
+    @Value("${openai.embedding.deployment}")
+    private String embeddingDeploymentModelId;
+
+    public JavaSemanticKernelWithMemoryChatApproach(TokenCredential tokenCredential, OpenAIAsyncClient openAIAsyncClient, SearchAsyncClient searchAsyncClient) {
+        this.tokenCredential = tokenCredential;
+        this.openAIAsyncClient = openAIAsyncClient;
+        this.searchAsyncClient = searchAsyncClient;
+    }
+
+    @Override
+    public RAGResponse run(ChatGPTConversation questionOrConversation, RAGOptions options) {
+
+        String question = ChatGPTUtils.getLastUserQuestion(questionOrConversation.getMessages());
+
+        //Build semantic kernel with Azure Cognitive Search as memory store. AnswerQuestion skill is imported from resources.
+        Kernel semanticKernel = buildSemanticKernel(options);
+
+        /**
+         * Use semantic kernel built-in memory.searchAsync. It uses OpenAI to generate embeddings for the provided question.
+         * Question embeddings are provided to cognitive search via search options.
+         */
+        List<MemoryQueryResult> memoryResult = semanticKernel.getMemory().searchAsync(
+                        indexName,
+                        question,
+                        options.getTop(),
+                        0.5f,
+                        false)
+                .block();
+
+        LOGGER.info("Total {} sources found in cognitive vector store for search query[{}]", memoryResult.size(), question);
+
+        String sources = buildSourcesText(memoryResult);
+        List<ContentSource> sourcesList = buildSources(memoryResult);
+
+        SKContext skcontext = SKBuilders.context().build()
+                .setVariable("sources", sources)
+                .setVariable("input", question);
+
+
+        Mono<SKContext> result = semanticKernel.getFunction("RAG", "AnswerQuestion").invokeAsync(skcontext);
+
+        return new RAGResponse.Builder()
+                //.prompt(plan.toPlanString())
+                .prompt("placeholders for prompt")
+                .answer(result.block().getResult())
+                .sources(sourcesList)
+                .sourcesAsText(sources)
+                .question(question)
+                .build();
+
+    }
+
+    @Override
+    public void runStreaming(ChatGPTConversation questionOrConversation, RAGOptions options, OutputStream outputStream) {
+        throw new IllegalStateException("Streaming not supported for this approach");
+    }
+
+    private List<ContentSource> buildSources(List<MemoryQueryResult> memoryResult) {
+        return memoryResult
+                .stream()
+                .map(result -> {
+                    return new ContentSource(
+                            result.getMetadata().getId(),
+                            result.getMetadata().getText()
+                    );
+                })
+                .collect(Collectors.toList());
+    }
+
+    private String buildSourcesText(List<MemoryQueryResult> memoryResult) {
+        StringBuilder sourcesContentBuffer = new StringBuilder();
+        memoryResult.stream().forEach(memory -> {
+            sourcesContentBuffer.append(memory.getMetadata().getId())
+                    .append(": ")
+                    .append(memory.getMetadata().getText().replace("\n", ""))
+                    .append("\n");
+        });
+        return sourcesContentBuffer.toString();
+    }
+
+    private Kernel buildSemanticKernel(RAGOptions options) {
+        var kernelWithACS = SKBuilders.kernel()
+                .withMemoryStorage(
+                        new CustomAzureCognitiveSearchMemoryStore("https://%s.search.windows.net".formatted(searchServiceName),
+                                tokenCredential,
+                                this.searchAsyncClient,
+                                this.EMBEDDING_FIELD_NAME,
+                                buildCustomMemoryMapper()))
+                .withDefaultAIService(SKBuilders.textEmbeddingGeneration()
+                        .withOpenAIClient(openAIAsyncClient)
+                        .withModelId(embeddingDeploymentModelId)
+                        .build())
+                .withDefaultAIService(SKBuilders.chatCompletion()
+                        .withModelId(gptChatDeploymentModelId)
+                        .withOpenAIClient(this.openAIAsyncClient)
+                        .build())
+                .build();
+
+        kernelWithACS.importSkillFromResources("semantickernel/Plugins", "RAG", "AnswerQuestion", null);
+        return kernelWithACS;
+    }
+
+    private Function<SearchDocument, MemoryRecord> buildCustomMemoryMapper() {
+        return searchDocument -> {
+            return MemoryRecord.localRecord(
+                    (String) searchDocument.get("sourcepage"),
+                    (String) searchDocument.get("content"),
+                    "chunked text from original source",
+                    new Embedding((List<Float>) searchDocument.get(EMBEDDING_FIELD_NAME)),
+                    (String) searchDocument.get("category"),
+                    (String) searchDocument.get("id"),
+                    null);
+
+        };
+    }
+}
Original file line number	Diff line number	Diff line change
`@@ -127,7 +127,4 @@ private Kernel buildSemanticKernel( RAGOptions options) {`
`127`	`127`
`128`	`128`	`return kernel;`
`129`	`129`	`}`
`130`		`-`
`131`		`-`
`132`		`-`
`133`	`130`	`}`