1+ import type { FastifyRequest , FastifyReply } from "fastify" ;
2+ import type { OpenaiRequestType } from "./type"
3+ import { getModelInfo } from "../../../../utils/get-model-info" ;
4+ import { embeddings } from "../../../../utils/embeddings" ;
5+ import { Document } from "langchain/document" ;
6+ import { BaseRetriever } from "@langchain/core/retrievers" ;
7+ import { DialoqbaseHybridRetrival } from "../../../../utils/hybrid" ;
8+ import { DialoqbaseVectorStore } from "../../../../utils/store" ;
9+ import { createChatModel } from "../bot/playground/chat.service" ;
10+ import { createChain } from "../../../../chain" ;
11+ import { openaiNonStreamResponse , openaiStreamResponse } from "./openai-response" ;
12+ import { groupOpenAiMessages } from "./other" ;
13+ import { nextTick } from "../../../../utils/nextTick" ;
14+
15+
16+ export const createChatCompletionHandler = async (
17+ request : FastifyRequest < OpenaiRequestType > ,
18+ reply : FastifyReply
19+ ) => {
20+ try {
21+ const {
22+ model,
23+ messages
24+ } = request . body ;
25+
26+ const prisma = request . server . prisma ;
27+
28+ const bot = await prisma . bot . findFirst ( {
29+ where : {
30+ OR : [
31+ {
32+ id : model
33+ } ,
34+ {
35+ publicId : model
36+ }
37+ ] ,
38+ user_id : request . user . is_admin ? undefined : request . user . user_id ,
39+ } ,
40+ } )
41+
42+ if ( ! bot ) {
43+ return reply . status ( 404 ) . send ( {
44+ error : {
45+ message : "Bot not found" ,
46+ type : "not_found" ,
47+ param : "model" ,
48+ code : "bot_not_found"
49+ }
50+ } ) ;
51+ }
52+
53+
54+ const embeddingInfo = await getModelInfo ( {
55+ prisma,
56+ model : bot . embedding ,
57+ type : "embedding" ,
58+ } ) ;
59+
60+ if ( ! embeddingInfo ) {
61+ return reply . status ( 400 ) . send ( {
62+ error : {
63+ message : "Embedding not found" ,
64+ type : "not_found" ,
65+ param : "embedding" ,
66+ code : "embedding_not_found"
67+ }
68+ } ) ;
69+ }
70+
71+
72+ const embeddingModel = embeddings (
73+ embeddingInfo . model_provider ! . toLowerCase ( ) ,
74+ embeddingInfo . model_id ,
75+ embeddingInfo ?. config
76+ ) ;
77+
78+ const modelinfo = await getModelInfo ( {
79+ prisma,
80+ model : bot . model ,
81+ type : "chat" ,
82+ } ) ;
83+
84+ if ( ! modelinfo ) {
85+ return reply . status ( 400 ) . send ( {
86+ error : {
87+ message : "Model not found" ,
88+ type : "not_found" ,
89+ param : "model" ,
90+ code : "model_not_found"
91+ }
92+ } ) ;
93+ }
94+
95+ const botConfig = ( modelinfo . config as { } ) || { } ;
96+ let retriever : BaseRetriever ;
97+ let resolveWithDocuments : ( value : Document [ ] ) => void ;
98+
99+ if ( bot . use_hybrid_search ) {
100+ retriever = new DialoqbaseHybridRetrival ( embeddingModel , {
101+ botId : bot . id ,
102+ sourceId : null ,
103+ callbacks : [
104+ {
105+ handleRetrieverEnd ( documents ) {
106+ resolveWithDocuments ( documents ) ;
107+ } ,
108+ } ,
109+ ] ,
110+ } ) ;
111+ } else {
112+ const vectorstore = await DialoqbaseVectorStore . fromExistingIndex (
113+ embeddingModel ,
114+ {
115+ botId : bot . id ,
116+ sourceId : null ,
117+ }
118+ ) ;
119+
120+ retriever = vectorstore . asRetriever ( {
121+ } ) ;
122+ }
123+
124+ const streamedModel = createChatModel (
125+ bot ,
126+ bot . temperature ,
127+ botConfig ,
128+ true
129+ ) ;
130+ const nonStreamingModel = createChatModel ( bot , bot . temperature , botConfig ) ;
131+
132+ const chain = createChain ( {
133+ llm : streamedModel ,
134+ question_llm : nonStreamingModel ,
135+ question_template : bot . questionGeneratorPrompt ,
136+ response_template : bot . qaPrompt ,
137+ retriever,
138+ } ) ;
139+
140+ if ( ! request . body . stream ) {
141+ const res = await chain . invoke ( {
142+ question : messages [ messages . length - 1 ] . content ,
143+ chat_history : groupOpenAiMessages (
144+ messages
145+ ) ,
146+ } )
147+
148+
149+ return reply . status ( 200 ) . send ( openaiNonStreamResponse (
150+ res ,
151+ bot . name
152+ ) )
153+ }
154+
155+ const stream = await chain . stream ( {
156+ question : messages [ messages . length - 1 ] . content ,
157+ chat_history : groupOpenAiMessages (
158+ messages
159+ ) ,
160+ } )
161+ reply . raw . setHeader ( "Content-Type" , "text/event-stream" ) ;
162+
163+ for await ( const token of stream ) {
164+ reply . sse ( {
165+ data : openaiStreamResponse (
166+ token || "" ,
167+ bot . name
168+ )
169+ } ) ;
170+ }
171+ reply . sse ( {
172+ data : "[DONE]\n\n"
173+ } )
174+ await nextTick ( ) ;
175+ return reply . raw . end ( ) ;
176+ } catch ( error ) {
177+ console . log ( error )
178+ return reply . status ( 500 ) . send ( {
179+ error : {
180+ message : error . message ,
181+ type : "internal_server_error" ,
182+ param : null ,
183+ code : "internal_server_error"
184+ }
185+ } ) ;
186+ }
187+ }