Skip to content

Commit 2c31cd0

Browse files
committed
Added functions to generate LLM responses and embeddings using the Hugging Face Inference API
1 parent 219317c commit 2c31cd0

File tree

3 files changed

+50
-2
lines changed

3 files changed

+50
-2
lines changed

ai-assistant/.gitignore

Lines changed: 1 addition & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -34,3 +34,4 @@ Temporary Items
3434
scratch/
3535

3636
test.ts
37+
credentials.ts

ai-assistant/src/core/embeddings/minilml6.ts

Lines changed: 26 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -1,4 +1,5 @@
11
import { IHttp } from "@rocket.chat/apps-engine/definition/accessors";
2+
import { HF_TOKEN } from "../../credentials";
23
import { IEmbeddingModel } from "./embeddings.types";
34

45
export class MiniLML6 implements IEmbeddingModel {
@@ -10,7 +11,32 @@ export class MiniLML6 implements IEmbeddingModel {
1011
this.http = http;
1112
}
1213

14+
async fromHuggingFace(text: string): Promise<number[] | null> {
15+
const res = await this.http.post(
16+
`https://api-inference.huggingface.co/pipeline/feature-extraction/sentence-transformers/all-MiniLM-L6-v2`,
17+
{
18+
headers: {
19+
accept: "application/json",
20+
"Content-Type": "application/json",
21+
authorization: "Bearer " + HF_TOKEN,
22+
},
23+
data: {
24+
inputs: [text],
25+
options: {
26+
wait_for_model: true,
27+
},
28+
},
29+
}
30+
);
31+
if (!res || res.statusCode !== 200) return null;
32+
33+
const data = res.data[0] as number[];
34+
return data;
35+
}
36+
1337
async generate(text: string): Promise<number[] | null> {
38+
return await this.fromHuggingFace(text);
39+
1440
const res = await this.http.post(this.baseURL, {
1541
headers: {
1642
accept: "application/json",

ai-assistant/src/core/llm/llama3_70B.ts

Lines changed: 23 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -1,5 +1,6 @@
11
import { IHttp } from "@rocket.chat/apps-engine/definition/accessors";
22

3+
import { HF_TOKEN } from "../../credentials";
34
import { Prompt } from "../prompt/prompt";
45
import { ILLMModel } from "./llm.types";
56

@@ -12,20 +13,40 @@ export class Llama3_70B implements ILLMModel {
1213
this.http = http;
1314
}
1415

16+
async fromHuggingFace(prompt: Prompt): Promise<string | null> {
17+
const url = `https://api-inference.huggingface.co/models/mistralai/Mistral-7B-Instruct-v0.1/v1/chat/completions`;
18+
const res = await this.http.post(url, {
19+
headers: {
20+
"Content-Type": "application/json",
21+
authorization: "Bearer " + HF_TOKEN,
22+
},
23+
data: {
24+
messages: prompt.messages,
25+
model: "mistralai/Mistral-7B-Instruct-v0.1",
26+
stream: false,
27+
},
28+
});
29+
if (!res.content) return null;
30+
31+
const message = JSON.parse(res.content).choices[0].message.content;
32+
return message;
33+
}
34+
1535
/**
 * Answers the prompt by delegating to the Hugging Face inference path.
 *
 * @param prompt - conversation history to send
 * @returns the model's reply text, or null on failure
 */
async ask(prompt: Prompt): Promise<string | null> {
    // The old self-hosted path (POST to `${this.baseURL}/chat/completions`)
    // sat below this return and was unreachable dead code (it also carried a
    // @ts-ignore); it has been removed. Restore from history if the local
    // backend is ever reinstated.
    return await this.fromHuggingFace(prompt);
}

0 commit comments

Comments
 (0)