Commit 8f64021

break: improving typescript support and refactoring the API
- Improves TypeScript support with dynamic suggestions based on the selected Session type.
- Breaking: LLM models must now be defined inside the `options` argument. This allows stricter TypeScript checking and makes the API easier to extend.
- There is no longer any need to check whether the `inferenceHost` env var is defined, since we can now switch between different LLM providers. Instead, LLM support is enabled when the given type is an allowed provider.
1 parent 3d98ea4 commit 8f64021
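
For illustration, a minimal sketch of the refactored API. The provider name `ollama`, the model `mistral`, and the local endpoint are examples, not part of this commit:

import { Session } from "./ai.ts";

// Hypothetical usage sketch: the provider is selected by the session type,
// and the model is now declared inside `options`.
const session = new Session("ollama", {
  model: "mistral",
  // baseURL is optional; it falls back to the AI_INFERENCE_API_HOST env var.
  baseURL: "http://localhost:11434",
});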

9 files changed: +363 additions, -217 deletions

ext/ai/js/ai.d.ts

Lines changed: 21 additions & 0 deletions
@@ -0,0 +1,21 @@
import { Session } from "./ai.ts";
import { LLMSessionRunInputOptions } from "./llm/llm_session.ts";
import {
  OllamaProviderInput,
  OllamaProviderOptions,
} from "./llm/providers/ollama.ts";
import {
  OpenAIProviderInput,
  OpenAIProviderOptions,
} from "./llm/providers/openai.ts";

export namespace ai {
  export { Session };
  export {
    LLMSessionRunInputOptions as LLMRunOptions,
    OllamaProviderInput as OllamaInput,
    OllamaProviderOptions as OllamaOptions,
    OpenAIProviderInput as OpenAICompatibleInput,
    OpenAIProviderOptions as OpenAICompatibleOptions,
  };
}
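
These aliases expose the provider-specific types under the `ai` namespace. A hedged consumer-side sketch follows; any option fields beyond `model` and `baseURL` are assumptions, since the provider files are not shown in this diff:

// Hypothetical sketch; the option shapes are assumed from ILLMProviderOptions.
const ollamaOpts: ai.OllamaOptions = { model: "mistral" };
const openAIOpts: ai.OpenAICompatibleOptions = {
  model: "gpt-4o-mini", // example model name
  baseURL: "https://api.openai.com/v1",
};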

ext/ai/js/ai.js

Lines changed: 0 additions & 80 deletions
This file was deleted.

ext/ai/js/ai.ts

Lines changed: 141 additions & 0 deletions
@@ -0,0 +1,141 @@
import "./onnxruntime/onnx.js";
import {
  LLMProviderInstance,
  LLMProviderName,
  LLMSession,
  LLMSessionRunInputOptions as LLMInputOptions,
  providers,
} from "./llm/llm_session.ts";

// @ts-ignore deno_core environment
const core = globalThis.Deno.core;

// NOTE:(kallebysantos) do we still need gte-small? Or maybe add another type 'embeddings' with custom model opt.
export type SessionType = LLMProviderName | "gte-small";

export type SessionOptions<T extends SessionType> = T extends LLMProviderName
  ? LLMProviderInstance<T>["options"]
  : never;

export type SessionInput<T extends SessionType> = T extends LLMProviderName
  ? LLMProviderInstance<T>["input"]
  : T extends "gte-small" ? string
  : never;

export type EmbeddingInputOptions = {
  /**
   * Pool embeddings by taking their mean
   */
  mean_pool?: boolean;

  /**
   * Normalize the embeddings result
   */
  normalize?: boolean;
};

export type SessionInputOptions<T extends SessionType> = T extends
  LLMProviderName ? LLMInputOptions
  : EmbeddingInputOptions;

export class Session<T extends SessionType> {
  #model?: string;
  #init?: Promise<void>;

  // TODO:(kallebysantos) get 'provider' type here and use type checking to suggest Inputs when run
  constructor(
    public readonly type: T,
    public readonly options?: SessionOptions<T>,
  ) {
    if (this.isEmbeddingType()) {
      this.#model = "gte-small"; // Default model
      this.#init = core.ops.op_ai_init_model(this.#model);
      return;
    }

    if (this.isLLMType()) {
      if (!Object.keys(providers).includes(type)) {
        throw new TypeError(`invalid type: '${type}'`);
      }

      if (!this.options || !this.options.model) {
        throw new Error(
          `missing required parameter 'model' for type: '${type}'`,
        );
      }

      this.options.baseURL ??= core.ops.op_get_env(
        "AI_INFERENCE_API_HOST",
      ) as string;

      if (!this.options.baseURL) {
        throw new Error(
          `missing required parameter 'baseURL' for type: '${type}'`,
        );
      }
    }
  }

  // /** @param {string | object} prompt Either a String (ollama) or an OpenAI chat completion body object (openaicompatible): https://platform.openai.com/docs/api-reference/chat/create */
  async run(input: SessionInput<T>, options: SessionInputOptions<T>) {
    if (this.isLLMType()) {
      const opts = options as LLMInputOptions;
      const stream = opts.stream ?? false;

      const llmSession = LLMSession.fromProvider(this.type, {
        // safety: We did check `options` during construction
        baseURL: this.options!.baseURL,
        model: this.options!.model,
        ...this.options, // allows custom provider initialization like 'apiKey'
      });

      return await llmSession.run(input, {
        stream,
        signal: opts.signal,
        timeout: opts.timeout,
      });
    }

    if (this.#init) {
      await this.#init;
    }

    const opts = options as EmbeddingInputOptions;

    const mean_pool = opts.mean_pool ?? true;
    const normalize = opts.normalize ?? true;

    const result = await core.ops.op_ai_run_model(
      // @ts-ignore
      this.#model,
      input,
      mean_pool,
      normalize,
    );

    return result;
  }

  private isEmbeddingType(
    this: Session<SessionType>,
  ): this is Session<"gte-small"> {
    return this.type === "gte-small";
  }

  private isLLMType(
    this: Session<SessionType>,
  ): this is Session<LLMProviderName> {
    return this.type !== "gte-small";
  }
}

const MAIN_WORKER_API = {
  tryCleanupUnusedSession: () =>
    /* async */ core.ops.op_ai_try_cleanup_unused_session(),
};

const USER_WORKER_API = {
  Session,
};

export { MAIN_WORKER_API, USER_WORKER_API };
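
A hedged usage sketch of the two session kinds above. The prompt text and model names are examples, and the string input form for `ollama` follows the old doc comment, so it is an assumption:

// Hypothetical usage sketch, not part of this commit.
// Embedding session: defaults to the built-in "gte-small" model.
const embedder = new Session("gte-small");
const embedding = await embedder.run("Hello world", { mean_pool: true, normalize: true });

// LLM session: provider chosen by the type, model declared in `options`.
const llm = new Session("ollama", { model: "mistral" });
const reply = await llm.run("Summarize the release notes", { stream: false, timeout: 60 });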

ext/ai/js/llm/llm_session.ts

Lines changed: 47 additions & 18 deletions
@@ -1,5 +1,5 @@
-import { OllamaLLMSession } from './providers/ollama.ts';
-import { OpenAILLMSession } from './providers/openai.ts';
+import { OllamaLLMSession } from "./providers/ollama.ts";
+import { OpenAILLMSession } from "./providers/openai.ts";

 // @ts-ignore deno_core environment
 const core = globalThis.Deno.core;
@@ -20,30 +20,59 @@ export type LLMRunInput = {
   signal?: AbortSignal;
 };

+export interface ILLMProviderMeta {
+  input: ILLMProviderInput;
+  output: unknown;
+  options: ILLMProviderOptions;
+}
+
 export interface ILLMProviderOptions {
   model: string;
-  inferenceAPIHost: string;
+  baseURL?: string;
 }

-export interface ILLMProviderInput {
-  prompt: string | object;
-  signal: AbortSignal;
-}
+export type ILLMProviderInput<T = string | object> = T extends string ? string
+  : T;

 export interface ILLMProvider {
   // TODO:(kallebysantos) remove 'any'
   // TODO: (kallebysantos) standardised output format
-  getStream(input: ILLMProviderInput): Promise<AsyncIterable<any>>;
-  getText(input: ILLMProviderInput): Promise<any>;
+  getStream(
+    input: ILLMProviderInput,
+    signal: AbortSignal,
+  ): Promise<AsyncIterable<any>>;
+  getText(input: ILLMProviderInput, signal: AbortSignal): Promise<any>;
 }

 export const providers = {
-  'ollama': OllamaLLMSession,
-  'openaicompatible': OpenAILLMSession,
-} satisfies Record<string, new (opts: ILLMProviderOptions) => ILLMProvider>;
+  "ollama": OllamaLLMSession,
+  "openaicompatible": OpenAILLMSession,
+} satisfies Record<
+  string,
+  new (opts: ILLMProviderOptions) => ILLMProvider & ILLMProviderMeta
+>;

 export type LLMProviderName = keyof typeof providers;

+export type LLMProviderClass<T extends LLMProviderName> = (typeof providers)[T];
+export type LLMProviderInstance<T extends LLMProviderName> = InstanceType<
+  LLMProviderClass<T>
+>;
+
+export type LLMSessionRunInputOptions = {
+  /**
+   * Stream response from model. Applies only for LLMs like `mistral` (default: false)
+   */
+  stream?: boolean;
+
+  /**
+   * Automatically abort the request to the model after specified time (in seconds). Applies only for LLMs like `mistral` (default: 60)
+   */
+  timeout?: number;
+
+  signal?: AbortSignal;
+};
+
 export class LLMSession {
   #inner: ILLMProvider;
@@ -53,31 +82,31 @@ export class LLMSession {

   static fromProvider(name: LLMProviderName, opts: ILLMProviderOptions) {
     const ProviderType = providers[name];
-    if (!ProviderType) throw new Error('invalid provider');
+    if (!ProviderType) throw new Error("invalid provider");

     const provider = new ProviderType(opts);

     return new LLMSession(provider);
   }

   run(
-    opts: LLMRunInput,
+    input: ILLMProviderInput,
+    opts: LLMSessionRunInputOptions,
   ): Promise<AsyncIterable<any>> | Promise<any> {
     const isStream = opts.stream ?? false;

-    const timeoutSeconds = typeof opts.timeout === 'number' ? opts.timeout : 60;
+    const timeoutSeconds = typeof opts.timeout === "number" ? opts.timeout : 60;
     const timeoutMs = timeoutSeconds * 1000;

     const timeoutSignal = AbortSignal.timeout(timeoutMs);
     const abortSignals = [opts.signal, timeoutSignal]
       .filter((it) => it instanceof AbortSignal);
     const signal = AbortSignal.any(abortSignals);

-    const llmInput: ILLMProviderInput = { prompt: opts.prompt, signal };
     if (isStream) {
-      return this.#inner.getStream(llmInput);
+      return this.#inner.getStream(input, signal);
     }

-    return this.#inner.getText(llmInput);
+    return this.#inner.getText(input, signal);
   }
 }
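
To show the new `run` signature, where the input is passed separately from the run options and the timeout/abort signals are merged internally, here is a hedged sketch; the model and endpoint are assumptions:

// Hypothetical sketch of the refactored LLMSession API; values are examples only.
const session = LLMSession.fromProvider("ollama", {
  model: "mistral",
  baseURL: "http://localhost:11434", // assumed local Ollama endpoint
});

// input and options are now separate arguments; a 30s timeout is merged with any caller-provided signal.
const output = await session.run("Tell me a short joke", { stream: false, timeout: 30 });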
