Add muna.beta.chat.completions.create

olokobayusuf · olokobayusuf · commit 23f374ffd9e4 · 2025-08-11T17:50:07.000-04:00
diff --git a/Changelog.md b/Changelog.md
@@ -1,5 +1,5 @@
 ## 0.0.47
-*INCOMPLETE*
++ Added `muna.beta.chat.completions.create` method to create chat completions mirroring the OpenAI client.
 
 ## 0.0.46
 + Function is now Muna!
diff --git a/package.json b/package.json
@@ -30,6 +30,18 @@
   "main": "build/lib/index.js",
   "typings": "build/types/index.d.ts",
   "unpkg": "build/umd/muna.js",
+  "exports": {
+    ".": {
+      "types": "./build/types/index.d.ts",
+      "import": "./build/lib/index.js",
+      "require": "./build/lib/index.js"
+    },
+    "./beta": {
+      "types": "./build/types/beta/types.d.ts",
+      "import": "./build/lib/beta/types.js",
+      "require": "./build/lib/beta/types.js"
+    }
+  },
   "dependencies": {
     "base64-arraybuffer": "^1.0.2",
     "chalk": "^5.3.0",
diff --git a/src/beta/chat/chat.ts b/src/beta/chat/chat.ts
@@ -0,0 +1,20 @@
+/*
+*   Muna
+*   Copyright © 2025 NatML Inc. All Rights Reserved.
+*/
+
+import type { PredictionService } from "../../services"
+import type { RemotePredictionService } from "../remote"
+import { ChatCompletionsService } from "./completions"
+
+/**
+ * Groups chat functionality; currently exposes only the chat completions service.
+ */
+export class ChatService {
+
+    /**
+     * Create completions.
+     */
+    public readonly completions: ChatCompletionsService;
+
+    /**
+     * Create the chat service.
+     * @param predictions Prediction service handed to the completions service.
+     * @param remotePredictions Remote prediction service handed to the completions service.
+     */
+    public constructor(predictions: PredictionService, remotePredictions: RemotePredictionService) {
+        this.completions = new ChatCompletionsService(predictions, remotePredictions);
+    }
+}
diff --git a/src/beta/chat/completions.ts b/src/beta/chat/completions.ts
@@ -0,0 +1,110 @@
+/*
+*   Muna
+*   Copyright © 2025 NatML Inc. All Rights Reserved.
+*/
+
+import type { CreatePredictionInput, PredictionService } from "../../services"
+import type { Acceleration, Prediction } from "../../types"
+import type { CreateRemotePredictionInput, RemoteAcceleration, RemotePredictionService } from "../remote"
+import type { ChatCompletion, ChatCompletionChunk, ChatCompletionMessage } from "./types"
+
+/**
+ * Request fields shared by streaming and non-streaming chat completion requests.
+ */
+export interface ChatCompletionCreateParamsBase {
+    /**
+     * Messages comprising the conversation so far.
+     */
+    messages: ChatCompletionMessage[];
+    /**
+     * Chat model predictor tag.
+     */
+    model: string;
+    /**
+     * Maximum output tokens.
+     * NOTE(review): how `null` differs from omitting the field is not visible here - confirm with the predictor.
+     */
+    max_tokens?: number | null;
+    /**
+     * Prediction acceleration.
+     * `ChatCompletionsService.create` falls back to `"auto"` when this is omitted.
+     */
+    acceleration?: Acceleration | RemoteAcceleration;
+}
+
+/**
+ * Request parameters for a non-streaming chat completion.
+ * Omitting `stream`, or setting it to `false` or `null`, selects this shape.
+ */
+export interface ChatCompletionCreateParamsNonStreaming extends ChatCompletionCreateParamsBase {
+    /**
+     * Whether to stream responses.
+     */
+    stream?: false | null;
+}
+
+/**
+ * Request parameters for a streaming chat completion; `stream` must be exactly `true`.
+ */
+export interface ChatCompletionCreateParamsStreaming extends ChatCompletionCreateParamsBase {
+    /**
+     * Whether to stream responses.
+     */
+    stream: true;
+}
+
+/**
+ * Any chat completion request: either the non-streaming or the streaming parameter shape.
+ */
+export type ChatCompletionCreateParams = (
+    ChatCompletionCreateParamsNonStreaming |
+    ChatCompletionCreateParamsStreaming
+);
+
+/**
+ * Creates chat completions by running a chat model predictor, either through the
+ * prediction service or, for `remote_*` accelerations, the remote prediction service.
+ */
+export class ChatCompletionsService {
+
+    private readonly predictions: PredictionService;
+    private readonly remotePredictions: RemotePredictionService;
+
+    /**
+     * Create the chat completions service.
+     * @param predictions Service used for non-remote accelerations and for all streaming requests.
+     * @param remotePredictions Service used when the acceleration starts with `remote_`.
+     */
+    public constructor(predictions: PredictionService, remotePredictions: RemotePredictionService) {
+        this.predictions = predictions;
+        this.remotePredictions = remotePredictions;
+    }
+
+    /**
+     * Create a chat completion.
+     *
+     * `model` is used as the predictor tag and `acceleration` defaults to `"auto"`.
+     * Every other field of `body`, including the normalized `stream` flag, is forwarded
+     * as a prediction input.
+     *
+     * @param body Chat completion request.
+     * @returns A promise of the completion, or an async generator of completion chunks
+     * when `body.stream` is `true`.
+     * @throws Error when the prediction reports an error or has no results, or when
+     * streaming is requested with a remote acceleration. For streaming requests these
+     * errors surface when the generator is first iterated, not when `create` is called.
+     */
+    public create(body: ChatCompletionCreateParamsNonStreaming): Promise<ChatCompletion>;
+    public create(body: ChatCompletionCreateParamsStreaming): AsyncGenerator<ChatCompletionChunk>;
+    public create(body: ChatCompletionCreateParamsBase): Promise<ChatCompletion> | AsyncGenerator<ChatCompletionChunk>;
+    public create(body: ChatCompletionCreateParams): Promise<ChatCompletion> | AsyncGenerator<ChatCompletionChunk> {
+        // `inputs` is a fresh rest object, so normalizing `stream` does not mutate the caller's `body`.
+        const { model: tag, acceleration = "auto", ...inputs } = body;
+        inputs.stream = inputs.stream ?? false;
+        const input = { tag, inputs, acceleration };
+        return inputs.stream
+            ? this.createCompletionStreaming(input)
+            : this.createCompletionNonStreaming(input);
+    }
+
+    /**
+     * Run a single prediction and return its first result as a chat completion.
+     */
+    private async createCompletionNonStreaming(input: CreatePredictionInput | CreateRemotePredictionInput): Promise<ChatCompletion> {
+        const prediction = await this.createPrediction(input);
+        return this.parseResponse(prediction) as ChatCompletion;
+    }
+
+    /**
+     * Stream predictions and yield the first result of each as a chat completion chunk.
+     */
+    private async * createCompletionStreaming(input: CreatePredictionInput | CreateRemotePredictionInput): AsyncGenerator<ChatCompletionChunk> {
+        // `streamPrediction` returns an async generator, not a promise, so it is iterated directly.
+        for await (const prediction of this.streamPrediction(input))
+            yield this.parseResponse(prediction) as ChatCompletionChunk;
+    }
+
+    /**
+     * Create a prediction with the service that matches the requested acceleration.
+     */
+    private createPrediction(input: CreatePredictionInput | CreateRemotePredictionInput): Promise<Prediction> {
+        // muna.beta.predictions.remote.create(...)
+        if (this.isRemote(input))
+            return this.remotePredictions.create(input as CreateRemotePredictionInput);
+        // muna.predictions.create(...)
+        return this.predictions.create(input as CreatePredictionInput);
+    }
+
+    /**
+     * Open a prediction stream.
+     * @throws Error when the input requests a remote acceleration.
+     */
+    private streamPrediction(input: CreatePredictionInput | CreateRemotePredictionInput): AsyncGenerator<Prediction> {
+        if (this.isRemote(input))
+            throw new Error("Streaming predictions are not supported with remote acceleration");
+        // muna.predictions.stream(...)
+        return this.predictions.stream(input as CreatePredictionInput);
+    }
+
+    /**
+     * Whether the input requests a remote acceleration, i.e. one whose name starts with `remote_`.
+     * A missing or non-string acceleration is treated as not remote instead of throwing.
+     */
+    private isRemote(input: CreatePredictionInput | CreateRemotePredictionInput): boolean {
+        const { acceleration } = input;
+        return typeof acceleration === "string" && acceleration.startsWith("remote_");
+    }
+
+    /**
+     * Extract the completion payload (the first prediction result) from a prediction.
+     * @throws Error when the prediction carries an error or has no results.
+     */
+    private parseResponse(prediction: Prediction): ChatCompletion | ChatCompletionChunk {
+        if (prediction.error)
+            throw new Error(prediction.error);
+        // Guard against missing or empty results so callers never receive `undefined` typed as a completion.
+        const result = prediction.results?.[0];
+        if (result == null)
+            throw new Error("Prediction returned no results");
+        return result as ChatCompletion | ChatCompletionChunk;
+    }
+}
diff --git a/src/beta/chat/index.ts b/src/beta/chat/index.ts
@@ -0,0 +1,6 @@
+/*
+*   Muna
+*   Copyright © 2025 NatML Inc. All Rights Reserved.
+*/
+
+export { ChatService } from "./chat"
diff --git a/src/beta/chat/types.ts b/src/beta/chat/types.ts
@@ -0,0 +1,156 @@
+/*
+*   Muna
+*   Copyright © 2025 NatML Inc. All Rights Reserved.
+*/
+
+/**
+ * A complete chat completion, as returned for non-streaming requests.
+ */
+export interface ChatCompletion {
+    /**
+     * The object type, which is always `chat.completion`.
+     */
+    object: "chat.completion";
+    /**
+     * A unique identifier for the chat completion.
+     */
+    id: string;
+    /**
+     * The model used for the chat completion.
+     */
+    model: string;
+    /**
+     * A list of chat completion choices. Can be more than one if `n` is greater
+     * than 1.
+     */
+    choices: Array<ChatCompletion.Choice>;
+    /**
+     * The Unix timestamp (in seconds) of when the chat completion was created.
+     */
+    created: number;
+    /**
+     * Usage statistics for the completion request.
+     */
+    usage?: CompletionUsage;
+}
+
+/**
+ * One chunk of a streamed chat completion, as yielded for streaming requests.
+ */
+export interface ChatCompletionChunk {
+    /**
+     * The object type, which is always `chat.completion.chunk`.
+     */
+    object: "chat.completion.chunk";
+    /**
+     * A unique identifier for the chat completion. Each chunk has the same ID.
+     */
+    id: string;
+    /**
+     * The model to generate the completion.
+     */
+    model: string;
+    /**
+     * A list of chat completion choices. Can contain more than one element if `n` is
+     * greater than 1. Can also be empty for the last chunk if you set
+     * `stream_options: {"include_usage": true}`.
+     */
+    choices: Array<ChatCompletionChunk.Choice>;
+    /**
+     * The Unix timestamp (in seconds) of when the chat completion was created. Each
+     * chunk has the same timestamp.
+     */
+    created: number;
+    /**
+     * Usage statistics for the completion request.
+     */
+    usage?: CompletionUsage;    
+}
+
+/**
+ * Types nested under `ChatCompletion`.
+ */
+export namespace ChatCompletion {
+
+    /**
+     * A single choice in a non-streaming chat completion.
+     */
+    export interface Choice {
+        /**
+         * The index of the choice in the list of choices.
+         */
+        index: number;
+        /**
+         * A chat completion message generated by the model.
+         */
+        message: ChatCompletionMessage;
+        /**
+         * The reason the model stopped generating tokens. This will be `stop` if the model
+         * hit a natural stop point or a provided stop sequence, `length` if the maximum
+         * number of tokens specified in the request was reached, `content_filter` if
+         * content was omitted due to a flag from our content filters, `tool_calls` if the
+         * model called a tool, or `function_call` (deprecated) if the model called a
+         * function.
+         */
+        finish_reason: "stop" | "length" | "tool_calls" | "content_filter" | "function_call";
+        /**
+         * Log probability information for the choice.
+         */
+        logprobs?: null;
+    }
+}
+
+/**
+ * Types nested under `ChatCompletionChunk`.
+ */
+export namespace ChatCompletionChunk {
+
+    /**
+     * A single choice in a streamed chat completion chunk.
+     */
+    export interface Choice {
+        /**
+         * The index of the choice in the list of choices.
+         */
+        index: number;
+        /**
+         * A chat completion delta generated by streamed model responses.
+         */
+        delta: Choice.Delta;
+        /**
+         * The reason the model stopped generating tokens. This will be `stop` if the model
+         * hit a natural stop point or a provided stop sequence, `length` if the maximum
+         * number of tokens specified in the request was reached, `content_filter` if
+         * content was omitted due to a flag from our content filters, `tool_calls` if the
+         * model called a tool, or `function_call` (deprecated) if the model called a
+         * function.
+         * NOTE(review): presumably `null` on chunks emitted before generation stops - confirm.
+         */
+        finish_reason: "stop" | "length" | "tool_calls" | "content_filter" | "function_call" | null;
+        /**
+         * Log probability information for the choice.
+         */
+        logprobs?: null;
+    }
+
+    /**
+     * Types nested under `ChatCompletionChunk.Choice`.
+     */
+    export namespace Choice {
+
+        /**
+         * Incremental message content carried by a streamed choice; both fields are optional.
+         */
+        export interface Delta {
+            /**
+             * The role of the author of this message.
+             */
+            role?: "developer" | "system" | "user" | "assistant" | "tool";
+            /**
+             * The contents of the chunk message.
+             */
+            content?: string | null;
+        }
+    }
+}
+
+/**
+ * A chat message, used both for request messages and for the message of a completion choice.
+ */
+export interface ChatCompletionMessage {
+    /**
+     * The role of the author of this message.
+     */
+    role: "assistant" | "user" | "system";
+    /**
+     * The contents of the message.
+     */
+    content: string | null;
+}
+
+/**
+ * Token usage statistics attached to a chat completion or chat completion chunk.
+ */
+export interface CompletionUsage {
+    /**
+     * Number of tokens in the generated completion.
+     */
+    completion_tokens: number;
+    /**
+     * Number of tokens in the prompt.
+     */
+    prompt_tokens: number;
+    /**
+     * Total number of tokens used in the request (prompt + completion).
+     */
+    total_tokens: number;
+}
diff --git a/src/beta/client.ts b/src/beta/client.ts
@@ -4,6 +4,8 @@
 */
 
 import type { MunaClient } from "../client"
+import type { PredictionService as EdgePredictionService } from "../services"
+import { ChatService } from "./chat"
 import { PredictionService } from "./remote"
 
 /**
@@ -16,7 +18,13 @@ export class BetaClient {
      */
     public readonly predictions: PredictionService;
 
-    public constructor(client: MunaClient) {
+    /**
+     * Make chat conversations.
+     */
+    public readonly chat: ChatService;
+
+    public constructor(client: MunaClient, predictions: EdgePredictionService) {
         this.predictions = new PredictionService(client);
+        this.chat = new ChatService(predictions, this.predictions.remote);
     }
 }
diff --git a/src/beta/remote/prediction.ts b/src/beta/remote/prediction.ts
@@ -3,8 +3,8 @@
 *   Copyright © 2025 NatML Inc. All Rights Reserved.
 */
 
-import { RemotePredictionService } from "./remote"
 import type { MunaClient } from "../../client"
+import { RemotePredictionService } from "./remote"
 
 export class PredictionService {
 
diff --git a/src/beta/types.ts b/src/beta/types.ts
@@ -0,0 +1,7 @@
+/*
+*   Muna
+*   Copyright © 2025 NatML Inc. All Rights Reserved.
+*/
+
+export type { CreateRemotePredictionInput, RemoteAcceleration } from "./remote"
+export * from "./chat/types"
diff --git a/src/index.ts b/src/index.ts
@@ -3,7 +3,6 @@
 *   Copyright © 2025 NatML Inc. All Rights Reserved.
 */
 
-export type { CreateRemotePredictionInput, RemoteAcceleration } from "./beta"
 export type { MunaAPIError } from "./client"
 export * from "./muna"
 export * from "./types"
diff --git a/src/muna.ts b/src/muna.ts
@@ -58,6 +58,6 @@ export class Muna {
         this.users = new UserService(this.client);
         this.predictors = new PredictorService(this.client);
         this.predictions = new PredictionService(this.client);
-        this.beta = new BetaClient(this.client);
+        this.beta = new BetaClient(this.client, this.predictions);
     }
 }
diff --git a/test/chat.ts b/test/chat.ts

@@ -0,0 +1,6 @@
+/*
+*   Muna
+*   Copyright © 2025 NatML Inc. All Rights Reserved.
+*/
+
+export { ChatService } from "./chat"