1+ /**
2+ * CentML provider implementation for serverless inference.
3+ * This provider supports chat completions and text generation through CentML's serverless endpoints.
4+ */
5+ import type { ChatCompletionOutput , TextGenerationOutput } from "@huggingface/tasks" ;
6+ import { InferenceOutputError } from "../lib/InferenceOutputError" ;
7+ import type { BodyParams } from "../types" ;
8+ import { BaseConversationalTask , BaseTextGenerationTask } from "./providerHelper" ;
9+
/** Base URL for CentML's serverless inference API; route paths are appended by the task helpers. */
const CENTML_API_BASE_URL = "https://api.centml.ai";
11+
12+ export class CentMLConversationalTask extends BaseConversationalTask {
13+ constructor ( ) {
14+ super ( "centml" , CENTML_API_BASE_URL ) ;
15+ }
16+
17+ override preparePayload ( params : BodyParams ) : Record < string , unknown > {
18+ const { args, model } = params ;
19+ return {
20+ ...args ,
21+ model,
22+ api_key : args . accessToken , // Use the accessToken from args
23+ } ;
24+ }
25+
26+ override async getResponse ( response : ChatCompletionOutput ) : Promise < ChatCompletionOutput > {
27+ if (
28+ typeof response === "object" &&
29+ Array . isArray ( response ?. choices ) &&
30+ typeof response ?. created === "number" &&
31+ typeof response ?. id === "string" &&
32+ typeof response ?. model === "string" &&
33+ typeof response ?. usage === "object"
34+ ) {
35+ return response ;
36+ }
37+
38+ throw new InferenceOutputError ( "Expected ChatCompletionOutput" ) ;
39+ }
40+ }
41+
42+ export class CentMLTextGenerationTask extends BaseTextGenerationTask {
43+ constructor ( ) {
44+ super ( "centml" , CENTML_API_BASE_URL ) ;
45+ }
46+
47+ override preparePayload ( params : BodyParams ) : Record < string , unknown > {
48+ const { args, model } = params ;
49+ return {
50+ ...args ,
51+ model,
52+ api_key : args . accessToken , // Use the accessToken from args
53+ } ;
54+ }
55+
56+ override async getResponse ( response : TextGenerationOutput ) : Promise < TextGenerationOutput > {
57+ if (
58+ typeof response === "object" &&
59+ typeof response ?. generated_text === "string"
60+ ) {
61+ return response ;
62+ }
63+
64+ throw new InferenceOutputError ( "Expected TextGenerationOutput" ) ;
65+ }
66+ }