Commit 2b54089

feat: add Cerebras model provider support and SDK integration

- Add Cerebras to supported providers in README and config
- Add Cerebras icon and update icon utilities
- Integrate @cerebras/cerebras_cloud_sdk dependency
- Implement Cerebras model fetching and completion (streaming & non-streaming)
- Expose Cerebras in provider APIs and server logic
- Refactor debounce sync utility for dynamic import

1 parent 02cf16a · commit 2b54089

File tree: 11 files changed (+226, -7 lines)

README.md

Lines changed: 3 additions & 0 deletions
@@ -21,6 +21,7 @@ A clean and simple front-end for large-language models.
 - OpenAI
 - Gemini
 - Anthropic
+- Cerebras
 - Themes and fun things
 
 ## Usage
@@ -44,6 +45,7 @@ To use a remote provider api for llm inference, you can set an environmental var
 - `NUXT_OPENAI_API_KEY` for OpenAI
 - `NUXT_GEMINI_API_KEY` for Gemini
 - `NUXT_ANTHROPIC_API_KEY` for Anthropic
+- `NUXT_CEREBRAS_API_KEY` for Cerebras
 
 ##### Example
 
@@ -100,6 +102,7 @@ AUTH_SECRET=
 OPENAI_API_KEY=
 GEMINI_API_KEY=
 ANTHROPIC_API_KEY=
+CEREBRAS_API_KEY=
 ```
 
 4. Run the app

app/assets/icons/cerebras.svg

Lines changed: 1 addition & 0 deletions

app/utils/icon.ts

Lines changed: 1 addition & 0 deletions
@@ -7,6 +7,7 @@ export function getModelProviderIcon(provider?: string) {
     openai: "simple-icons:openai",
     anthropic: "simple-icons:anthropic",
     lmstudio: "local:lmstudio",
+    cerebras: "local:cerebras",
   };
   return modelIcons[provider] || "";
 }
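The helper falls back to an empty string for unregistered providers, so the new entry should resolve as in this minimal sketch (assuming the function above is in scope):

// Minimal usage sketch; behavior follows the diff above.
getModelProviderIcon("cerebras"); // -> "local:cerebras"
getModelProviderIcon("unknown"); // -> "" (no icon registered)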

app/utils/llm/providers.ts

Lines changed: 1 addition & 0 deletions
@@ -10,6 +10,7 @@ export const providers: ProviderMeta[] = [
   { id: "openai", displayName: "OpenAI", icon: "simple-icons:openai" },
   { id: "gemini", displayName: "Gemini", icon: "simple-icons:googlegemini" },
   { id: "anthropic", displayName: "Anthropic", icon: "simple-icons:anthropic" },
+  { id: "cerebras", displayName: "Cerebras", icon: "local:cerebras" },
   {
     id: "lmstudio",
     displayName: "LM Studio",

app/utils/sync/debounce.ts

Lines changed: 18 additions & 7 deletions
@@ -1,13 +1,24 @@
-import { useSyncStore } from "~/stores/sync";
 import { debounce } from "../debounce";
 
 const DEBOUNCE_MS = 500;
 
-const _triggerSync = () => {
-  const sync = useSyncStore();
-  if (!sync.isSyncing) {
-    sync.sync();
+let _debouncedSync: (() => void) | null = null;
+
+export const triggerDebouncedSync = () => {
+  // Lazy initialization to avoid store access during module load
+  if (!_debouncedSync) {
+    const _triggerSync = () => {
+      // Import store only when actually needed using dynamic import
+      import("~/stores/sync").then(({ useSyncStore }) => {
+        const sync = useSyncStore();
+        if (!sync.isSyncing) {
+          sync.sync();
+        }
+      });
+    };
+
+    _debouncedSync = debounce(_triggerSync, DEBOUNCE_MS);
   }
-};
 
-export const triggerDebouncedSync = debounce(_triggerSync, DEBOUNCE_MS);
+  _debouncedSync();
+};

nuxt.config.ts

Lines changed: 1 addition & 0 deletions
@@ -36,6 +36,7 @@ export default defineNuxtConfig({
     openaiApiKey: process.env.OPENAI_API_KEY || "",
     geminiApiKey: process.env.GEMINI_API_KEY || "",
     anthropicApiKey: process.env.ANTHROPIC_API_KEY || "",
+    cerebrasApiKey: process.env.CEREBRAS_API_KEY || "",
     public: {
       debug: false,
       appVersion: "",

package.json

Lines changed: 1 addition & 0 deletions
@@ -20,6 +20,7 @@
   },
   "dependencies": {
     "@anthropic-ai/sdk": "^0.40.1",
+    "@cerebras/cerebras_cloud_sdk": "^1.46.0",
     "@google/genai": "^0.12.0",
     "@lancedb/lancedb": "^0.19.0",
     "@libsql/client": "^0.15.4",

pnpm-lock.yaml

Lines changed: 18 additions & 0 deletions
Generated lockfile; diff not rendered.

server/api/providers/index.get.ts

Lines changed: 6 additions & 0 deletions
@@ -3,6 +3,8 @@ import { auth } from "@/utils/auth";
 import { globalSettings } from "~/utils/db/schema";
 import { and, eq, type InferSelectModel } from "drizzle-orm";
 import type { GlobalSettings } from "~/stores/globalSettings";
+import { getLMStudioClient } from "~~/server/utils/llm/completionLMStudio";
+import { cloudDb } from "~~/server/utils/db/cloud";
 
 export default defineEventHandler(async (event) => {
   logger.debug("GET /api/providers");
@@ -35,6 +37,10 @@ export default defineEventHandler(async (event) => {
   if (config.anthropicApiKey) {
     providers.push("anthropic");
   }
+  // Cerebras
+  if (config.cerebrasApiKey) {
+    providers.push("cerebras");
+  }
   // LM Studio
   const lmStudio = getLMStudioClient();
   const lmStudioVersion = await lmStudio.system.getLMStudioVersion();
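With the new branch, the endpoint lists "cerebras" whenever `cerebrasApiKey` is set in the runtime config. A hypothetical consumer of this endpoint; the string-array response shape is inferred from the `providers.push` calls above, not confirmed elsewhere:

// Hypothetical client-side check against GET /api/providers.
const providers = await $fetch<string[]>("/api/providers");
if (providers.includes("cerebras")) {
  // Offer Cerebras models in the model picker.
}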
Lines changed: 157 additions & 0 deletions
@@ -0,0 +1,157 @@
+import { logger } from "~/utils/logger";
+import Cerebras from "@cerebras/cerebras_cloud_sdk";
+import type { LocalMessage, Usage, Model } from "~/utils/db/local";
+
+// Client generator
+export function getCerebrasClient() {
+  const config = useRuntimeConfig();
+  const apiKey = config.cerebrasApiKey;
+  if (!apiKey) {
+    throw new Error("Missing CEREBRAS_API_KEY");
+  }
+  return new Cerebras({ apiKey });
+}
+
+// Fetch models
+export async function fetchCerebrasModels() {
+  const cerebras = getCerebrasClient();
+
+  try {
+    const modelsList = await cerebras.models.list();
+    const models: Model[] = modelsList.data.map((model) => ({
+      name: model.id,
+      displayName:
+        model.id.charAt(0).toUpperCase() +
+        model.id.slice(1).replace(/[-.]/g, " "),
+      provider: "cerebras",
+    }));
+
+    return models;
+  } catch (error) {
+    logger.error(error, "GET /api/models/cerebras: Error fetching models");
+    throw new Error("Failed to fetch models");
+  }
+}
+
+// Non-streaming completion
+export async function completionCerebras({
+  history,
+  model,
+  systemPrompt,
+}: {
+  history: LocalMessage[];
+  model: string;
+  systemPrompt: string;
+}) {
+  const cerebras = getCerebrasClient();
+
+  try {
+    const formattedMessages = history.map((msg) => ({
+      role: msg.role as "user" | "assistant",
+      content: msg.content,
+    }));
+
+    const params = {
+      messages: [
+        { role: "system" as const, content: systemPrompt },
+        ...formattedMessages,
+      ],
+      model,
+    };
+
+    const completion = await cerebras.chat.completions.create(params);
+    // eslint-disable-next-line @typescript-eslint/no-explicit-any
+    const content = (completion as any).choices[0]?.message?.content;
+    return content;
+  } catch (error) {
+    logger.error(error, "Error getting completion from Cerebras");
+    throw new Error("Internal server error");
+  }
+}
+
+// Streaming completion
+export async function streamCerebras({
+  history,
+  model,
+  systemPrompt,
+}: {
+  history: LocalMessage[];
+  model: string;
+  systemPrompt: string;
+}): Promise<ReadableStream> {
+  const cerebras = getCerebrasClient();
+  const encoder = new TextEncoder();
+
+  const stream = new ReadableStream({
+    async start(controller) {
+      try {
+        const formattedMessages = [
+          { role: "system" as const, content: systemPrompt },
+          ...history.map((msg) => ({
+            role: msg.role as "user" | "assistant",
+            content: msg.content,
+          })),
+        ];
+
+        const queryStartTime = performance.now();
+        let timeToFirstToken = 0;
+        let responseStartTime = 0;
+
+        const completion = await cerebras.chat.completions.create({
+          model: model,
+          messages: formattedMessages,
+          stream: true,
+        });
+
+        // eslint-disable-next-line @typescript-eslint/no-explicit-any
+        let usageChunk: any;
+        for await (const chunk of completion) {
+          if (!timeToFirstToken) {
+            timeToFirstToken = performance.now() - queryStartTime;
+            responseStartTime = performance.now();
+          }
+          // eslint-disable-next-line @typescript-eslint/no-explicit-any
+          const text = (chunk as any).choices[0]?.delta?.content || "";
+          controller.enqueue(
+            encoder.encode(
+              `event: messageChunk\ndata: ${JSON.stringify(text)}\n\n`,
+            ),
+          );
+          // eslint-disable-next-line @typescript-eslint/no-explicit-any
+          if ((chunk as any).usage) {
+            // eslint-disable-next-line @typescript-eslint/no-explicit-any
+            usageChunk = (chunk as any).usage;
+          }
+        }
+
+        if (usageChunk) {
+          const completionTime = performance.now() - responseStartTime;
+          const usage: Usage | Partial<Usage> = {
+            promptTokens: usageChunk.prompt_tokens,
+            completionTokens: usageChunk.completion_tokens,
+            totalTokens: usageChunk.total_tokens,
+            completionTime,
+            tokensPerSecond:
+              (usageChunk.completion_tokens / completionTime) * 1000,
+            timeToFirstToken,
+            temperature: 1,
+          };
+          controller.enqueue(
+            encoder.encode(`event: usage\ndata: ${JSON.stringify(usage)}\n\n`),
+          );
+        }
+      } catch (error) {
+        logger.error(error, "Error streaming Cerebras");
+        controller.enqueue(
+          encoder.encode(
+            `event: error\ndata: Error streaming Cerebras: ${error}\n\n`,
+          ),
+        );
+      } finally {
+        controller.close();
+      }
+    },
+  });
+
+  return stream;
+}
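`streamCerebras` returns a web `ReadableStream` of SSE-formatted bytes (`messageChunk`, `usage`, and `error` events), so a server route can hand it back to the client directly. A hedged sketch of such a route; the path, body fields, and header setup are illustrative assumptions, not part of this commit:

// Hypothetical Nitro handler wiring streamCerebras to an SSE response.
// Route, body shape, and headers are assumptions for illustration only.
export default defineEventHandler(async (event) => {
  const { history, model, systemPrompt } = await readBody(event);
  setHeader(event, "Content-Type", "text/event-stream");
  setHeader(event, "Cache-Control", "no-cache");
  return streamCerebras({ history, model, systemPrompt });
});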
