Skip to content

Commit 3bfc711

Browse files
authored
Merge pull request #3437 from Kilo-Org/christiaan/cerebras
Add zai-glm-4.6 model to Cerebras and set gpt-oss-120b as default
2 parents 3093b8e + 829f052 commit 3bfc711

File tree

3 files changed

18 additions and 4 deletions

.changeset/puny-coins-unite.md

Lines changed: 5 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,5 @@
1+
---
2+
"kilo-code": patch
3+
---
4+
5+
Add zai-glm-4.6 model to Cerebras and set gpt-oss-120b as default (thanks Roo)

packages/types/src/providers/cerebras.ts

Lines changed: 12 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -3,9 +3,18 @@ import type { ModelInfo } from "../model.js"
33
// https://inference-docs.cerebras.ai/api-reference/chat-completions
44
export type CerebrasModelId = keyof typeof cerebrasModels
55

6-
export const cerebrasDefaultModelId: CerebrasModelId = "qwen-3-coder-480b-free"
6+
export const cerebrasDefaultModelId: CerebrasModelId = "gpt-oss-120b"
77

88
export const cerebrasModels = {
9+
"zai-glm-4.6": {
10+
maxTokens: 16_384,
11+
contextWindow: 128000,
12+
supportsImages: false,
13+
supportsPromptCache: false,
14+
inputPrice: 0,
15+
outputPrice: 0,
16+
description: "Highly intelligent general-purpose model with ~2000 tokens/s",
17+
},
918
"qwen-3-coder-480b-free": {
1019
maxTokens: 40000,
1120
contextWindow: 64000,
@@ -14,7 +23,7 @@ export const cerebrasModels = {
1423
inputPrice: 0,
1524
outputPrice: 0,
1625
description:
17-
"SOTA coding model with ~2000 tokens/s ($0 free tier)\n\n• Use this if you don't have a Cerebras subscription\n• 64K context window\n• Rate limits: 150K TPM, 1M TPH/TPD, 10 RPM, 100 RPH/RPD\n\nUpgrade for higher limits: [https://cloud.cerebras.ai/?utm=roocode](https://cloud.cerebras.ai/?utm=roocode)",
26+
"[SOON TO BE DEPRECATED] SOTA coding model with ~2000 tokens/s ($0 free tier)\n\n• Use this if you don't have a Cerebras subscription\n• 64K context window\n• Rate limits: 150K TPM, 1M TPH/TPD, 10 RPM, 100 RPH/RPD\n\nUpgrade for higher limits: [https://cloud.cerebras.ai/?utm=roocode](https://cloud.cerebras.ai/?utm=roocode)",
1827
},
1928
"qwen-3-coder-480b": {
2029
maxTokens: 40000,
@@ -24,7 +33,7 @@ export const cerebrasModels = {
2433
inputPrice: 0,
2534
outputPrice: 0,
2635
description:
27-
"SOTA coding model with ~2000 tokens/s ($50/$250 paid tiers)\n\n• Use this if you have a Cerebras subscription\n• 131K context window with higher rate limits",
36+
"[SOON TO BE DEPRECATED] SOTA coding model with ~2000 tokens/s ($50/$250 paid tiers)\n\n• Use this if you have a Cerebras subscription\n• 131K context window with higher rate limits",
2837
},
2938
"qwen-3-235b-a22b-instruct-2507": {
3039
maxTokens: 64000,

src/api/providers/__tests__/cerebras.spec.ts

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -56,7 +56,7 @@ describe("CerebrasHandler", () => {
5656
it("should fallback to default model when apiModelId is not provided", () => {
5757
const handlerWithoutModel = new CerebrasHandler({ cerebrasApiKey: "test" })
5858
const { id } = handlerWithoutModel.getModel()
59-
expect(id).toBe("qwen-3-coder-480b") // cerebrasDefaultModelId (routed)
59+
expect(id).toBe("gpt-oss-120b") // cerebrasDefaultModelId
6060
})
6161
})
6262

0 commit comments

Comments
 (0)