Skip to content

Commit becdb1a

Browse files
feat: update Cerebras models (#9527)
Co-authored-by: Roo Code <[email protected]>
1 parent b531075 commit becdb1a

File tree

2 files changed

+3
-41
lines changed

2 files changed

+3
-41
lines changed

packages/types/src/providers/cerebras.ts

Lines changed: 0 additions & 30 deletions
Original file line number | Diff line number | Diff line change
@@ -15,26 +15,6 @@ export const cerebrasModels = {
1515
outputPrice: 0,
1616
description: "Highly intelligent general purpose model with up to 1,000 tokens/s",
1717
},
18-
"qwen-3-coder-480b-free": {
19-
maxTokens: 40000,
20-
contextWindow: 64000,
21-
supportsImages: false,
22-
supportsPromptCache: false,
23-
inputPrice: 0,
24-
outputPrice: 0,
25-
description:
26-
"[SOON TO BE DEPRECATED] SOTA coding model with ~2000 tokens/s ($0 free tier)\n\n• Use this if you don't have a Cerebras subscription\n• 64K context window\n• Rate limits: 150K TPM, 1M TPH/TPD, 10 RPM, 100 RPH/RPD\n\nUpgrade for higher limits: [https://cloud.cerebras.ai/?utm=roocode](https://cloud.cerebras.ai/?utm=roocode)",
27-
},
28-
"qwen-3-coder-480b": {
29-
maxTokens: 40000,
30-
contextWindow: 128000,
31-
supportsImages: false,
32-
supportsPromptCache: false,
33-
inputPrice: 0,
34-
outputPrice: 0,
35-
description:
36-
"[SOON TO BE DEPRECATED] SOTA coding model with ~2000 tokens/s ($50/$250 paid tiers)\n\n• Use this if you have a Cerebras subscription\n• 131K context window with higher rate limits",
37-
},
3818
"qwen-3-235b-a22b-instruct-2507": {
3919
maxTokens: 64000,
4020
contextWindow: 64000,
@@ -62,16 +42,6 @@ export const cerebrasModels = {
6242
outputPrice: 0,
6343
description: "SOTA coding performance with ~2500 tokens/s",
6444
},
65-
"qwen-3-235b-a22b-thinking-2507": {
66-
maxTokens: 40000,
67-
contextWindow: 65000,
68-
supportsImages: false,
69-
supportsPromptCache: false,
70-
inputPrice: 0,
71-
outputPrice: 0,
72-
description: "SOTA performance with ~1500 tokens/s",
73-
supportsReasoningEffort: true,
74-
},
7545
"gpt-oss-120b": {
7646
maxTokens: 8000,
7747
contextWindow: 64000,

src/api/providers/cerebras.ts

Lines changed: 3 additions & 11 deletions
Original file line number | Diff line number | Diff line change
@@ -98,19 +98,11 @@ export class CerebrasHandler extends BaseProvider implements SingleCompletionHan
9898
}
9999

100100
getModel(): { id: CerebrasModelId; info: (typeof cerebrasModels)[CerebrasModelId] } {
101-
const originalModelId = (this.options.apiModelId as CerebrasModelId) || this.defaultProviderModelId
102-
103-
// Route both qwen coder models to the same actual model ID for API calls
104-
// This allows them to have different rate limits/descriptions in the UI
105-
// while using the same underlying model
106-
let apiModelId = originalModelId
107-
if (originalModelId === "qwen-3-coder-480b-free") {
108-
apiModelId = "qwen-3-coder-480b"
109-
}
101+
const modelId = (this.options.apiModelId as CerebrasModelId) || this.defaultProviderModelId
110102

111103
return {
112-
id: apiModelId,
113-
info: this.providerModels[originalModelId], // Use original model info for rate limits/descriptions
104+
id: modelId,
105+
info: this.providerModels[modelId],
114106
}
115107
}
116108

0 commit comments

Comments
 (0)