From e92b41b75bbe6879bc547b8b51888a69e98309ea Mon Sep 17 00:00:00 2001 From: Seb Duerr Date: Sun, 23 Nov 2025 16:57:06 -0800 Subject: [PATCH 1/2] feat: update Cerebras model list --- packages/types/src/providers/cerebras.ts | 30 ------------------------ 1 file changed, 30 deletions(-) diff --git a/packages/types/src/providers/cerebras.ts b/packages/types/src/providers/cerebras.ts index a027d6e8535..2868252fb49 100644 --- a/packages/types/src/providers/cerebras.ts +++ b/packages/types/src/providers/cerebras.ts @@ -15,26 +15,6 @@ export const cerebrasModels = { outputPrice: 0, description: "Highly intelligent general purpose model with up to 1,000 tokens/s", }, - "qwen-3-coder-480b-free": { - maxTokens: 40000, - contextWindow: 64000, - supportsImages: false, - supportsPromptCache: false, - inputPrice: 0, - outputPrice: 0, - description: - "[SOON TO BE DEPRECATED] SOTA coding model with ~2000 tokens/s ($0 free tier)\n\n• Use this if you don't have a Cerebras subscription\n• 64K context window\n• Rate limits: 150K TPM, 1M TPH/TPD, 10 RPM, 100 RPH/RPD\n\nUpgrade for higher limits: [https://cloud.cerebras.ai/?utm=roocode](https://cloud.cerebras.ai/?utm=roocode)", - }, - "qwen-3-coder-480b": { - maxTokens: 40000, - contextWindow: 128000, - supportsImages: false, - supportsPromptCache: false, - inputPrice: 0, - outputPrice: 0, - description: - "[SOON TO BE DEPRECATED] SOTA coding model with ~2000 tokens/s ($50/$250 paid tiers)\n\n• Use this if you have a Cerebras subscription\n• 131K context window with higher rate limits", - }, "qwen-3-235b-a22b-instruct-2507": { maxTokens: 64000, contextWindow: 64000, @@ -62,16 +42,6 @@ export const cerebrasModels = { outputPrice: 0, description: "SOTA coding performance with ~2500 tokens/s", }, - "qwen-3-235b-a22b-thinking-2507": { - maxTokens: 40000, - contextWindow: 65000, - supportsImages: false, - supportsPromptCache: false, - inputPrice: 0, - outputPrice: 0, - description: "SOTA performance with ~1500 tokens/s", - supportsReasoningEffort: true, - }, "gpt-oss-120b": { maxTokens: 8000, contextWindow: 64000, From a88cfe5d157f3585d9ef3c7946975fa1cad63657 Mon Sep 17 00:00:00 2001 From: Roo Code Date: Mon, 24 Nov 2025 01:26:20 +0000 Subject: [PATCH 2/2] refactor: remove dead code for deprecated Cerebras models --- src/api/providers/cerebras.ts | 14 +++----------- 1 file changed, 3 insertions(+), 11 deletions(-) diff --git a/src/api/providers/cerebras.ts b/src/api/providers/cerebras.ts index 16dfa282adb..b9ea00d6f97 100644 --- a/src/api/providers/cerebras.ts +++ b/src/api/providers/cerebras.ts @@ -98,19 +98,11 @@ export class CerebrasHandler extends BaseProvider implements SingleCompletionHan } getModel(): { id: CerebrasModelId; info: (typeof cerebrasModels)[CerebrasModelId] } { - const originalModelId = (this.options.apiModelId as CerebrasModelId) || this.defaultProviderModelId - - // Route both qwen coder models to the same actual model ID for API calls - // This allows them to have different rate limits/descriptions in the UI - // while using the same underlying model - let apiModelId = originalModelId - if (originalModelId === "qwen-3-coder-480b-free") { - apiModelId = "qwen-3-coder-480b" - } + const modelId = (this.options.apiModelId as CerebrasModelId) || this.defaultProviderModelId return { - id: apiModelId, - info: this.providerModels[originalModelId], // Use original model info for rate limits/descriptions + id: modelId, + info: this.providerModels[modelId], } }