|
|
@@ -15,7 +15,19 @@ export const cerebrasModels = {
|
|
|
defaultToolProtocol: "native",
|
|
|
inputPrice: 0,
|
|
|
outputPrice: 0,
|
|
|
- description: "Highly intelligent general purpose model with up to 1,000 tokens/s",
|
|
|
+ description: "Fast general-purpose model on Cerebras (up to 1,000 tokens/s). To be deprecated soon.",
|
|
|
+ },
|
|
|
+ "zai-glm-4.7": {
|
|
|
+ maxTokens: 16384, // Conservative default to avoid premature rate limiting (Cerebras reserves quota upfront)
|
|
|
+ contextWindow: 131072,
|
|
|
+ supportsImages: false,
|
|
|
+ supportsPromptCache: false,
|
|
|
+ supportsNativeTools: true,
|
|
|
+ defaultToolProtocol: "native",
|
|
|
+ inputPrice: 0,
|
|
|
+ outputPrice: 0,
|
|
|
+ description:
|
|
|
+ "Highly capable general-purpose model on Cerebras (up to 1,000 tokens/s), competitive with leading proprietary models on coding tasks.",
|
|
|
},
|
|
|
"qwen-3-235b-a22b-instruct-2507": {
|
|
|
maxTokens: 16384, // Conservative default to avoid premature rate limiting
|