Quellcode durchsuchen

feat: add zai-org/GLM-4.5-FP8 model to Chutes AI provider (#6441)

Co-authored-by: Roo Code <[email protected]>
roomote[bot] vor 5 Monaten
Ursprung
Commit
38c6c7a101
2 geänderte Dateien mit 34 neuen und 0 gelöschten Zeilen
  1. packages/types/src/providers/chutes.ts (+11 −0)
  2. src/api/providers/__tests__/chutes.spec.ts (+23 −0)

+ 11 - 0
packages/types/src/providers/chutes.ts

@@ -26,6 +26,7 @@ export type ChutesModelId =
 	| "microsoft/MAI-DS-R1-FP8"
 	| "tngtech/DeepSeek-R1T-Chimera"
 	| "zai-org/GLM-4.5-Air"
+	| "zai-org/GLM-4.5-FP8"
 
 export const chutesDefaultModelId: ChutesModelId = "deepseek-ai/DeepSeek-R1-0528"
 
@@ -247,4 +248,14 @@ export const chutesModels = {
 		description:
 			"GLM-4.5-Air model with 151,329 token context window and 106B total parameters with 12B activated.",
 	},
+	"zai-org/GLM-4.5-FP8": {
+		maxTokens: 32768,
+		contextWindow: 131072,
+		supportsImages: false,
+		supportsPromptCache: false,
+		inputPrice: 0,
+		outputPrice: 0,
+		description:
+			"GLM-4.5-FP8 model with 128k token context window, optimized for agent-based applications with MoE architecture.",
+	},
 } as const satisfies Record<string, ModelInfo>

+ 23 - 0
src/api/providers/__tests__/chutes.spec.ts

@@ -208,6 +208,29 @@ describe("ChutesHandler", () => {
 		)
 	})
 
+	it("should return zai-org/GLM-4.5-FP8 model with correct configuration", () => {
+		const testModelId: ChutesModelId = "zai-org/GLM-4.5-FP8"
+		const handlerWithModel = new ChutesHandler({
+			apiModelId: testModelId,
+			chutesApiKey: "test-chutes-api-key",
+		})
+		const model = handlerWithModel.getModel()
+		expect(model.id).toBe(testModelId)
+		expect(model.info).toEqual(
+			expect.objectContaining({
+				maxTokens: 32768,
+				contextWindow: 131072,
+				supportsImages: false,
+				supportsPromptCache: false,
+				inputPrice: 0,
+				outputPrice: 0,
+				description:
+					"GLM-4.5-FP8 model with 128k token context window, optimized for agent-based applications with MoE architecture.",
+				temperature: 0.5, // Default temperature for non-DeepSeek models
+			}),
+		)
+	})
+
 	it("completePrompt method should return text from Chutes API", async () => {
 		const expectedResponse = "This is a test response from Chutes"
 		mockCreate.mockResolvedValueOnce({ choices: [{ message: { content: expectedResponse } }] })