|
@@ -12,7 +12,7 @@ export type InternationalZAiModelId = keyof typeof internationalZAiModels
|
|
|
export const internationalZAiDefaultModelId: InternationalZAiModelId = "glm-4.6"
|
|
export const internationalZAiDefaultModelId: InternationalZAiModelId = "glm-4.6"
|
|
|
export const internationalZAiModels = {
|
|
export const internationalZAiModels = {
|
|
|
"glm-4.5": {
|
|
"glm-4.5": {
|
|
|
- maxTokens: 98_304,
|
|
|
|
|
|
|
+ maxTokens: 16_384,
|
|
|
contextWindow: 131_072,
|
|
contextWindow: 131_072,
|
|
|
supportsImages: false,
|
|
supportsImages: false,
|
|
|
supportsPromptCache: true,
|
|
supportsPromptCache: true,
|
|
@@ -26,7 +26,7 @@ export const internationalZAiModels = {
|
|
|
"GLM-4.5 is Zhipu's latest featured model. Its comprehensive capabilities in reasoning, coding, and agent reach the state-of-the-art (SOTA) level among open-source models, with a context length of up to 128k.",
|
|
"GLM-4.5 is Zhipu's latest featured model. Its comprehensive capabilities in reasoning, coding, and agent reach the state-of-the-art (SOTA) level among open-source models, with a context length of up to 128k.",
|
|
|
},
|
|
},
|
|
|
"glm-4.5-air": {
|
|
"glm-4.5-air": {
|
|
|
- maxTokens: 98_304,
|
|
|
|
|
|
|
+ maxTokens: 16_384,
|
|
|
contextWindow: 131_072,
|
|
contextWindow: 131_072,
|
|
|
supportsImages: false,
|
|
supportsImages: false,
|
|
|
supportsPromptCache: true,
|
|
supportsPromptCache: true,
|
|
@@ -40,7 +40,7 @@ export const internationalZAiModels = {
|
|
|
"GLM-4.5-Air is the lightweight version of GLM-4.5. It balances performance and cost-effectiveness, and can flexibly switch to hybrid thinking models.",
|
|
"GLM-4.5-Air is the lightweight version of GLM-4.5. It balances performance and cost-effectiveness, and can flexibly switch to hybrid thinking models.",
|
|
|
},
|
|
},
|
|
|
"glm-4.5-x": {
|
|
"glm-4.5-x": {
|
|
|
- maxTokens: 98_304,
|
|
|
|
|
|
|
+ maxTokens: 16_384,
|
|
|
contextWindow: 131_072,
|
|
contextWindow: 131_072,
|
|
|
supportsImages: false,
|
|
supportsImages: false,
|
|
|
supportsPromptCache: true,
|
|
supportsPromptCache: true,
|
|
@@ -54,7 +54,7 @@ export const internationalZAiModels = {
|
|
|
"GLM-4.5-X is a high-performance variant optimized for strong reasoning with ultra-fast responses.",
|
|
"GLM-4.5-X is a high-performance variant optimized for strong reasoning with ultra-fast responses.",
|
|
|
},
|
|
},
|
|
|
"glm-4.5-airx": {
|
|
"glm-4.5-airx": {
|
|
|
- maxTokens: 98_304,
|
|
|
|
|
|
|
+ maxTokens: 16_384,
|
|
|
contextWindow: 131_072,
|
|
contextWindow: 131_072,
|
|
|
supportsImages: false,
|
|
supportsImages: false,
|
|
|
supportsPromptCache: true,
|
|
supportsPromptCache: true,
|
|
@@ -67,7 +67,7 @@ export const internationalZAiModels = {
|
|
|
description: "GLM-4.5-AirX is a lightweight, ultra-fast variant delivering strong performance with lower cost.",
|
|
description: "GLM-4.5-AirX is a lightweight, ultra-fast variant delivering strong performance with lower cost.",
|
|
|
},
|
|
},
|
|
|
"glm-4.5-flash": {
|
|
"glm-4.5-flash": {
|
|
|
- maxTokens: 98_304,
|
|
|
|
|
|
|
+ maxTokens: 16_384,
|
|
|
contextWindow: 131_072,
|
|
contextWindow: 131_072,
|
|
|
supportsImages: false,
|
|
supportsImages: false,
|
|
|
supportsPromptCache: true,
|
|
supportsPromptCache: true,
|
|
@@ -94,7 +94,7 @@ export const internationalZAiModels = {
|
|
|
"GLM-4.5V is Z.AI's multimodal visual reasoning model (image/video/text/file input), optimized for GUI tasks, grounding, and document/video understanding.",
|
|
"GLM-4.5V is Z.AI's multimodal visual reasoning model (image/video/text/file input), optimized for GUI tasks, grounding, and document/video understanding.",
|
|
|
},
|
|
},
|
|
|
"glm-4.6": {
|
|
"glm-4.6": {
|
|
|
- maxTokens: 98_304,
|
|
|
|
|
|
|
+ maxTokens: 16_384,
|
|
|
contextWindow: 200_000,
|
|
contextWindow: 200_000,
|
|
|
supportsImages: false,
|
|
supportsImages: false,
|
|
|
supportsPromptCache: true,
|
|
supportsPromptCache: true,
|
|
@@ -107,8 +107,25 @@ export const internationalZAiModels = {
|
|
|
description:
|
|
description:
|
|
|
"GLM-4.6 is Zhipu's newest model with an extended context window of up to 200k tokens, providing enhanced capabilities for processing longer documents and conversations.",
|
|
"GLM-4.6 is Zhipu's newest model with an extended context window of up to 200k tokens, providing enhanced capabilities for processing longer documents and conversations.",
|
|
|
},
|
|
},
|
|
|
|
|
+ "glm-4.7": {
|
|
|
|
|
+ maxTokens: 16_384,
|
|
|
|
|
+ contextWindow: 200_000,
|
|
|
|
|
+ supportsImages: false,
|
|
|
|
|
+ supportsPromptCache: true,
|
|
|
|
|
+ supportsNativeTools: true,
|
|
|
|
|
+ defaultToolProtocol: "native",
|
|
|
|
|
+ supportsReasoningEffort: ["disable", "medium"],
|
|
|
|
|
+ reasoningEffort: "medium",
|
|
|
|
|
+ preserveReasoning: true,
|
|
|
|
|
+ inputPrice: 0.6,
|
|
|
|
|
+ outputPrice: 2.2,
|
|
|
|
|
+ cacheWritesPrice: 0,
|
|
|
|
|
+ cacheReadsPrice: 0.11,
|
|
|
|
|
+ description:
|
|
|
|
|
+ "GLM-4.7 is Zhipu's latest model with built-in thinking capabilities enabled by default. It provides enhanced reasoning for complex tasks while maintaining fast response times.",
|
|
|
|
|
+ },
|
|
|
"glm-4-32b-0414-128k": {
|
|
"glm-4-32b-0414-128k": {
|
|
|
- maxTokens: 98_304,
|
|
|
|
|
|
|
+ maxTokens: 16_384,
|
|
|
contextWindow: 131_072,
|
|
contextWindow: 131_072,
|
|
|
supportsImages: false,
|
|
supportsImages: false,
|
|
|
supportsPromptCache: false,
|
|
supportsPromptCache: false,
|
|
@@ -126,7 +143,7 @@ export type MainlandZAiModelId = keyof typeof mainlandZAiModels
|
|
|
export const mainlandZAiDefaultModelId: MainlandZAiModelId = "glm-4.6"
|
|
export const mainlandZAiDefaultModelId: MainlandZAiModelId = "glm-4.6"
|
|
|
export const mainlandZAiModels = {
|
|
export const mainlandZAiModels = {
|
|
|
"glm-4.5": {
|
|
"glm-4.5": {
|
|
|
- maxTokens: 98_304,
|
|
|
|
|
|
|
+ maxTokens: 16_384,
|
|
|
contextWindow: 131_072,
|
|
contextWindow: 131_072,
|
|
|
supportsImages: false,
|
|
supportsImages: false,
|
|
|
supportsPromptCache: true,
|
|
supportsPromptCache: true,
|
|
@@ -140,7 +157,7 @@ export const mainlandZAiModels = {
|
|
|
"GLM-4.5 is Zhipu's latest featured model. Its comprehensive capabilities in reasoning, coding, and agent reach the state-of-the-art (SOTA) level among open-source models, with a context length of up to 128k.",
|
|
"GLM-4.5 is Zhipu's latest featured model. Its comprehensive capabilities in reasoning, coding, and agent reach the state-of-the-art (SOTA) level among open-source models, with a context length of up to 128k.",
|
|
|
},
|
|
},
|
|
|
"glm-4.5-air": {
|
|
"glm-4.5-air": {
|
|
|
- maxTokens: 98_304,
|
|
|
|
|
|
|
+ maxTokens: 16_384,
|
|
|
contextWindow: 131_072,
|
|
contextWindow: 131_072,
|
|
|
supportsImages: false,
|
|
supportsImages: false,
|
|
|
supportsPromptCache: true,
|
|
supportsPromptCache: true,
|
|
@@ -154,7 +171,7 @@ export const mainlandZAiModels = {
|
|
|
"GLM-4.5-Air is the lightweight version of GLM-4.5. It balances performance and cost-effectiveness, and can flexibly switch to hybrid thinking models.",
|
|
"GLM-4.5-Air is the lightweight version of GLM-4.5. It balances performance and cost-effectiveness, and can flexibly switch to hybrid thinking models.",
|
|
|
},
|
|
},
|
|
|
"glm-4.5-x": {
|
|
"glm-4.5-x": {
|
|
|
- maxTokens: 98_304,
|
|
|
|
|
|
|
+ maxTokens: 16_384,
|
|
|
contextWindow: 131_072,
|
|
contextWindow: 131_072,
|
|
|
supportsImages: false,
|
|
supportsImages: false,
|
|
|
supportsPromptCache: true,
|
|
supportsPromptCache: true,
|
|
@@ -168,7 +185,7 @@ export const mainlandZAiModels = {
|
|
|
"GLM-4.5-X is a high-performance variant optimized for strong reasoning with ultra-fast responses.",
|
|
"GLM-4.5-X is a high-performance variant optimized for strong reasoning with ultra-fast responses.",
|
|
|
},
|
|
},
|
|
|
"glm-4.5-airx": {
|
|
"glm-4.5-airx": {
|
|
|
- maxTokens: 98_304,
|
|
|
|
|
|
|
+ maxTokens: 16_384,
|
|
|
contextWindow: 131_072,
|
|
contextWindow: 131_072,
|
|
|
supportsImages: false,
|
|
supportsImages: false,
|
|
|
supportsPromptCache: true,
|
|
supportsPromptCache: true,
|
|
@@ -181,7 +198,7 @@ export const mainlandZAiModels = {
|
|
|
description: "GLM-4.5-AirX is a lightweight, ultra-fast variant delivering strong performance with lower cost.",
|
|
description: "GLM-4.5-AirX is a lightweight, ultra-fast variant delivering strong performance with lower cost.",
|
|
|
},
|
|
},
|
|
|
"glm-4.5-flash": {
|
|
"glm-4.5-flash": {
|
|
|
- maxTokens: 98_304,
|
|
|
|
|
|
|
+ maxTokens: 16_384,
|
|
|
contextWindow: 131_072,
|
|
contextWindow: 131_072,
|
|
|
supportsImages: false,
|
|
supportsImages: false,
|
|
|
supportsPromptCache: true,
|
|
supportsPromptCache: true,
|
|
@@ -208,7 +225,7 @@ export const mainlandZAiModels = {
|
|
|
"GLM-4.5V is Z.AI's multimodal visual reasoning model (image/video/text/file input), optimized for GUI tasks, grounding, and document/video understanding.",
|
|
"GLM-4.5V is Z.AI's multimodal visual reasoning model (image/video/text/file input), optimized for GUI tasks, grounding, and document/video understanding.",
|
|
|
},
|
|
},
|
|
|
"glm-4.6": {
|
|
"glm-4.6": {
|
|
|
- maxTokens: 98_304,
|
|
|
|
|
|
|
+ maxTokens: 16_384,
|
|
|
contextWindow: 204_800,
|
|
contextWindow: 204_800,
|
|
|
supportsImages: false,
|
|
supportsImages: false,
|
|
|
supportsPromptCache: true,
|
|
supportsPromptCache: true,
|
|
@@ -221,6 +238,23 @@ export const mainlandZAiModels = {
|
|
|
description:
|
|
description:
|
|
|
"GLM-4.6 is Zhipu's newest model with an extended context window of up to 200k tokens, providing enhanced capabilities for processing longer documents and conversations.",
|
|
"GLM-4.6 is Zhipu's newest model with an extended context window of up to 200k tokens, providing enhanced capabilities for processing longer documents and conversations.",
|
|
|
},
|
|
},
|
|
|
|
|
+ "glm-4.7": {
|
|
|
|
|
+ maxTokens: 16_384,
|
|
|
|
|
+ contextWindow: 204_800,
|
|
|
|
|
+ supportsImages: false,
|
|
|
|
|
+ supportsPromptCache: true,
|
|
|
|
|
+ supportsNativeTools: true,
|
|
|
|
|
+ defaultToolProtocol: "native",
|
|
|
|
|
+ supportsReasoningEffort: ["disable", "medium"],
|
|
|
|
|
+ reasoningEffort: "medium",
|
|
|
|
|
+ preserveReasoning: true,
|
|
|
|
|
+ inputPrice: 0.29,
|
|
|
|
|
+ outputPrice: 1.14,
|
|
|
|
|
+ cacheWritesPrice: 0,
|
|
|
|
|
+ cacheReadsPrice: 0.057,
|
|
|
|
|
+ description:
|
|
|
|
|
+ "GLM-4.7 is Zhipu's latest model with built-in thinking capabilities enabled by default. It provides enhanced reasoning for complex tasks while maintaining fast response times.",
|
|
|
|
|
+ },
|
|
|
} as const satisfies Record<string, ModelInfo>
|
|
} as const satisfies Record<string, ModelInfo>
|
|
|
|
|
|
|
|
export const ZAI_DEFAULT_TEMPERATURE = 0.6
|
|
export const ZAI_DEFAULT_TEMPERATURE = 0.6
|