Skip to content
Open
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
120 changes: 120 additions & 0 deletions packages/types/src/providers/zai.ts
Original file line number Diff line number Diff line change
Expand Up @@ -81,6 +81,18 @@ export const internationalZAiModels = {
description:
"GLM-4.5V is Z.AI's multimodal visual reasoning model (image/video/text/file input), optimized for GUI tasks, grounding, and document/video understanding.",
},
"glm-4.6v": {
maxTokens: 16_384,
contextWindow: 131_072,
supportsImages: true,
supportsPromptCache: true,
inputPrice: 0.3,
outputPrice: 0.9,
cacheWritesPrice: 0,
cacheReadsPrice: 0.05,
description:
"GLM-4.6V is an advanced multimodal vision model with improved performance and cost-efficiency for visual understanding tasks.",
},
"glm-4.6": {
maxTokens: 16_384,
contextWindow: 200_000,
Expand Down Expand Up @@ -108,6 +120,54 @@ export const internationalZAiModels = {
description:
"GLM-4.7 is Zhipu's latest model with built-in thinking capabilities enabled by default. It provides enhanced reasoning for complex tasks while maintaining fast response times.",
},
"glm-4.7-flash": {
maxTokens: 16_384,
contextWindow: 200_000,
supportsImages: false,
supportsPromptCache: true,
inputPrice: 0,
outputPrice: 0,
cacheWritesPrice: 0,
cacheReadsPrice: 0,
description:
"GLM-4.7-Flash is a free, high-speed variant of GLM-4.7 offering fast responses for reasoning and coding tasks.",
},
"glm-4.7-flashx": {
maxTokens: 16_384,
contextWindow: 200_000,
supportsImages: false,
supportsPromptCache: true,
inputPrice: 0.07,
outputPrice: 0.4,
cacheWritesPrice: 0,
cacheReadsPrice: 0.01,
description:
"GLM-4.7-FlashX is an ultra-fast variant of GLM-4.7 with exceptional speed and cost-effectiveness for high-throughput applications.",
},
"glm-4.6v-flash": {
maxTokens: 16_384,
contextWindow: 131_072,
supportsImages: true,
supportsPromptCache: true,
inputPrice: 0,
outputPrice: 0,
cacheWritesPrice: 0,
cacheReadsPrice: 0,
description:
"GLM-4.6V-Flash is a free, high-speed multimodal vision model for rapid image understanding and visual reasoning tasks.",
},
"glm-4.6v-flashx": {
maxTokens: 16_384,
contextWindow: 131_072,
supportsImages: true,
supportsPromptCache: true,
inputPrice: 0.04,
outputPrice: 0.4,
cacheWritesPrice: 0,
cacheReadsPrice: 0.004,
description:
"GLM-4.6V-FlashX is an ultra-fast multimodal vision model optimized for high-speed visual processing at low cost.",
},
"glm-4-32b-0414-128k": {
maxTokens: 16_384,
contextWindow: 131_072,
Expand Down Expand Up @@ -221,6 +281,66 @@ export const mainlandZAiModels = {
description:
"GLM-4.7 is Zhipu's latest model with built-in thinking capabilities enabled by default. It provides enhanced reasoning for complex tasks while maintaining fast response times.",
},
"glm-4.7-flash": {
maxTokens: 16_384,
contextWindow: 204_800,
supportsImages: false,
supportsPromptCache: true,
inputPrice: 0,
outputPrice: 0,
cacheWritesPrice: 0,
cacheReadsPrice: 0,
description:
"GLM-4.7-Flash is a free, high-speed variant of GLM-4.7 offering fast responses for reasoning and coding tasks.",
},
"glm-4.7-flashx": {
maxTokens: 16_384,
contextWindow: 204_800,
supportsImages: false,
supportsPromptCache: true,
inputPrice: 0.035,
outputPrice: 0.2,
cacheWritesPrice: 0,
cacheReadsPrice: 0.005,
description:
"GLM-4.7-FlashX is an ultra-fast variant of GLM-4.7 with exceptional speed and cost-effectiveness for high-throughput applications.",
},
"glm-4.6v": {
maxTokens: 16_384,
contextWindow: 131_072,
supportsImages: true,
supportsPromptCache: true,
inputPrice: 0.15,
outputPrice: 0.45,
cacheWritesPrice: 0,
cacheReadsPrice: 0.025,
description:
"GLM-4.6V is an advanced multimodal vision model with improved performance and cost-efficiency for visual understanding tasks.",
},
"glm-4.6v-flash": {
maxTokens: 16_384,
contextWindow: 131_072,
supportsImages: true,
supportsPromptCache: true,
inputPrice: 0,
outputPrice: 0,
cacheWritesPrice: 0,
cacheReadsPrice: 0,
description:
"GLM-4.6V-Flash is a free, high-speed multimodal vision model for rapid image understanding and visual reasoning tasks.",
},
"glm-4.6v-flashx": {
maxTokens: 16_384,
contextWindow: 131_072,
supportsImages: true,
supportsPromptCache: true,
inputPrice: 0.02,
outputPrice: 0.2,
cacheWritesPrice: 0,
cacheReadsPrice: 0.002,
description:
"GLM-4.6V-FlashX is an ultra-fast multimodal vision model optimized for high-speed visual processing at low cost.",
},
} as const satisfies Record<string, ModelInfo>

export const ZAI_DEFAULT_TEMPERATURE = 0.6
Expand Down
Loading