Skip to content

Commit 6e00997

Browse files
ErdemGKSL and erdemgoksel authored
feat: Update Z.AI models with new variants and pricing (#10860)
Co-authored-by: erdemgoksel <erdemgoksel@MAU-BILISIM42>
1 parent 1f7be76 commit 6e00997

1 file changed

Lines changed: 120 additions & 0 deletions

File tree

  • packages/types/src/providers

packages/types/src/providers/zai.ts

Lines changed: 120 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -81,6 +81,18 @@ export const internationalZAiModels = {
8181
description:
8282
"GLM-4.5V is Z.AI's multimodal visual reasoning model (image/video/text/file input), optimized for GUI tasks, grounding, and document/video understanding.",
8383
},
84+
"glm-4.6v": {
85+
maxTokens: 16_384,
86+
contextWindow: 131_072,
87+
supportsImages: true,
88+
supportsPromptCache: true,
89+
inputPrice: 0.3,
90+
outputPrice: 0.9,
91+
cacheWritesPrice: 0,
92+
cacheReadsPrice: 0.05,
93+
description:
94+
"GLM-4.6V is an advanced multimodal vision model with improved performance and cost-efficiency for visual understanding tasks.",
95+
},
8496
"glm-4.6": {
8597
maxTokens: 16_384,
8698
contextWindow: 200_000,
@@ -108,6 +120,54 @@ export const internationalZAiModels = {
108120
description:
109121
"GLM-4.7 is Zhipu's latest model with built-in thinking capabilities enabled by default. It provides enhanced reasoning for complex tasks while maintaining fast response times.",
110122
},
123+
"glm-4.7-flash": {
124+
maxTokens: 16_384,
125+
contextWindow: 200_000,
126+
supportsImages: false,
127+
supportsPromptCache: true,
128+
inputPrice: 0,
129+
outputPrice: 0,
130+
cacheWritesPrice: 0,
131+
cacheReadsPrice: 0,
132+
description:
133+
"GLM-4.7-Flash is a free, high-speed variant of GLM-4.7 offering fast responses for reasoning and coding tasks.",
134+
},
135+
"glm-4.7-flashx": {
136+
maxTokens: 16_384,
137+
contextWindow: 200_000,
138+
supportsImages: false,
139+
supportsPromptCache: true,
140+
inputPrice: 0.07,
141+
outputPrice: 0.4,
142+
cacheWritesPrice: 0,
143+
cacheReadsPrice: 0.01,
144+
description:
145+
"GLM-4.7-FlashX is an ultra-fast variant of GLM-4.7 with exceptional speed and cost-effectiveness for high-throughput applications.",
146+
},
147+
"glm-4.6v-flash": {
148+
maxTokens: 16_384,
149+
contextWindow: 131_072,
150+
supportsImages: true,
151+
supportsPromptCache: true,
152+
inputPrice: 0,
153+
outputPrice: 0,
154+
cacheWritesPrice: 0,
155+
cacheReadsPrice: 0,
156+
description:
157+
"GLM-4.6V-Flash is a free, high-speed multimodal vision model for rapid image understanding and visual reasoning tasks.",
158+
},
159+
"glm-4.6v-flashx": {
160+
maxTokens: 16_384,
161+
contextWindow: 131_072,
162+
supportsImages: true,
163+
supportsPromptCache: true,
164+
inputPrice: 0.04,
165+
outputPrice: 0.4,
166+
cacheWritesPrice: 0,
167+
cacheReadsPrice: 0.004,
168+
description:
169+
"GLM-4.6V-FlashX is an ultra-fast multimodal vision model optimized for high-speed visual processing at low cost.",
170+
},
111171
"glm-4-32b-0414-128k": {
112172
maxTokens: 16_384,
113173
contextWindow: 131_072,
@@ -221,6 +281,66 @@ export const mainlandZAiModels = {
221281
description:
222282
"GLM-4.7 is Zhipu's latest model with built-in thinking capabilities enabled by default. It provides enhanced reasoning for complex tasks while maintaining fast response times.",
223283
},
284+
"glm-4.7-flash": {
285+
maxTokens: 16_384,
286+
contextWindow: 204_800,
287+
supportsImages: false,
288+
supportsPromptCache: true,
289+
inputPrice: 0,
290+
outputPrice: 0,
291+
cacheWritesPrice: 0,
292+
cacheReadsPrice: 0,
293+
description:
294+
"GLM-4.7-Flash is a free, high-speed variant of GLM-4.7 offering fast responses for reasoning and coding tasks.",
295+
},
296+
"glm-4.7-flashx": {
297+
maxTokens: 16_384,
298+
contextWindow: 204_800,
299+
supportsImages: false,
300+
supportsPromptCache: true,
301+
inputPrice: 0.035,
302+
outputPrice: 0.2,
303+
cacheWritesPrice: 0,
304+
cacheReadsPrice: 0.005,
305+
description:
306+
"GLM-4.7-FlashX is an ultra-fast variant of GLM-4.7 with exceptional speed and cost-effectiveness for high-throughput applications.",
307+
},
308+
"glm-4.6v": {
309+
maxTokens: 16_384,
310+
contextWindow: 131_072,
311+
supportsImages: true,
312+
supportsPromptCache: true,
313+
inputPrice: 0.15,
314+
outputPrice: 0.45,
315+
cacheWritesPrice: 0,
316+
cacheReadsPrice: 0.025,
317+
description:
318+
"GLM-4.6V is an advanced multimodal vision model with improved performance and cost-efficiency for visual understanding tasks.",
319+
},
320+
"glm-4.6v-flash": {
321+
maxTokens: 16_384,
322+
contextWindow: 131_072,
323+
supportsImages: true,
324+
supportsPromptCache: true,
325+
inputPrice: 0,
326+
outputPrice: 0,
327+
cacheWritesPrice: 0,
328+
cacheReadsPrice: 0,
329+
description:
330+
"GLM-4.6V-Flash is a free, high-speed multimodal vision model for rapid image understanding and visual reasoning tasks.",
331+
},
332+
"glm-4.6v-flashx": {
333+
maxTokens: 16_384,
334+
contextWindow: 131_072,
335+
supportsImages: true,
336+
supportsPromptCache: true,
337+
inputPrice: 0.02,
338+
outputPrice: 0.2,
339+
cacheWritesPrice: 0,
340+
cacheReadsPrice: 0.002,
341+
description:
342+
"GLM-4.6V-FlashX is an ultra-fast multimodal vision model optimized for high-speed visual processing at low cost.",
343+
},
224344
} as const satisfies Record<string, ModelInfo>
225345

226346
export const ZAI_DEFAULT_TEMPERATURE = 0.6

0 commit comments

Comments (0)