From 310c7eee92febf5de77711999efcab83bcedfafe Mon Sep 17 00:00:00 2001 From: cpinn <4450689+cpinn@users.noreply.github.com> Date: Thu, 23 Apr 2026 12:22:27 +0000 Subject: [PATCH] fix: add Cerebras models qwen-3-235b-a22b-instruct-2507 and zai-glm-4.7 --- packages/proxy/schema/index.ts | 2 ++ packages/proxy/schema/model_list.json | 31 ++++++++++++++++++++++++++- 2 files changed, 32 insertions(+), 1 deletion(-) diff --git a/packages/proxy/schema/index.ts b/packages/proxy/schema/index.ts index bbf68853..b1c297c7 100644 --- a/packages/proxy/schema/index.ts +++ b/packages/proxy/schema/index.ts @@ -601,6 +601,8 @@ export const AvailableEndpointTypes: { [name: string]: ModelEndpointType[] } = { "grok-2-1212": ["xAI"], "grok-vision-beta": ["xAI"], "grok-beta": ["xAI"], + "qwen-3-235b-a22b-instruct-2507": ["cerebras"], + "zai-glm-4.7": ["cerebras"], "fireworks-ai-4.1b-to-16b": ["fireworks"], "fireworks-ai-56b-to-176b": ["fireworks"], "fireworks-ai-above-16b": ["fireworks"], diff --git a/packages/proxy/schema/model_list.json b/packages/proxy/schema/model_list.json index 5ecd0f81..03d0f227 100644 --- a/packages/proxy/schema/model_list.json +++ b/packages/proxy/schema/model_list.json @@ -4250,6 +4250,21 @@ "displayName": "Qwen QwQ 32B (Preview) 128k", "experimental": true }, + "qwen-3-235b-a22b-instruct-2507": { + "format": "openai", + "flavor": "chat", + "input_cost_per_mil_tokens": 0.6, + "output_cost_per_mil_tokens": 1.2, + "displayName": "Qwen 3 235B Instruct", + "reasoning": false, + "experimental": true, + "deprecation_date": "2026-05-27", + "max_input_tokens": 131072, + "max_output_tokens": 40960, + "available_providers": [ + "cerebras" + ] + }, "Qwen/QwQ-32B": { "format": "openai", "flavor": "chat", @@ -4982,7 +4997,7 @@ "fireworks" ] }, - "accounts/fireworks/models/kimi-k2p6": { + "accounts/fireworks/models/kimi-k2p6": { "format": "openai", "flavor": "chat", "input_cost_per_mil_tokens": 0.95, @@ -9038,6 +9053,20 @@ "baseten" ] }, + "zai-glm-4.7": { + "format": "openai", + "flavor": "chat", + "input_cost_per_mil_tokens": 2.25, + "output_cost_per_mil_tokens": 2.75, + "displayName": "Z.ai GLM 4.7", + "reasoning": true, + "experimental": true, + "max_input_tokens": 131072, + "max_output_tokens": 40960, + "available_providers": [ + "cerebras" + ] + }, "accounts/fireworks/models/glm-4p5": { "format": "openai", "flavor": "chat",