diff --git a/packages/proxy/schema/index.ts b/packages/proxy/schema/index.ts index 67d8dab6..a0005b29 100644 --- a/packages/proxy/schema/index.ts +++ b/packages/proxy/schema/index.ts @@ -304,7 +304,7 @@ export const AvailableEndpointTypes: { [name: string]: ModelEndpointType[] } = { "mistral-saba-24b": ["groq"], "mixtral-8x7b-32768": ["groq"], "gemma-7b-it": ["groq"], - "deepseek-r1-distill-llama-70b": ["groq", "cerebras"], + "deepseek-r1-distill-llama-70b": ["groq"], "gemma2-9b-it": ["groq"], "llama-3.3-70b-specdec": ["groq"], "llama-3.2-90b-vision-preview": ["groq"], @@ -330,9 +330,12 @@ export const AvailableEndpointTypes: { [name: string]: ModelEndpointType[] } = { "wizardlm-2-8x22b": ["lepton"], "nous-hermes-llama2-13b": ["lepton"], "dolphin-mixtral-8x7b": ["lepton"], - "llama-4-scout-17b-16e-instruct": ["cerebras"], "llama3.1-8b": ["cerebras"], "llama3.3-70b": ["cerebras"], + "qwen-3-32b": ["cerebras"], + "qwen-3-235b-a22b-instruct-2507": ["cerebras"], + "qwen-3-235b-a22b-thinking-2507": ["cerebras"], + "qwen-3-coder-480b": ["cerebras"], "accounts/fireworks/models/llama4-maverick-instruct-basic": ["fireworks"], "accounts/fireworks/models/llama4-scout-instruct-basic": ["fireworks"], "accounts/fireworks/models/llama-v3p3-70b-instruct": ["fireworks"], diff --git a/packages/proxy/schema/model_list.json b/packages/proxy/schema/model_list.json index 42ca0555..e91d566b 100644 --- a/packages/proxy/schema/model_list.json +++ b/packages/proxy/schema/model_list.json @@ -1072,6 +1072,40 @@ "output_cost_per_mil_tokens": 0.69, "displayName": "OpenAI GPT-OSS (120B)" }, + "qwen-3-32b": { + "format": "openai", + "flavor": "chat", + "input_cost_per_mil_tokens": 0.4, + "output_cost_per_mil_tokens": 0.8, + "displayName": "Qwen 3 32B" + }, + "qwen-3-235b-a22b-instruct-2507": { + "format": "openai", + "flavor": "chat", + "input_cost_per_mil_tokens": 0.6, + "output_cost_per_mil_tokens": 1.2, + "displayName": "Qwen 3 235B Instruct", + "experimental": true, + "max_input_tokens": 131000, + "max_output_tokens": 8192 + }, + "qwen-3-235b-a22b-thinking-2507": { + "format": "openai", + "flavor": "chat", + "input_cost_per_mil_tokens": 0.6, + "output_cost_per_mil_tokens": 2.9, + "displayName": "Qwen 3 235B Thinking", + "experimental": true, + "reasoning": true + }, + "qwen-3-coder-480b": { + "format": "openai", + "flavor": "chat", + "input_cost_per_mil_tokens": 2, + "output_cost_per_mil_tokens": 2, + "displayName": "Qwen 3 Coder 480B", + "experimental": true + }, "meta/llama-2-70b-chat": { "format": "openai", "flavor": "chat",