braintrustdata · Joyce Er (joyceerhl) · Oct 13, 2025 · Oct 20, 2025 · graphite-app · Oct 13, 2025
diff --git a/packages/proxy/schema/index.ts b/packages/proxy/schema/index.ts
@@ -304,7 +304,7 @@ export const AvailableEndpointTypes: { [name: string]: ModelEndpointType[] } = {
   "mistral-saba-24b": ["groq"],
   "mixtral-8x7b-32768": ["groq"],
   "gemma-7b-it": ["groq"],
-  "deepseek-r1-distill-llama-70b": ["groq", "cerebras"],
+  "deepseek-r1-distill-llama-70b": ["groq"],
   "gemma2-9b-it": ["groq"],
   "llama-3.3-70b-specdec": ["groq"],
   "llama-3.2-90b-vision-preview": ["groq"],
@@ -330,9 +330,12 @@ export const AvailableEndpointTypes: { [name: string]: ModelEndpointType[] } = {
   "wizardlm-2-8x22b": ["lepton"],
   "nous-hermes-llama2-13b": ["lepton"],
   "dolphin-mixtral-8x7b": ["lepton"],
-  "llama-4-scout-17b-16e-instruct": ["cerebras"],
   "llama3.1-8b": ["cerebras"],
   "llama3.3-70b": ["cerebras"],
+  "qwen-3-32b": ["cerebras"],
+  "qwen-3-235b-a22b-instruct-2507": ["cerebras"],
+  "qwen-3-235b-a22b-thinking-2507": ["cerebras"],
+  "qwen-3-coder-480b": ["cerebras"],
   "accounts/fireworks/models/llama4-maverick-instruct-basic": ["fireworks"],
   "accounts/fireworks/models/llama4-scout-instruct-basic": ["fireworks"],
   "accounts/fireworks/models/llama-v3p3-70b-instruct": ["fireworks"],

diff --git a/packages/proxy/schema/model_list.json b/packages/proxy/schema/model_list.json
@@ -1072,6 +1072,40 @@
     "output_cost_per_mil_tokens": 0.69,
     "displayName": "OpenAI GPT-OSS (120B)"
   },
+  "qwen-3-32b": {
+    "format": "openai",
+    "flavor": "chat",
+    "input_cost_per_mil_tokens": 0.4,
+    "output_cost_per_mil_tokens": 0.8,
+    "displayName": "Qwen 3 32B"
+  },
+  "qwen-3-235b-a22b-instruct-2507": {
+    "format": "openai",
+    "flavor": "chat",
+    "input_cost_per_mil_tokens": 0.6,
+    "output_cost_per_mil_tokens": 1.2,
+    "displayName": "Qwen 3 235B Instruct",
+    "experimental": true,
+    "max_input_tokens": 131000,
+    "max_output_tokens": 8192
+  },
+  "qwen-3-235b-a22b-thinking-2507": {
+    "format": "openai",
+    "flavor": "chat",
+    "input_cost_per_mil_tokens": 0.6,
+    "output_cost_per_mil_tokens": 2.9,
+    "displayName": "Qwen 3 235B Thinking",
+    "experimental": true,
+    "reasoning": true
+  },
+  "qwen-3-coder-480b": {
+    "format": "openai",
+    "flavor": "chat",
+    "input_cost_per_mil_tokens": 2,
+    "output_cost_per_mil_tokens": 2,
+    "displayName": "Qwen 3 Coder 480B",
+    "experimental": true
+  },
   "meta/llama-2-70b-chat": {
     "format": "openai",
     "flavor": "chat",
@@ -2212,7 +2246,7 @@
     "output_cost_per_mil_tokens": 0.1,
     "displayName": "Llama 3.3 70B"
   },
-  "llama3.1-8b": {
+    "llama3.1-8b": {
     "format": "openai",
     "flavor": "chat",
     "input_cost_per_mil_tokens": 0.1,