Frank 5 months ago
parent
commit
74f0edc7a8
1 changed files with 36 additions and 5 deletions
  1. 36 5
      cloud/app/src/routes/zen/v1/chat/completions.ts

+ 36 - 5
cloud/app/src/routes/zen/v1/chat/completions.ts

@@ -21,8 +21,23 @@ const MODELS = {
   //    },
   //    headerMappings: {},
   //  },
-  "qwen/qwen3-coder": {
-    id: "qwen/qwen3-coder" as const,
+  "gpt-5": {
+    id: "gpt-5" as const,
+    auth: true,
+    api: "https://inference.baseten.co",
+    apiKey: Resource.BASETEN_API_KEY.value,
+    model: "Qwen/Qwen3-Coder-480B-A35B-Instruct",
+    cost: {
+      input: 0.00000125,
+      output: 0.00001,
+      reasoning: 0,
+      cacheRead: 0.000000125,
+      cacheWrite: 0,
+    },
+    headerMappings: {},
+  },
+  "qwen3-coder": {
+    id: "qwen3-coder" as const,
     auth: true,
     api: "https://inference.baseten.co",
     apiKey: Resource.BASETEN_API_KEY.value,
@@ -36,8 +51,8 @@ const MODELS = {
     },
     headerMappings: {},
   },
-  "moonshotai/kimi-k2": {
-    id: "moonshotai/kimi-k2" as const,
+  "kimi-k2": {
+    id: "kimi-k2" as const,
     auth: true,
     api: "https://inference.baseten.co",
     apiKey: Resource.BASETEN_API_KEY.value,
@@ -52,7 +67,7 @@ const MODELS = {
     headerMappings: {},
   },
   "grok-code": {
-    id: "x-ai/grok-code-fast-1" as const,
+    id: "grok-code" as const,
     auth: false,
     api: "https://api.x.ai",
     apiKey: Resource.XAI_API_KEY.value,
@@ -69,6 +84,22 @@ const MODELS = {
       "x-grok-req-id": "x-opencode-request",
     },
   },
+  // deprecated
+  "qwen/qwen3-coder": {
+    id: "qwen/qwen3-coder" as const,
+    auth: true,
+    api: "https://inference.baseten.co",
+    apiKey: Resource.BASETEN_API_KEY.value,
+    model: "Qwen/Qwen3-Coder-480B-A35B-Instruct",
+    cost: {
+      input: 0.00000038,
+      output: 0.00000153,
+      reasoning: 0,
+      cacheRead: 0,
+      cacheWrite: 0,
+    },
+    headerMappings: {},
+  },
 }
 
 const FREE_WORKSPACES = [