6 месяцев назад · 20e818ad05
--- a/cloud/function/src/gateway.ts
+++ b/cloud/function/src/gateway.ts
@@ -178,456 +178,470 @@ const RestAuth: MiddlewareHandler = async (c, next) => {
 
				 const app = new Hono<{ Bindings: Env; Variables: { keyRecord?: { id: string; workspaceID: string } } }>()
			
 
				   .get("/", (c) => c.text("Hello, world!"))
			
 
				   .post("/v1/chat/completions", GatewayAuth, async (c) => {
			
 
				-    try {
			
 
				-      const body = await c.req.json<ChatCompletionCreateParamsBase>()
			
 
				+    const keyRecord = c.get("keyRecord")!
			
 
				 
			
 
				-      const model = SUPPORTED_MODELS[body.model as keyof typeof SUPPORTED_MODELS]?.model()
			
 
				-      if (!model) throw new Error(`Unsupported model: ${body.model}`)
			
 
				+    return await Actor.provide("system", { workspaceID: keyRecord.workspaceID }, async () => {
			
 
				+      try {
			
 
				+        // Check balance
			
 
				+        const customer = await Billing.get()
			
 
				+        if (customer.balance <= 0) {
			
 
				+          return c.json(
			
 
				+            {
			
 
				+              error: {
			
 
				+                message: "Insufficient balance",
			
 
				+                type: "insufficient_quota",
			
 
				+                param: null,
			
 
				+                code: "insufficient_quota",
			
 
				+              },
			
 
				+            },
			
 
				+            401,
			
 
				+          )
			
 
				+        }
			
 
				 
			
 
				-      const requestBody = transformOpenAIRequestToAiSDK()
			
 
				+        const body = await c.req.json<ChatCompletionCreateParamsBase>()
			
 
				+        const model = SUPPORTED_MODELS[body.model as keyof typeof SUPPORTED_MODELS]?.model()
			
 
				+        if (!model) throw new Error(`Unsupported model: ${body.model}`)
			
 
				 
			
 
				-      return body.stream ? await handleStream() : await handleGenerate()
			
 
				+        const requestBody = transformOpenAIRequestToAiSDK()
			
 
				 
			
 
				-      async function handleStream() {
			
 
				-        const result = await model.doStream({
			
 
				-          ...requestBody,
			
 
				-        })
			
 
				+        return body.stream ? await handleStream() : await handleGenerate()
			
 
				+
			
 
				+        async function handleStream() {
			
 
				+          const result = await model.doStream({
			
 
				+            ...requestBody,
			
 
				+          })
			
 
				 
			
 
				-        const encoder = new TextEncoder()
			
 
				-        const stream = new ReadableStream({
			
 
				-          async start(controller) {
			
 
				-            const id = `chatcmpl-${Date.now()}`
			
 
				-            const created = Math.floor(Date.now() / 1000)
			
 
				-
			
 
				-            try {
			
 
				-              for await (const chunk of result.stream) {
			
 
				-                console.log("!!! CHUNK !!! : " + chunk.type)
			
 
				-                switch (chunk.type) {
			
 
				-                  case "text-delta": {
			
 
				-                    const data = {
			
 
				-                      id,
			
 
				-                      object: "chat.completion.chunk",
			
 
				-                      created,
			
 
				-                      model: body.model,
			
 
				-                      choices: [
			
 
				-                        {
			
 
				-                          index: 0,
			
 
				-                          delta: {
			
 
				-                            content: chunk.delta,
			
 
				+          const encoder = new TextEncoder()
			
 
				+          const stream = new ReadableStream({
			
 
				+            async start(controller) {
			
 
				+              const id = `chatcmpl-${Date.now()}`
			
 
				+              const created = Math.floor(Date.now() / 1000)
			
 
				+
			
 
				+              try {
			
 
				+                for await (const chunk of result.stream) {
			
 
				+                  console.log("!!! CHUNK !!! : " + chunk.type)
			
 
				+                  switch (chunk.type) {
			
 
				+                    case "text-delta": {
			
 
				+                      const data = {
			
 
				+                        id,
			
 
				+                        object: "chat.completion.chunk",
			
 
				+                        created,
			
 
				+                        model: body.model,
			
 
				+                        choices: [
			
 
				+                          {
			
 
				+                            index: 0,
			
 
				+                            delta: {
			
 
				+                              content: chunk.delta,
			
 
				+                            },
			
 
				+                            finish_reason: null,
			
 
				                           },
			
 
				-                          finish_reason: null,
			
 
				-                        },
			
 
				-                      ],
			
 
				+                        ],
			
 
				+                      }
			
 
				+                      controller.enqueue(encoder.encode(`data: ${JSON.stringify(data)}\n\n`))
			
 
				+                      break
			
 
				                     }
			
 
				-                    controller.enqueue(encoder.encode(`data: ${JSON.stringify(data)}\n\n`))
			
 
				-                    break
			
 
				-                  }
			
 
				 
			
 
				-                  case "reasoning-delta": {
			
 
				-                    const data = {
			
 
				-                      id,
			
 
				-                      object: "chat.completion.chunk",
			
 
				-                      created,
			
 
				-                      model: body.model,
			
 
				-                      choices: [
			
 
				-                        {
			
 
				-                          index: 0,
			
 
				-                          delta: {
			
 
				-                            reasoning_content: chunk.delta,
			
 
				+                    case "reasoning-delta": {
			
 
				+                      const data = {
			
 
				+                        id,
			
 
				+                        object: "chat.completion.chunk",
			
 
				+                        created,
			
 
				+                        model: body.model,
			
 
				+                        choices: [
			
 
				+                          {
			
 
				+                            index: 0,
			
 
				+                            delta: {
			
 
				+                              reasoning_content: chunk.delta,
			
 
				+                            },
			
 
				+                            finish_reason: null,
			
 
				                           },
			
 
				-                          finish_reason: null,
			
 
				-                        },
			
 
				-                      ],
			
 
				+                        ],
			
 
				+                      }
			
 
				+                      controller.enqueue(encoder.encode(`data: ${JSON.stringify(data)}\n\n`))
			
 
				+                      break
			
 
				                     }
			
 
				-                    controller.enqueue(encoder.encode(`data: ${JSON.stringify(data)}\n\n`))
			
 
				-                    break
			
 
				-                  }
			
 
				 
			
 
				-                  case "tool-call": {
			
 
				-                    const data = {
			
 
				-                      id,
			
 
				-                      object: "chat.completion.chunk",
			
 
				-                      created,
			
 
				-                      model: body.model,
			
 
				-                      choices: [
			
 
				-                        {
			
 
				-                          index: 0,
			
 
				-                          delta: {
			
 
				-                            tool_calls: [
			
 
				-                              {
			
 
				-                                index: 0,
			
 
				-                                id: chunk.toolCallId,
			
 
				-                                type: "function",
			
 
				-                                function: {
			
 
				-                                  name: chunk.toolName,
			
 
				-                                  arguments: chunk.input,
			
 
				+                    case "tool-call": {
			
 
				+                      const data = {
			
 
				+                        id,
			
 
				+                        object: "chat.completion.chunk",
			
 
				+                        created,
			
 
				+                        model: body.model,
			
 
				+                        choices: [
			
 
				+                          {
			
 
				+                            index: 0,
			
 
				+                            delta: {
			
 
				+                              tool_calls: [
			
 
				+                                {
			
 
				+                                  index: 0,
			
 
				+                                  id: chunk.toolCallId,
			
 
				+                                  type: "function",
			
 
				+                                  function: {
			
 
				+                                    name: chunk.toolName,
			
 
				+                                    arguments: chunk.input,
			
 
				+                                  },
			
 
				                                 },
			
 
				-                              },
			
 
				-                            ],
			
 
				+                              ],
			
 
				+                            },
			
 
				+                            finish_reason: null,
			
 
				                           },
			
 
				-                          finish_reason: null,
			
 
				-                        },
			
 
				-                      ],
			
 
				+                        ],
			
 
				+                      }
			
 
				+                      controller.enqueue(encoder.encode(`data: ${JSON.stringify(data)}\n\n`))
			
 
				+                      break
			
 
				                     }
			
 
				-                    controller.enqueue(encoder.encode(`data: ${JSON.stringify(data)}\n\n`))
			
 
				-                    break
			
 
				-                  }
			
 
				 
			
 
				-                  case "error": {
			
 
				-                    const data = {
			
 
				-                      id,
			
 
				-                      object: "chat.completion.chunk",
			
 
				-                      created,
			
 
				-                      model: body.model,
			
 
				-                      choices: [
			
 
				-                        {
			
 
				-                          index: 0,
			
 
				-                          delta: {},
			
 
				-                          finish_reason: "stop",
			
 
				+                    case "error": {
			
 
				+                      const data = {
			
 
				+                        id,
			
 
				+                        object: "chat.completion.chunk",
			
 
				+                        created,
			
 
				+                        model: body.model,
			
 
				+                        choices: [
			
 
				+                          {
			
 
				+                            index: 0,
			
 
				+                            delta: {},
			
 
				+                            finish_reason: "stop",
			
 
				+                          },
			
 
				+                        ],
			
 
				+                        error: {
			
 
				+                          message: typeof chunk.error === "string" ? chunk.error : chunk.error,
			
 
				+                          type: "server_error",
			
 
				                         },
			
 
				-                      ],
			
 
				-                      error: {
			
 
				-                        message: typeof chunk.error === "string" ? chunk.error : chunk.error,
			
 
				-                        type: "server_error",
			
 
				-                      },
			
 
				+                      }
			
 
				+                      controller.enqueue(encoder.encode(`data: ${JSON.stringify(data)}\n\n`))
			
 
				+                      controller.enqueue(encoder.encode("data: [DONE]\n\n"))
			
 
				+                      controller.close()
			
 
				+                      break
			
 
				                     }
			
 
				-                    controller.enqueue(encoder.encode(`data: ${JSON.stringify(data)}\n\n`))
			
 
				-                    controller.enqueue(encoder.encode("data: [DONE]\n\n"))
			
 
				-                    controller.close()
			
 
				-                    break
			
 
				-                  }
			
 
				 
			
 
				-                  case "finish": {
			
 
				-                    const data = {
			
 
				-                      id,
			
 
				-                      object: "chat.completion.chunk",
			
 
				-                      created,
			
 
				-                      model: body.model,
			
 
				-                      choices: [
			
 
				-                        {
			
 
				-                          index: 0,
			
 
				-                          delta: {},
			
 
				-                          finish_reason:
			
 
				-                            {
			
 
				-                              stop: "stop",
			
 
				-                              length: "length",
			
 
				-                              "content-filter": "content_filter",
			
 
				-                              "tool-calls": "tool_calls",
			
 
				-                              error: "stop",
			
 
				-                              other: "stop",
			
 
				-                              unknown: "stop",
			
 
				-                            }[chunk.finishReason] || "stop",
			
 
				-                        },
			
 
				-                      ],
			
 
				-                      usage: {
			
 
				-                        prompt_tokens: chunk.usage.inputTokens,
			
 
				-                        completion_tokens: chunk.usage.outputTokens,
			
 
				-                        total_tokens: chunk.usage.totalTokens,
			
 
				-                        completion_tokens_details: {
			
 
				-                          reasoning_tokens: chunk.usage.reasoningTokens,
			
 
				-                        },
			
 
				-                        prompt_tokens_details: {
			
 
				-                          cached_tokens: chunk.usage.cachedInputTokens,
			
 
				+                    case "finish": {
			
 
				+                      const data = {
			
 
				+                        id,
			
 
				+                        object: "chat.completion.chunk",
			
 
				+                        created,
			
 
				+                        model: body.model,
			
 
				+                        choices: [
			
 
				+                          {
			
 
				+                            index: 0,
			
 
				+                            delta: {},
			
 
				+                            finish_reason:
			
 
				+                              {
			
 
				+                                stop: "stop",
			
 
				+                                length: "length",
			
 
				+                                "content-filter": "content_filter",
			
 
				+                                "tool-calls": "tool_calls",
			
 
				+                                error: "stop",
			
 
				+                                other: "stop",
			
 
				+                                unknown: "stop",
			
 
				+                              }[chunk.finishReason] || "stop",
			
 
				+                          },
			
 
				+                        ],
			
 
				+                        usage: {
			
 
				+                          prompt_tokens: chunk.usage.inputTokens,
			
 
				+                          completion_tokens: chunk.usage.outputTokens,
			
 
				+                          total_tokens: chunk.usage.totalTokens,
			
 
				+                          completion_tokens_details: {
			
 
				+                            reasoning_tokens: chunk.usage.reasoningTokens,
			
 
				+                          },
			
 
				+                          prompt_tokens_details: {
			
 
				+                            cached_tokens: chunk.usage.cachedInputTokens,
			
 
				+                          },
			
 
				                         },
			
 
				-                      },
			
 
				+                      }
			
 
				+                      await trackUsage(body.model, chunk.usage, chunk.providerMetadata)
			
 
				+                      controller.enqueue(encoder.encode(`data: ${JSON.stringify(data)}\n\n`))
			
 
				+                      controller.enqueue(encoder.encode("data: [DONE]\n\n"))
			
 
				+                      controller.close()
			
 
				+                      break
			
 
				                     }
			
 
				-                    await trackUsage(body.model, chunk.usage, chunk.providerMetadata)
			
 
				-                    controller.enqueue(encoder.encode(`data: ${JSON.stringify(data)}\n\n`))
			
 
				-                    controller.enqueue(encoder.encode("data: [DONE]\n\n"))
			
 
				-                    controller.close()
			
 
				-                    break
			
 
				-                  }
			
 
				 
			
 
				-                  //case "stream-start":
			
 
				-                  //case "response-metadata":
			
 
				-                  case "text-start":
			
 
				-                  case "text-end":
			
 
				-                  case "reasoning-start":
			
 
				-                  case "reasoning-end":
			
 
				-                  case "tool-input-start":
			
 
				-                  case "tool-input-delta":
			
 
				-                  case "tool-input-end":
			
 
				-                  case "raw":
			
 
				-                  default:
			
 
				-                    // Log unknown chunk types for debugging
			
 
				-                    console.warn(`Unknown chunk type: ${(chunk as any).type}`)
			
 
				-                    break
			
 
				+                    //case "stream-start":
			
 
				+                    //case "response-metadata":
			
 
				+                    case "text-start":
			
 
				+                    case "text-end":
			
 
				+                    case "reasoning-start":
			
 
				+                    case "reasoning-end":
			
 
				+                    case "tool-input-start":
			
 
				+                    case "tool-input-delta":
			
 
				+                    case "tool-input-end":
			
 
				+                    case "raw":
			
 
				+                    default:
			
 
				+                      // Log unknown chunk types for debugging
			
 
				+                      console.warn(`Unknown chunk type: ${(chunk as any).type}`)
			
 
				+                      break
			
 
				+                  }
			
 
				                 }
			
 
				+              } catch (error) {
			
 
				+                controller.error(error)
			
 
				               }
			
 
				-            } catch (error) {
			
 
				-              controller.error(error)
			
 
				-            }
			
 
				-          },
			
 
				-        })
			
 
				-
			
 
				-        return new Response(stream, {
			
 
				-          headers: {
			
 
				-            "Content-Type": "text/plain; charset=utf-8",
			
 
				-            "Cache-Control": "no-cache",
			
 
				-            Connection: "keep-alive",
			
 
				-          },
			
 
				-        })
			
 
				-      }
			
 
				-
			
 
				-      async function handleGenerate() {
			
 
				-        const response = await model.doGenerate({
			
 
				-          ...requestBody,
			
 
				-        })
			
 
				-        await trackUsage(body.model, response.usage, response.providerMetadata)
			
 
				-        return c.json({
			
 
				-          id: `chatcmpl-${Date.now()}`,
			
 
				-          object: "chat.completion" as const,
			
 
				-          created: Math.floor(Date.now() / 1000),
			
 
				-          model: body.model,
			
 
				-          choices: [
			
 
				-            {
			
 
				-              index: 0,
			
 
				-              message: {
			
 
				-                role: "assistant" as const,
			
 
				-                content: response.content?.find((c) => c.type === "text")?.text ?? "",
			
 
				-                reasoning_content: response.content?.find((c) => c.type === "reasoning")?.text,
			
 
				-                tool_calls: response.content
			
 
				-                  ?.filter((c) => c.type === "tool-call")
			
 
				-                  .map((toolCall) => ({
			
 
				-                    id: toolCall.toolCallId,
			
 
				-                    type: "function" as const,
			
 
				-                    function: {
			
 
				-                      name: toolCall.toolName,
			
 
				-                      arguments: toolCall.input,
			
 
				-                    },
			
 
				-                  })),
			
 
				-              },
			
 
				-              finish_reason:
			
 
				-                (
			
 
				-                  {
			
 
				-                    stop: "stop",
			
 
				-                    length: "length",
			
 
				-                    "content-filter": "content_filter",
			
 
				-                    "tool-calls": "tool_calls",
			
 
				-                    error: "stop",
			
 
				-                    other: "stop",
			
 
				-                    unknown: "stop",
			
 
				-                  } as const
			
 
				-                )[response.finishReason] || "stop",
			
 
				             },
			
 
				-          ],
			
 
				-          usage: {
			
 
				-            prompt_tokens: response.usage?.inputTokens,
			
 
				-            completion_tokens: response.usage?.outputTokens,
			
 
				-            total_tokens: response.usage?.totalTokens,
			
 
				-            completion_tokens_details: {
			
 
				-              reasoning_tokens: response.usage?.reasoningTokens,
			
 
				-            },
			
 
				-            prompt_tokens_details: {
			
 
				-              cached_tokens: response.usage?.cachedInputTokens,
			
 
				+          })
			
 
				+
			
 
				+          return new Response(stream, {
			
 
				+            headers: {
			
 
				+              "Content-Type": "text/plain; charset=utf-8",
			
 
				+              "Cache-Control": "no-cache",
			
 
				+              Connection: "keep-alive",
			
 
				             },
			
 
				-          },
			
 
				-        })
			
 
				-      }
			
 
				+          })
			
 
				+        }
			
 
				 
			
 
				-      function transformOpenAIRequestToAiSDK() {
			
 
				-        const prompt = transformMessages()
			
 
				-        const tools = transformTools()
			
 
				-
			
 
				-        return {
			
 
				-          prompt,
			
 
				-          maxOutputTokens: body.max_tokens ?? body.max_completion_tokens ?? undefined,
			
 
				-          temperature: body.temperature ?? undefined,
			
 
				-          topP: body.top_p ?? undefined,
			
 
				-          frequencyPenalty: body.frequency_penalty ?? undefined,
			
 
				-          presencePenalty: body.presence_penalty ?? undefined,
			
 
				-          providerOptions: body.reasoning_effort
			
 
				-            ? {
			
 
				-                anthropic: {
			
 
				-                  reasoningEffort: body.reasoning_effort,
			
 
				+        async function handleGenerate() {
			
 
				+          const response = await model.doGenerate({
			
 
				+            ...requestBody,
			
 
				+          })
			
 
				+          await trackUsage(body.model, response.usage, response.providerMetadata)
			
 
				+          return c.json({
			
 
				+            id: `chatcmpl-${Date.now()}`,
			
 
				+            object: "chat.completion" as const,
			
 
				+            created: Math.floor(Date.now() / 1000),
			
 
				+            model: body.model,
			
 
				+            choices: [
			
 
				+              {
			
 
				+                index: 0,
			
 
				+                message: {
			
 
				+                  role: "assistant" as const,
			
 
				+                  content: response.content?.find((c) => c.type === "text")?.text ?? "",
			
 
				+                  reasoning_content: response.content?.find((c) => c.type === "reasoning")?.text,
			
 
				+                  tool_calls: response.content
			
 
				+                    ?.filter((c) => c.type === "tool-call")
			
 
				+                    .map((toolCall) => ({
			
 
				+                      id: toolCall.toolCallId,
			
 
				+                      type: "function" as const,
			
 
				+                      function: {
			
 
				+                        name: toolCall.toolName,
			
 
				+                        arguments: toolCall.input,
			
 
				+                      },
			
 
				+                    })),
			
 
				                 },
			
 
				-              }
			
 
				-            : undefined,
			
 
				-          stopSequences: (typeof body.stop === "string" ? [body.stop] : body.stop) ?? undefined,
			
 
				-          responseFormat: (() => {
			
 
				-            if (!body.response_format) return { type: "text" as const }
			
 
				-            if (body.response_format.type === "json_schema")
			
 
				-              return {
			
 
				-                type: "json" as const,
			
 
				-                schema: body.response_format.json_schema.schema,
			
 
				-                name: body.response_format.json_schema.name,
			
 
				-                description: body.response_format.json_schema.description,
			
 
				-              }
			
 
				-            if (body.response_format.type === "json_object") return { type: "json" as const }
			
 
				-            throw new Error("Unsupported response format")
			
 
				-          })(),
			
 
				-          seed: body.seed ?? undefined,
			
 
				-          tools: tools.tools,
			
 
				-          toolChoice: tools.toolChoice,
			
 
				+                finish_reason:
			
 
				+                  (
			
 
				+                    {
			
 
				+                      stop: "stop",
			
 
				+                      length: "length",
			
 
				+                      "content-filter": "content_filter",
			
 
				+                      "tool-calls": "tool_calls",
			
 
				+                      error: "stop",
			
 
				+                      other: "stop",
			
 
				+                      unknown: "stop",
			
 
				+                    } as const
			
 
				+                  )[response.finishReason] || "stop",
			
 
				+              },
			
 
				+            ],
			
 
				+            usage: {
			
 
				+              prompt_tokens: response.usage?.inputTokens,
			
 
				+              completion_tokens: response.usage?.outputTokens,
			
 
				+              total_tokens: response.usage?.totalTokens,
			
 
				+              completion_tokens_details: {
			
 
				+                reasoning_tokens: response.usage?.reasoningTokens,
			
 
				+              },
			
 
				+              prompt_tokens_details: {
			
 
				+                cached_tokens: response.usage?.cachedInputTokens,
			
 
				+              },
			
 
				+            },
			
 
				+          })
			
 
				         }
			
 
				 
			
 
				-        function transformTools() {
			
 
				-          const { tools, tool_choice } = body
			
 
				-
			
 
				-          if (!tools || tools.length === 0) {
			
 
				-            return { tools: undefined, toolChoice: undefined }
			
 
				+        function transformOpenAIRequestToAiSDK() {
			
 
				+          const prompt = transformMessages()
			
 
				+          const tools = transformTools()
			
 
				+
			
 
				+          return {
			
 
				+            prompt,
			
 
				+            maxOutputTokens: body.max_tokens ?? body.max_completion_tokens ?? undefined,
			
 
				+            temperature: body.temperature ?? undefined,
			
 
				+            topP: body.top_p ?? undefined,
			
 
				+            frequencyPenalty: body.frequency_penalty ?? undefined,
			
 
				+            presencePenalty: body.presence_penalty ?? undefined,
			
 
				+            providerOptions: body.reasoning_effort
			
 
				+              ? {
			
 
				+                  anthropic: {
			
 
				+                    reasoningEffort: body.reasoning_effort,
			
 
				+                  },
			
 
				+                }
			
 
				+              : undefined,
			
 
				+            stopSequences: (typeof body.stop === "string" ? [body.stop] : body.stop) ?? undefined,
			
 
				+            responseFormat: (() => {
			
 
				+              if (!body.response_format) return { type: "text" as const }
			
 
				+              if (body.response_format.type === "json_schema")
			
 
				+                return {
			
 
				+                  type: "json" as const,
			
 
				+                  schema: body.response_format.json_schema.schema,
			
 
				+                  name: body.response_format.json_schema.name,
			
 
				+                  description: body.response_format.json_schema.description,
			
 
				+                }
			
 
				+              if (body.response_format.type === "json_object") return { type: "json" as const }
			
 
				+              throw new Error("Unsupported response format")
			
 
				+            })(),
			
 
				+            seed: body.seed ?? undefined,
			
 
				+            tools: tools.tools,
			
 
				+            toolChoice: tools.toolChoice,
			
 
				           }
			
 
				 
			
 
				-          const aiSdkTools = tools.map((tool) => {
			
 
				-            return {
			
 
				-              type: tool.type,
			
 
				-              name: tool.function.name,
			
 
				-              description: tool.function.description,
			
 
				-              inputSchema: tool.function.parameters!,
			
 
				-            }
			
 
				-          })
			
 
				+          function transformTools() {
			
 
				+            const { tools, tool_choice } = body
			
 
				 
			
 
				-          let aiSdkToolChoice
			
 
				-          if (tool_choice == null) {
			
 
				-            aiSdkToolChoice = undefined
			
 
				-          } else if (tool_choice === "auto") {
			
 
				-            aiSdkToolChoice = { type: "auto" as const }
			
 
				-          } else if (tool_choice === "none") {
			
 
				-            aiSdkToolChoice = { type: "none" as const }
			
 
				-          } else if (tool_choice === "required") {
			
 
				-            aiSdkToolChoice = { type: "required" as const }
			
 
				-          } else if (tool_choice.type === "function") {
			
 
				-            aiSdkToolChoice = {
			
 
				-              type: "tool" as const,
			
 
				-              toolName: tool_choice.function.name,
			
 
				+            if (!tools || tools.length === 0) {
			
 
				+              return { tools: undefined, toolChoice: undefined }
			
 
				             }
			
 
				-          }
			
 
				 
			
 
				-          return { tools: aiSdkTools, toolChoice: aiSdkToolChoice }
			
 
				-        }
			
 
				+            const aiSdkTools = tools.map((tool) => {
			
 
				+              return {
			
 
				+                type: tool.type,
			
 
				+                name: tool.function.name,
			
 
				+                description: tool.function.description,
			
 
				+                inputSchema: tool.function.parameters!,
			
 
				+              }
			
 
				+            })
			
 
				 
			
 
				-        function transformMessages() {
			
 
				-          const { messages } = body
			
 
				-          const prompt: LanguageModelV2Prompt = []
			
 
				-
			
 
				-          for (const message of messages) {
			
 
				-            switch (message.role) {
			
 
				-              case "system": {
			
 
				-                prompt.push({
			
 
				-                  role: "system",
			
 
				-                  content: message.content as string,
			
 
				-                })
			
 
				-                break
			
 
				+            let aiSdkToolChoice
			
 
				+            if (tool_choice == null) {
			
 
				+              aiSdkToolChoice = undefined
			
 
				+            } else if (tool_choice === "auto") {
			
 
				+              aiSdkToolChoice = { type: "auto" as const }
			
 
				+            } else if (tool_choice === "none") {
			
 
				+              aiSdkToolChoice = { type: "none" as const }
			
 
				+            } else if (tool_choice === "required") {
			
 
				+              aiSdkToolChoice = { type: "required" as const }
			
 
				+            } else if (tool_choice.type === "function") {
			
 
				+              aiSdkToolChoice = {
			
 
				+                type: "tool" as const,
			
 
				+                toolName: tool_choice.function.name,
			
 
				               }
			
 
				+            }
			
 
				 
			
 
				-              case "user": {
			
 
				-                if (typeof message.content === "string") {
			
 
				+            return { tools: aiSdkTools, toolChoice: aiSdkToolChoice }
			
 
				+          }
			
 
				+
			
 
				+          function transformMessages() {
			
 
				+            const { messages } = body
			
 
				+            const prompt: LanguageModelV2Prompt = []
			
 
				+
			
 
				+            for (const message of messages) {
			
 
				+              switch (message.role) {
			
 
				+                case "system": {
			
 
				                   prompt.push({
			
 
				-                    role: "user",
			
 
				-                    content: [{ type: "text", text: message.content }],
			
 
				-                  })
			
 
				-                } else {
			
 
				-                  const content = message.content.map((part) => {
			
 
				-                    switch (part.type) {
			
 
				-                      case "text":
			
 
				-                        return { type: "text" as const, text: part.text }
			
 
				-                      case "image_url":
			
 
				-                        return {
			
 
				-                          type: "file" as const,
			
 
				-                          mediaType: "image/jpeg" as const,
			
 
				-                          data: part.image_url.url,
			
 
				-                        }
			
 
				-                      default:
			
 
				-                        throw new Error(`Unsupported content part type: ${(part as any).type}`)
			
 
				-                    }
			
 
				-                  })
			
 
				-                  prompt.push({
			
 
				-                    role: "user",
			
 
				-                    content,
			
 
				+                    role: "system",
			
 
				+                    content: message.content as string,
			
 
				                   })
			
 
				+                  break
			
 
				                 }
			
 
				-                break
			
 
				-              }
			
 
				-
			
 
				-              case "assistant": {
			
 
				-                const content: Array<
			
 
				-                  | { type: "text"; text: string }
			
 
				-                  | {
			
 
				-                      type: "tool-call"
			
 
				-                      toolCallId: string
			
 
				-                      toolName: string
			
 
				-                      input: any
			
 
				-                    }
			
 
				-                > = []
			
 
				 
			
 
				-                if (message.content) {
			
 
				-                  content.push({
			
 
				-                    type: "text",
			
 
				-                    text: message.content as string,
			
 
				-                  })
			
 
				+                case "user": {
			
 
				+                  if (typeof message.content === "string") {
			
 
				+                    prompt.push({
			
 
				+                      role: "user",
			
 
				+                      content: [{ type: "text", text: message.content }],
			
 
				+                    })
			
 
				+                  } else {
			
 
				+                    const content = message.content.map((part) => {
			
 
				+                      switch (part.type) {
			
 
				+                        case "text":
			
 
				+                          return { type: "text" as const, text: part.text }
			
 
				+                        case "image_url":
			
 
				+                          return {
			
 
				+                            type: "file" as const,
			
 
				+                            mediaType: "image/jpeg" as const,
			
 
				+                            data: part.image_url.url,
			
 
				+                          }
			
 
				+                        default:
			
 
				+                          throw new Error(`Unsupported content part type: ${(part as any).type}`)
			
 
				+                      }
			
 
				+                    })
			
 
				+                    prompt.push({
			
 
				+                      role: "user",
			
 
				+                      content,
			
 
				+                    })
			
 
				+                  }
			
 
				+                  break
			
 
				                 }
			
 
				 
			
 
				-                if (message.tool_calls) {
			
 
				-                  for (const toolCall of message.tool_calls) {
			
 
				+                case "assistant": {
			
 
				+                  const content: Array<
			
 
				+                    | { type: "text"; text: string }
			
 
				+                    | {
			
 
				+                        type: "tool-call"
			
 
				+                        toolCallId: string
			
 
				+                        toolName: string
			
 
				+                        input: any
			
 
				+                      }
			
 
				+                  > = []
			
 
				+
			
 
				+                  if (message.content) {
			
 
				                     content.push({
			
 
				-                      type: "tool-call",
			
 
				-                      toolCallId: toolCall.id,
			
 
				-                      toolName: toolCall.function.name,
			
 
				-                      input: JSON.parse(toolCall.function.arguments),
			
 
				+                      type: "text",
			
 
				+                      text: message.content as string,
			
 
				                     })
			
 
				                   }
			
 
				-                }
			
 
				 
			
 
				-                prompt.push({
			
 
				-                  role: "assistant",
			
 
				-                  content,
			
 
				-                })
			
 
				-                break
			
 
				-              }
			
 
				+                  if (message.tool_calls) {
			
 
				+                    for (const toolCall of message.tool_calls) {
			
 
				+                      content.push({
			
 
				+                        type: "tool-call",
			
 
				+                        toolCallId: toolCall.id,
			
 
				+                        toolName: toolCall.function.name,
			
 
				+                        input: JSON.parse(toolCall.function.arguments),
			
 
				+                      })
			
 
				+                    }
			
 
				+                  }
			
 
				 
			
 
				-              case "tool": {
			
 
				-                prompt.push({
			
 
				-                  role: "tool",
			
 
				-                  content: [
			
 
				-                    {
			
 
				-                      type: "tool-result",
			
 
				-                      toolName: "placeholder",
			
 
				-                      toolCallId: message.tool_call_id,
			
 
				-                      output: {
			
 
				-                        type: "text",
			
 
				-                        value: message.content as string,
			
 
				+                  prompt.push({
			
 
				+                    role: "assistant",
			
 
				+                    content,
			
 
				+                  })
			
 
				+                  break
			
 
				+                }
			
 
				+
			
 
				+                case "tool": {
			
 
				+                  prompt.push({
			
 
				+                    role: "tool",
			
 
				+                    content: [
			
 
				+                      {
			
 
				+                        type: "tool-result",
			
 
				+                        toolName: "placeholder",
			
 
				+                        toolCallId: message.tool_call_id,
			
 
				+                        output: {
			
 
				+                          type: "text",
			
 
				+                          value: message.content as string,
			
 
				+                        },
			
 
				                       },
			
 
				-                    },
			
 
				-                  ],
			
 
				-                })
			
 
				-                break
			
 
				-              }
			
 
				+                    ],
			
 
				+                  })
			
 
				+                  break
			
 
				+                }
			
 
				 
			
 
				-              default: {
			
 
				-                throw new Error(`Unsupported message role: ${message.role}`)
			
 
				+                default: {
			
 
				+                  throw new Error(`Unsupported message role: ${message.role}`)
			
 
				+                }
			
 
				               }
			
 
				             }
			
 
				-          }
			
 
				 
			
 
				-          return prompt
			
 
				+            return prompt
			
 
				+          }
			
 
				         }
			
 
				-      }
			
 
				 
			
 
				-      async function trackUsage(model: string, usage: LanguageModelUsage, providerMetadata?: ProviderMetadata) {
			
 
				-        const keyRecord = c.get("keyRecord")
			
 
				-        if (!keyRecord) return
			
 
				-
			
 
				-        const modelData = SUPPORTED_MODELS[model as keyof typeof SUPPORTED_MODELS]
			
 
				-        if (!modelData) throw new Error(`Unsupported model: ${model}`)
			
 
				-
			
 
				-        const inputTokens = usage.inputTokens ?? 0
			
 
				-        const outputTokens = usage.outputTokens ?? 0
			
 
				-        const reasoningTokens = usage.reasoningTokens ?? 0
			
 
				-        const cacheReadTokens = usage.cachedInputTokens ?? 0
			
 
				-        const cacheWriteTokens =
			
 
				-          providerMetadata?.["anthropic"]?.["cacheCreationInputTokens"] ??
			
 
				-          // @ts-expect-error
			
 
				-          providerMetadata?.["bedrock"]?.["usage"]?.["cacheWriteInputTokens"] ??
			
 
				-          0
			
 
				-
			
 
				-        const inputCost = modelData.input * inputTokens
			
 
				-        const outputCost = modelData.output * outputTokens
			
 
				-        const reasoningCost = modelData.reasoning * reasoningTokens
			
 
				-        const cacheReadCost = modelData.cacheRead * cacheReadTokens
			
 
				-        const cacheWriteCost = modelData.cacheWrite * cacheWriteTokens
			
 
				-        const costInCents = (inputCost + outputCost + reasoningCost + cacheReadCost + cacheWriteCost) * 100
			
 
				-
			
 
				-        await Actor.provide("system", { workspaceID: keyRecord.workspaceID }, async () => {
			
 
				+        async function trackUsage(model: string, usage: LanguageModelUsage, providerMetadata?: ProviderMetadata) {
			
 
				+          const modelData = SUPPORTED_MODELS[model as keyof typeof SUPPORTED_MODELS]
			
 
				+          if (!modelData) throw new Error(`Unsupported model: ${model}`)
			
 
				+
			
 
				+          const inputTokens = usage.inputTokens ?? 0
			
 
				+          const outputTokens = usage.outputTokens ?? 0
			
 
				+          const reasoningTokens = usage.reasoningTokens ?? 0
			
 
				+          const cacheReadTokens = usage.cachedInputTokens ?? 0
			
 
				+          const cacheWriteTokens =
			
 
				+            providerMetadata?.["anthropic"]?.["cacheCreationInputTokens"] ??
			
 
				+            // @ts-expect-error
			
 
				+            providerMetadata?.["bedrock"]?.["usage"]?.["cacheWriteInputTokens"] ??
			
 
				+            0
			
 
				+
			
 
				+          const inputCost = modelData.input * inputTokens
			
 
				+          const outputCost = modelData.output * outputTokens
			
 
				+          const reasoningCost = modelData.reasoning * reasoningTokens
			
 
				+          const cacheReadCost = modelData.cacheRead * cacheReadTokens
			
 
				+          const cacheWriteCost = modelData.cacheWrite * cacheWriteTokens
			
 
				+          const costInCents = (inputCost + outputCost + reasoningCost + cacheReadCost + cacheWriteCost) * 100
			
 
				+
			
 
				           await Billing.consume({
			
 
				             model,
			
 
				             inputTokens,
			
@@ -637,18 +651,18 @@ const app = new Hono<{ Bindings: Env; Variables: { keyRecord?: { id: string; wor
 
				             cacheWriteTokens,
			
 
				             costInCents,
			
 
				           })
			
 
				-        })
			
 
				 
			
 
				-        await Database.use((tx) =>
			
 
				-          tx
			
 
				-            .update(KeyTable)
			
 
				-            .set({ timeUsed: sql`now()` })
			
 
				-            .where(eq(KeyTable.id, keyRecord.id)),
			
 
				-        )
			
 
				+          await Database.use((tx) =>
			
 
				+            tx
			
 
				+              .update(KeyTable)
			
 
				+              .set({ timeUsed: sql`now()` })
			
 
				+              .where(eq(KeyTable.id, keyRecord.id)),
			
 
				+          )
			
 
				+        }
			
 
				+      } catch (error: any) {
			
 
				+        return c.json({ error: { message: error.message } }, 500)
			
 
				       }
			
 
				-    } catch (error: any) {
			
 
				-      return c.json({ error: { message: error.message } }, 500)
			
 
				-    }
			
 
				+    })
			
 
				   })
			
 
				   .use("/*", cors())
			
 
				   .use(RestAuth)
			
--- a/opencode.json
+++ b/opencode.json
@@ -1,25 +1,5 @@
 
				 {
			
 
				   "$schema": "https://opencode.ai/config.json",
			
 
				-  "provider": {
			
 
				-    "oc-frank": {
			
 
				-      "npm": "@ai-sdk/openai-compatible",
			
 
				-      "name": "OC-Frank",
			
 
				-      "options": {
			
 
				-        "baseURL": "https://api.gateway.frank.dev.opencode.ai/v1"
			
 
				-      },
			
 
				-      "models": {
			
 
				-        "anthropic/claude-sonnet-4": {
			
 
				-          "name": "Claude Sonnet 4"
			
 
				-        },
			
 
				-        "openai/gpt-4.1": {
			
 
				-          "name": "GPT-4.1"
			
 
				-        },
			
 
				-        "zhipuai/glm-4.5-flash": {
			
 
				-          "name": "GLM-4.5 Flash"
			
 
				-        }
			
 
				-      }
			
 
				-    }
			
 
				-  },
			
 
				   "mcp": {
			
 
				     "context7": {
			
 
				       "type": "remote",