billing-model-source.test.ts 22 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624625626627628629630631632633634635636637638639640641642643644645646647648649650651652653654655656657658659660661662663664665666667668669670671672673674675676677678679680681682683684685686687688689690691692693694695696
  1. import { beforeEach, describe, expect, it, vi } from "vitest";
  2. import type { ModelPrice, ModelPriceData } from "@/types/model-price";
  3. import type { SystemSettings } from "@/types/system-config";
  // Promises handed to the mocked AsyncTaskManager.register; tests await them via drainAsyncTasks().
  const asyncTasks: Array<Promise<void>> = [];
  // Payloads passed to the mocked requestCloudPriceTableSync, in call order.
  const cloudPriceSyncRequests: Array<{ reason: string }> = [];

  // NOTE: Vitest hoists vi.mock calls, so every factory below touches the two arrays above
  // only from inside callbacks that run later, never while the factory itself is executing.

  // Background tasks are captured instead of scheduled so tests can await them explicitly.
  vi.mock("@/lib/async-task-manager", () => {
    const register = (_taskId: string, promise: Promise<void>): AbortController => {
      asyncTasks.push(promise);
      return new AbortController();
    };
    return {
      AsyncTaskManager: {
        register,
        cleanup: (): void => {},
        cancel: (): void => {},
      },
    };
  });

  // Silent logger: every level is a no-op.
  vi.mock("@/lib/logger", () => {
    const levels = ["debug", "info", "warn", "error", "trace"] as const;
    const logger = Object.fromEntries(levels.map((level) => [level, (): void => {}] as const));
    return { logger };
  });

  // Record cloud price sync requests instead of performing them.
  vi.mock("@/lib/price-sync/cloud-price-updater", () => {
    const requestCloudPriceTableSync = (payload: { reason: string }): void => {
      cloudPriceSyncRequests.push(payload);
    };
    return { requestCloudPriceTableSync };
  });

  // Repository modules: bare spies whose behaviour each test configures.
  vi.mock("@/repository/model-price", () => {
    const findLatestPriceByModel = vi.fn();
    return { findLatestPriceByModel };
  });

  vi.mock("@/repository/system-config", () => {
    const getSystemSettings = vi.fn();
    return { getSystemSettings };
  });

  vi.mock("@/repository/message", () => {
    const updateMessageRequestCost = vi.fn();
    const updateMessageRequestDetails = vi.fn();
    const updateMessageRequestDuration = vi.fn();
    return { updateMessageRequestCost, updateMessageRequestDetails, updateMessageRequestDuration };
  });

  // Session / rate-limit services: bare spies as well.
  vi.mock("@/lib/session-manager", () => {
    const SessionManager = {
      updateSessionUsage: vi.fn(),
      storeSessionResponse: vi.fn(),
      extractCodexPromptCacheKey: vi.fn(),
      updateSessionWithCodexCacheKey: vi.fn(),
    };
    return { SessionManager };
  });

  vi.mock("@/lib/rate-limit", () => {
    const RateLimitService = {
      trackCost: vi.fn(),
      trackUserDailyCost: vi.fn(),
    };
    return { RateLimitService };
  });

  vi.mock("@/lib/session-tracker", () => {
    const SessionTracker = { refreshSession: vi.fn() };
    return { SessionTracker };
  });

  // Each getInstance() call returns a fresh tracker whose endRequest does nothing.
  vi.mock("@/lib/proxy-status-tracker", () => {
    const getInstance = () => ({ endRequest: (): void => {} });
    return { ProxyStatusTracker: { getInstance } };
  });
  67. import { ProxyResponseHandler } from "@/app/v1/_lib/proxy/response-handler";
  68. import { ProxySession } from "@/app/v1/_lib/proxy/session";
  69. import { SessionManager } from "@/lib/session-manager";
  70. import { RateLimitService } from "@/lib/rate-limit";
  71. import { SessionTracker } from "@/lib/session-tracker";
  72. import {
  73. updateMessageRequestCost,
  74. updateMessageRequestDetails,
  75. updateMessageRequestDuration,
  76. } from "@/repository/message";
  77. import { findLatestPriceByModel } from "@/repository/model-price";
  78. import { getSystemSettings } from "@/repository/system-config";
  // Reset every piece of module-level state before each test so that no test can observe
  // leftovers from a previous one.
  beforeEach(() => {
    // Drop recorded calls on all mocks (implementations are kept). Suites in this file assert
    // on `mock.calls.length`, which would otherwise include calls made by earlier tests.
    vi.clearAllMocks();
    // Discard tasks a previous (possibly failed) test registered but never drained.
    asyncTasks.length = 0;
    // Forget cloud price sync requests recorded by earlier tests.
    cloudPriceSyncRequests.length = 0;
  });
  /**
   * Builds a SystemSettings fixture in which only `billingModelSource` varies.
   *
   * @param billingModelSource value stored in the fixture's `billingModelSource` field
   * @returns a settings object whose `createdAt` and `updatedAt` share one Date instance
   */
  function makeSystemSettings(
    billingModelSource: SystemSettings["billingModelSource"]
  ): SystemSettings {
    const timestamp = new Date();
    const responseFixerConfig = {
      fixTruncatedJson: true,
      fixSseFormat: true,
      fixEncoding: true,
      maxJsonDepth: 200,
      maxFixSize: 1024 ** 2, // 1 MiB
    };

    const settings: SystemSettings = {
      id: 1,
      siteTitle: "test",
      allowGlobalUsageView: false,
      currencyDisplay: "USD",
      billingModelSource,
      timezone: null,
      enableAutoCleanup: false,
      cleanupRetentionDays: 30,
      cleanupSchedule: "0 2 * * *",
      cleanupBatchSize: 10_000,
      enableClientVersionCheck: false,
      verboseProviderError: false,
      enableHttp2: false,
      enableResponsesWebSocket: false,
      interceptAnthropicWarmupRequests: false,
      enableResponseFixer: true,
      responseFixerConfig,
      createdAt: timestamp,
      updatedAt: timestamp,
    };
    return settings;
  }
  /**
   * Wraps price data in a ModelPrice record fixture.
   *
   * @param modelName model name stored on the record
   * @param priceData price payload stored on the record (same reference, not copied)
   * @returns a record with id 1 whose `createdAt` and `updatedAt` share one Date instance
   */
  function makePriceRecord(modelName: string, priceData: ModelPriceData): ModelPrice {
    const timestamp = new Date();
    const record: ModelPrice = {
      id: 1,
      modelName,
      priceData,
      createdAt: timestamp,
      updatedAt: timestamp,
    };
    return record;
  }
  /**
   * Creates a ProxySession fixture with provider, auth state and message context already set.
   *
   * @param originalModel model passed to `session.setOriginalModel`
   * @param redirectedModel model placed in the request payload (`request.model`)
   * @param sessionId id passed to `session.setSessionId`
   * @param messageId id used for the message context
   * @param providerOverrides fields spread over the default provider fixture
   * @param requestMessage request body stored on the session; defaults to an empty object
   * @returns the configured session
   */
  function createSession({
    originalModel,
    redirectedModel,
    sessionId,
    messageId,
    providerOverrides,
    requestMessage,
  }: {
    originalModel: string;
    redirectedModel: string;
    sessionId: string;
    messageId: number;
    providerOverrides?: Record<string, unknown>;
    requestMessage?: Record<string, unknown>;
  }): ProxySession {
    type SessionInit = {
      startTime: number;
      method: string;
      requestUrl: URL;
      headers: Headers;
      headerLog: string;
      request: { message: Record<string, unknown>; log: string; model: string | null };
      userAgent: string | null;
      context: unknown;
      clientAbortSignal: AbortSignal | null;
    };

    // The cast gives the class a constructor signature the test can call directly
    // (presumably the real constructor is not public; confirm against ProxySession).
    const SessionCtor = ProxySession as unknown as new (init: SessionInit) => ProxySession;

    const init: SessionInit = {
      startTime: Date.now(),
      method: "POST",
      requestUrl: new URL("http://localhost/v1/messages"),
      headers: new Headers(),
      headerLog: "",
      request: { message: requestMessage ?? {}, log: "(test)", model: redirectedModel },
      userAgent: null,
      context: {},
      clientAbortSignal: null,
    };
    const session = new SessionCtor(init);

    session.setOriginalModel(originalModel);
    session.setSessionId(sessionId);

    // Partial fixtures: only a handful of fields are populated, hence the `as any` casts.
    const provider = {
      id: 99,
      name: "test-provider",
      url: "https://api.anthropic.com",
      providerType: "claude",
      costMultiplier: 1.0,
      streamingIdleTimeoutMs: 0,
      ...providerOverrides,
    } as any;
    const user = {
      id: 123,
      name: "test-user",
      dailyResetTime: "00:00",
      dailyResetMode: "fixed",
    } as any;
    const key = {
      id: 456,
      name: "test-key",
      dailyResetTime: "00:00",
      dailyResetMode: "fixed",
    } as any;
    const apiKey = "sk-test";

    session.setProvider(provider);
    session.setAuthState({ user, key, apiKey, success: true });
    session.setMessageContext({ id: messageId, createdAt: new Date(), user, key, apiKey });

    return session;
  }
  /**
   * Builds a 200 JSON response shaped like a non-streaming upstream reply.
   *
   * @param usage token counts placed under the `usage` key
   * @param extras optional top-level fields; spread last, so they override `type` / `usage`
   * @returns a Response with content-type `application/json`
   */
  function createNonStreamResponse(
    usage: { input_tokens: number; output_tokens: number },
    extras?: Record<string, unknown>
  ): Response {
    const payload: Record<string, unknown> = { type: "message", usage, ...extras };
    const init: ResponseInit = {
      status: 200,
      headers: { "content-type": "application/json" },
    };
    return new Response(JSON.stringify(payload), init);
  }
  /**
   * Builds a 200 SSE response whose body is one `message_delta` event carrying `usage`.
   *
   * @param usage token counts serialised into the event's `data:` line
   * @returns a Response with content-type `text/event-stream`; the stream emits one chunk and closes
   */
  function createStreamResponse(usage: { input_tokens: number; output_tokens: number }): Response {
    const sseText = `event: message_delta\ndata: ${JSON.stringify({ usage })}\n\n`;
    const chunk = new TextEncoder().encode(sseText);

    const body = new ReadableStream<Uint8Array>({
      start(controller) {
        controller.enqueue(chunk);
        controller.close();
      },
    });
    const init: ResponseInit = {
      status: 200,
      headers: { "content-type": "text/event-stream" },
    };
    return new Response(body, init);
  }
  /**
   * Awaits every task captured in `asyncTasks` and leaves the queue empty.
   *
   * Tasks may register further tasks while they run, so the queue is drained in rounds until
   * nothing new has been added; a single snapshot would leave those late tasks for the next test.
   * Rejections propagate to the caller (via `Promise.all`), failing the test.
   */
  async function drainAsyncTasks(): Promise<void> {
    do {
      // Take ownership of the current batch so tasks pushed meanwhile form the next round.
      const pending = asyncTasks.splice(0, asyncTasks.length);
      await Promise.all(pending);
    } while (asyncTasks.length > 0);
  }
  /**
   * Sends one mocked upstream response (2 input / 3 output tokens) through
   * ProxyResponseHandler.dispatch and reports the cost seen by each collaborator.
   *
   * The original model is priced at 1 per token and the redirected model at 10 per token,
   * so the reported cost shows which model was used for billing.
   *
   * @param billingModelSource value placed in the mocked system settings
   * @param isStream whether the upstream response is SSE (true) or plain JSON (false)
   * @returns the first cost written via updateMessageRequestCost (stringified), the first string
   *          `costUsd` passed to SessionManager.updateSessionUsage, and the first cost passed to
   *          RateLimitService.trackCost; `""` / `""` / `NaN` when the respective call never happened
   */
  async function runScenario({
    billingModelSource,
    isStream,
  }: {
    billingModelSource: SystemSettings["billingModelSource"];
    isStream: boolean;
  }): Promise<{ dbCostUsd: string; sessionCostUsd: string; rateLimitCost: number }> {
    const tokenUsage = { input_tokens: 2, output_tokens: 3 };
    const originalModel = "original-model";
    const redirectedModel = "redirected-model";

    // Price table keyed by model name; any other model has no price.
    const priceByModel = new Map<string, ModelPriceData>([
      [originalModel, { input_cost_per_token: 1, output_cost_per_token: 1 }],
      [redirectedModel, { input_cost_per_token: 10, output_cost_per_token: 10 }],
    ]);

    vi.mocked(getSystemSettings).mockResolvedValue(makeSystemSettings(billingModelSource));
    vi.mocked(findLatestPriceByModel).mockImplementation(async (modelName: string) => {
      const priceData = priceByModel.get(modelName);
      return priceData === undefined ? null : makePriceRecord(modelName, priceData);
    });

    // Collaborators whose results are irrelevant here simply resolve.
    vi.mocked(updateMessageRequestDetails).mockResolvedValue(undefined);
    vi.mocked(updateMessageRequestDuration).mockResolvedValue(undefined);
    vi.mocked(SessionManager.storeSessionResponse).mockResolvedValue(undefined);
    vi.mocked(RateLimitService.trackUserDailyCost).mockResolvedValue(undefined);
    vi.mocked(SessionTracker.refreshSession).mockResolvedValue(undefined);

    // Collaborators that receive a cost record what they were given.
    const recordedDbCosts: string[] = [];
    const recordedSessionCosts: string[] = [];
    const recordedRateLimitCosts: number[] = [];

    vi.mocked(updateMessageRequestCost).mockImplementation(async (_id: number, costUsd: unknown) => {
      recordedDbCosts.push(String(costUsd));
    });
    vi.mocked(SessionManager.updateSessionUsage).mockImplementation(
      async (_sessionId: string, payload: Record<string, unknown>) => {
        const { costUsd } = payload;
        // Only string costs are recorded; payloads without one are ignored.
        if (typeof costUsd === "string") {
          recordedSessionCosts.push(costUsd);
        }
      }
    );
    vi.mocked(RateLimitService.trackCost).mockImplementation(
      async (_keyId: number, _providerId: number, _sessionId: string, costUsd: number) => {
        recordedRateLimitCosts.push(costUsd);
      }
    );

    const modeTag = isStream ? "s" : "n";
    const session = createSession({
      originalModel,
      redirectedModel,
      sessionId: `sess-${billingModelSource}-${modeTag}`,
      messageId: isStream ? 2001 : 2000,
    });

    const upstreamResponse = isStream
      ? createStreamResponse(tokenUsage)
      : createNonStreamResponse(tokenUsage);
    const clientResponse = await ProxyResponseHandler.dispatch(session, upstreamResponse);
    if (isStream) {
      // Consume the client-facing stream before draining the background tasks.
      await clientResponse.text();
    }
    await drainAsyncTasks();

    return {
      dbCostUsd: recordedDbCosts[0] ?? "",
      sessionCostUsd: recordedSessionCosts[0] ?? "",
      rateLimitCost: recordedRateLimitCosts[0] ?? Number.NaN,
    };
  }
  // Verifies that the cost written to the DB, the cost stored on the session and the cost
  // reported to the rate limiter agree, for each billing model source and response mode,
  // plus provider-specific pricing cases for the gpt-5.4 fixture.
  describe("Billing model source - Redis session cost vs DB cost", () => {
    // Matrix of billing source x response mode. With 2 input + 3 output tokens the assertions
    // expect 5 when billed at the original model's price (1/token) and 50 at the redirected
    // model's price (10/token).
    const consistencyCases: Array<{
      title: string;
      billingModelSource: SystemSettings["billingModelSource"];
      isStream: boolean;
      costUsd: string;
      rateLimitCost: number;
    }> = [
      {
        title: "非流式响应:配置 = original 时 Session 成本与数据库一致",
        billingModelSource: "original",
        isStream: false,
        costUsd: "5",
        rateLimitCost: 5,
      },
      {
        title: "非流式响应:配置 = redirected 时 Session 成本与数据库一致",
        billingModelSource: "redirected",
        isStream: false,
        costUsd: "50",
        rateLimitCost: 50,
      },
      {
        title: "流式响应:配置 = original 时 Session 成本与数据库一致",
        billingModelSource: "original",
        isStream: true,
        costUsd: "5",
        rateLimitCost: 5,
      },
      {
        title: "流式响应:配置 = redirected 时 Session 成本与数据库一致",
        billingModelSource: "redirected",
        isStream: true,
        costUsd: "50",
        rateLimitCost: 50,
      },
    ];

    for (const { title, billingModelSource, isStream, costUsd, rateLimitCost } of consistencyCases) {
      it(title, async () => {
        const result = await runScenario({ billingModelSource, isStream });

        expect(result.dbCostUsd).toBe(costUsd);
        expect(result.sessionCostUsd).toBe(costUsd);
        expect(result.rateLimitCost).toBe(rateLimitCost);
      });
    }

    it("从 original 切换到 redirected 后应生效", async () => {
      const original = await runScenario({ billingModelSource: "original", isStream: false });
      const redirected = await runScenario({ billingModelSource: "redirected", isStream: false });

      expect(original.sessionCostUsd).toBe("5");
      expect(redirected.sessionCostUsd).toBe("50");
      expect(original.sessionCostUsd).not.toBe(redirected.sessionCostUsd);
    });

    // gpt-5.4 price entry with rates nested under `pricing.openai` and no priority rates.
    const nestedOpenAiPrice: ModelPriceData = {
      mode: "responses",
      model_family: "gpt",
      litellm_provider: "chatgpt",
      pricing: {
        openai: {
          input_cost_per_token: 2.5,
          output_cost_per_token: 15,
        },
      },
    };

    // gpt-5.4 price entry carrying both regular and `_priority` rates.
    const priorityAwarePrice: ModelPriceData = {
      mode: "responses",
      model_family: "gpt",
      litellm_provider: "chatgpt",
      pricing: {
        openai: {
          input_cost_per_token: 1,
          output_cost_per_token: 10,
          input_cost_per_token_priority: 2,
          output_cost_per_token_priority: 20,
        },
      },
    };

    /**
     * Dispatches one non-streaming gpt-5.4 response (2 input / 3 output tokens) through a
     * "ChatGPT" codex provider with billingModelSource = "redirected", and returns the costs
     * recorded by the DB and session mocks.
     *
     * Every collaborator is stubbed here, including RateLimitService.trackCost and
     * SessionManager.updateSessionUsage, so a test behaves the same whether it runs alone or
     * after other tests.
     *
     * @param priceData price entry returned for "gpt-5.4" (all other models have no price)
     * @param sessionId session id for the fixture session
     * @param messageId message id for the fixture session
     * @param requestMessage optional request body, e.g. a requested `service_tier`
     * @param responseExtras optional extra top-level fields on the upstream response
     * @returns costs passed to updateMessageRequestCost (stringified) and string `costUsd`
     *          values passed to SessionManager.updateSessionUsage, in call order
     */
    async function billGpt54({
      priceData,
      sessionId,
      messageId,
      requestMessage,
      responseExtras,
    }: {
      priceData: ModelPriceData;
      sessionId: string;
      messageId: number;
      requestMessage?: Record<string, unknown>;
      responseExtras?: Record<string, unknown>;
    }): Promise<{ dbCosts: string[]; sessionCosts: string[] }> {
      vi.mocked(getSystemSettings).mockResolvedValue(makeSystemSettings("redirected"));
      vi.mocked(updateMessageRequestDetails).mockResolvedValue(undefined);
      vi.mocked(updateMessageRequestDuration).mockResolvedValue(undefined);
      vi.mocked(SessionManager.storeSessionResponse).mockResolvedValue(undefined);
      vi.mocked(RateLimitService.trackUserDailyCost).mockResolvedValue(undefined);
      vi.mocked(RateLimitService.trackCost).mockResolvedValue(undefined);
      vi.mocked(SessionTracker.refreshSession).mockResolvedValue(undefined);

      vi.mocked(findLatestPriceByModel).mockImplementation(async (modelName: string) =>
        modelName === "gpt-5.4" ? makePriceRecord(modelName, priceData) : null
      );

      const dbCosts: string[] = [];
      vi.mocked(updateMessageRequestCost).mockImplementation(
        async (_id: number, costUsd: unknown) => {
          dbCosts.push(String(costUsd));
        }
      );

      const sessionCosts: string[] = [];
      vi.mocked(SessionManager.updateSessionUsage).mockImplementation(
        async (_sessionId: string, payload: Record<string, unknown>) => {
          if (typeof payload.costUsd === "string") {
            sessionCosts.push(payload.costUsd);
          }
        }
      );

      const session = createSession({
        originalModel: "gpt-5.4",
        redirectedModel: "gpt-5.4",
        sessionId,
        messageId,
        providerOverrides: {
          name: "ChatGPT",
          url: "https://chatgpt.com/backend-api/codex",
          providerType: "codex",
        },
        requestMessage,
      });

      const response = createNonStreamResponse({ input_tokens: 2, output_tokens: 3 }, responseExtras);
      await ProxyResponseHandler.dispatch(session, response);
      await drainAsyncTasks();

      return { dbCosts, sessionCosts };
    }

    it("nested pricing: gpt-5.4 alias model should bill from pricing.openai when provider is chatgpt", async () => {
      const { dbCosts, sessionCosts } = await billGpt54({
        priceData: nestedOpenAiPrice,
        sessionId: "sess-gpt54-chatgpt",
        messageId: 3100,
      });

      // 2 * 2.5 + 3 * 15
      expect(dbCosts[0]).toBe("50");
      expect(sessionCosts[0]).toBe("50");
    });

    it("codex fast: uses priority pricing when response reports service_tier=priority", async () => {
      const { dbCosts, sessionCosts } = await billGpt54({
        priceData: priorityAwarePrice,
        sessionId: "sess-gpt54-priority-actual",
        messageId: 3200,
        requestMessage: { service_tier: "default" },
        responseExtras: { service_tier: "priority" },
      });

      // Priority rates: 2 * 2 + 3 * 20
      expect(dbCosts[0]).toBe("64");
      expect(sessionCosts[0]).toBe("64");
    });

    it("codex fast: falls back to requested priority pricing when response omits service_tier", async () => {
      const { dbCosts } = await billGpt54({
        priceData: priorityAwarePrice,
        sessionId: "sess-gpt54-priority-requested",
        messageId: 3201,
        requestMessage: { service_tier: "priority" },
      });

      // Priority rates: 2 * 2 + 3 * 20
      expect(dbCosts[0]).toBe("64");
    });

    it("codex fast: does not use priority pricing when response explicitly reports non-priority tier", async () => {
      const { dbCosts } = await billGpt54({
        priceData: priorityAwarePrice,
        sessionId: "sess-gpt54-priority-downgraded",
        messageId: 3202,
        requestMessage: { service_tier: "priority" },
        responseExtras: { service_tier: "default" },
      });

      // Regular rates: 2 * 1 + 3 * 10
      expect(dbCosts[0]).toBe("32");
    });
  });
  // When no price is available (lookup returns null or throws) the request must still be
  // served, with no cost written to the DB and no cost reported to the rate limiter.
  describe("价格表缺失/查询失败:不计费放行", () => {
    /**
     * Dispatches one response while the price lookup yields nothing, and counts cost writes.
     *
     * @param options.billingModelSource value placed in the mocked system settings
     * @param options.isStream whether the upstream response is SSE (true) or plain JSON (false)
     * @param options.priceLookup "none": the lookup resolves to null; "throws": the lookup rejects
     * @returns how many times updateMessageRequestCost and RateLimitService.trackCost were
     *          called during this scenario only
     */
    async function runNoPriceScenario(options: {
      billingModelSource: SystemSettings["billingModelSource"];
      isStream: boolean;
      priceLookup: "none" | "throws";
    }): Promise<{ dbCostCalls: number; rateLimitCalls: number }> {
      const usage = { input_tokens: 2, output_tokens: 3 };
      const originalModel = "original-model";
      const redirectedModel = "redirected-model";

      const costWriter = vi.mocked(updateMessageRequestCost);
      const costTracker = vi.mocked(RateLimitService.trackCost);

      // These mocks are module-level and shared with every other test in the file. Clear their
      // call history first so the counts returned below cover this scenario alone.
      costWriter.mockClear();
      costTracker.mockClear();

      vi.mocked(getSystemSettings).mockResolvedValue(makeSystemSettings(options.billingModelSource));
      if (options.priceLookup === "none") {
        vi.mocked(findLatestPriceByModel).mockResolvedValue(null);
      } else {
        vi.mocked(findLatestPriceByModel).mockImplementation(async () => {
          throw new Error("db query failed");
        });
      }

      vi.mocked(updateMessageRequestDetails).mockResolvedValue(undefined);
      vi.mocked(updateMessageRequestDuration).mockResolvedValue(undefined);
      vi.mocked(SessionManager.storeSessionResponse).mockResolvedValue(undefined);
      vi.mocked(RateLimitService.trackUserDailyCost).mockResolvedValue(undefined);
      vi.mocked(SessionTracker.refreshSession).mockResolvedValue(undefined);
      costWriter.mockResolvedValue(undefined);
      costTracker.mockResolvedValue(undefined);
      vi.mocked(SessionManager.updateSessionUsage).mockResolvedValue(undefined);

      const session = createSession({
        originalModel,
        redirectedModel,
        sessionId: `sess-no-price-${options.billingModelSource}-${options.isStream ? "s" : "n"}`,
        messageId: options.isStream ? 3001 : 3000,
      });

      const response = options.isStream
        ? createStreamResponse(usage)
        : createNonStreamResponse(usage);
      const clientResponse = await ProxyResponseHandler.dispatch(session, response);
      // Reading the body must succeed even though pricing failed; a rejection fails the test.
      await clientResponse.text();
      await drainAsyncTasks();

      return {
        dbCostCalls: costWriter.mock.calls.length,
        rateLimitCalls: costTracker.mock.calls.length,
      };
    }

    it("无价格:不写入 DB cost,不追踪限流 cost,并触发一次异步同步", async () => {
      const result = await runNoPriceScenario({
        billingModelSource: "redirected",
        isStream: false,
        priceLookup: "none",
      });

      expect(result.dbCostCalls).toBe(0);
      expect(result.rateLimitCalls).toBe(0);
      // Exactly one cloud price sync request, tagged with the missing-model reason.
      expect(cloudPriceSyncRequests).toEqual([{ reason: "missing-model" }]);
    });

    it("价格查询抛错:不应影响响应,不写入 DB cost,不追踪限流 cost", async () => {
      const result = await runNoPriceScenario({
        billingModelSource: "original",
        isStream: true,
        priceLookup: "throws",
      });

      expect(result.dbCostCalls).toBe(0);
      expect(result.rateLimitCalls).toBe(0);
    });
  });