billing-model-source.test.ts 24 KB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270
3704705706707708709710711712713714715716717718719720721722723724725726727728729730731732733734735736737738739740741742743744745746747748749750751752753754755756757758759760761762763
  1. import { beforeEach, describe, expect, it, vi } from "vitest";
  2. import type { ModelPrice, ModelPriceData } from "@/types/model-price";
  3. import type { SystemSettings } from "@/types/system-config";
  // Background task promises captured from the mocked AsyncTaskManager.register().
  const asyncTasks: Promise<void>[] = [];
  // Payloads received by the mocked requestCloudPriceTableSync(), in call order.
  const cloudPriceSyncRequests: Array<{ reason: string }> = [];

  // Task manager stub: records each registered promise instead of managing it.
  vi.mock("@/lib/async-task-manager", () => {
    const AsyncTaskManager = {
      register(_taskId: string, promise: Promise<void>) {
        asyncTasks.push(promise);
        return new AbortController();
      },
      cleanup() {},
      cancel() {},
    };
    return { AsyncTaskManager };
  });

  // Logger stub: every level is a no-op.
  vi.mock("@/lib/logger", () => {
    const noop = (): void => {};
    return {
      logger: {
        debug: noop,
        info: noop,
        warn: noop,
        error: noop,
        trace: noop,
      },
    };
  });

  // Cloud price sync stub: records the payload of each sync request.
  vi.mock("@/lib/price-sync/cloud-price-updater", () => {
    return {
      requestCloudPriceTableSync(payload: { reason: string }) {
        cloudPriceSyncRequests.push(payload);
      },
    };
  });

  // Repository stubs: bare vi.fn() mocks whose behaviour is configured per test.
  vi.mock("@/repository/model-price", () => {
    return { findLatestPriceByModel: vi.fn() };
  });

  vi.mock("@/repository/system-config", () => {
    return { getSystemSettings: vi.fn() };
  });

  vi.mock("@/repository/message", () => {
    return {
      updateMessageRequestCost: vi.fn(),
      updateMessageRequestDetails: vi.fn(),
      updateMessageRequestDuration: vi.fn(),
    };
  });

  // Service stubs: bare vi.fn() mocks whose behaviour is configured per test.
  vi.mock("@/lib/session-manager", () => {
    const SessionManager = {
      updateSessionUsage: vi.fn(),
      storeSessionResponse: vi.fn(),
      extractCodexPromptCacheKey: vi.fn(),
      updateSessionWithCodexCacheKey: vi.fn(),
    };
    return { SessionManager };
  });

  vi.mock("@/lib/rate-limit", () => {
    const RateLimitService = {
      trackCost: vi.fn(),
      trackUserDailyCost: vi.fn(),
    };
    return { RateLimitService };
  });

  vi.mock("@/lib/session-tracker", () => {
    const SessionTracker = {
      refreshSession: vi.fn(),
    };
    return { SessionTracker };
  });

  // Status tracker stub: getInstance() yields an object whose endRequest() does nothing.
  vi.mock("@/lib/proxy-status-tracker", () => {
    const ProxyStatusTracker = {
      getInstance() {
        return {
          endRequest() {},
        };
      },
    };
    return { ProxyStatusTracker };
  });
  67. import { ProxyResponseHandler } from "@/app/v1/_lib/proxy/response-handler";
  68. import { ProxySession } from "@/app/v1/_lib/proxy/session";
  69. import { SessionManager } from "@/lib/session-manager";
  70. import { RateLimitService } from "@/lib/rate-limit";
  71. import { SessionTracker } from "@/lib/session-tracker";
  72. import {
  73. updateMessageRequestCost,
  74. updateMessageRequestDetails,
  75. updateMessageRequestDuration,
  76. } from "@/repository/message";
  77. import { findLatestPriceByModel } from "@/repository/model-price";
  78. import { getSystemSettings } from "@/repository/system-config";
  // Reset every piece of shared state so that no test observes leftovers from
  // a previous one.
  beforeEach(() => {
    // Drop recorded calls/results on all mocks. Several tests assert on
    // `mock.calls.length`, which would otherwise include calls made by earlier
    // tests. Mock implementations are left in place; each test installs its own.
    vi.clearAllMocks();
    // Forget background tasks a previous (possibly failed) test never drained.
    asyncTasks.length = 0;
    cloudPriceSyncRequests.length = 0;
  });
  /**
   * Builds a SystemSettings fixture in which only the billing model source varies.
   *
   * @param billingModelSource value stored in the fixture's `billingModelSource` field
   * @returns a settings object whose `createdAt` and `updatedAt` are the same Date instance
   */
  function makeSystemSettings(
    billingModelSource: SystemSettings["billingModelSource"]
  ): SystemSettings {
    const timestamp = new Date();
    const responseFixerConfig: SystemSettings["responseFixerConfig"] = {
      fixTruncatedJson: true,
      fixSseFormat: true,
      fixEncoding: true,
      maxJsonDepth: 200,
      maxFixSize: 1024 * 1024,
    };
    const settings: SystemSettings = {
      id: 1,
      siteTitle: "test",
      allowGlobalUsageView: false,
      currencyDisplay: "USD",
      billingModelSource,
      timezone: null,
      enableAutoCleanup: false,
      cleanupRetentionDays: 30,
      cleanupSchedule: "0 2 * * *",
      cleanupBatchSize: 10000,
      enableClientVersionCheck: false,
      verboseProviderError: false,
      enableHttp2: false,
      interceptAnthropicWarmupRequests: false,
      enableResponseFixer: true,
      responseFixerConfig,
      createdAt: timestamp,
      updatedAt: timestamp,
    };
    return settings;
  }
  /**
   * Wraps price data in a ModelPrice record with id 1.
   *
   * @param modelName model name stored on the record
   * @param priceData price data stored on the record as-is (not copied)
   * @returns a record whose `createdAt` and `updatedAt` are the same Date instance
   */
  function makePriceRecord(modelName: string, priceData: ModelPriceData): ModelPrice {
    const timestamp = new Date();
    const record: ModelPrice = {
      id: 1,
      modelName,
      priceData,
      createdAt: timestamp,
      updatedAt: timestamp,
    };
    return record;
  }
  /**
   * Creates a ProxySession for a POST to http://localhost/v1/messages and attaches
   * a provider, an auth state and a message context to it.
   *
   * @param originalModel model passed to `session.setOriginalModel`
   * @param redirectedModel model placed in the request's `model` field
   * @param sessionId id passed to `session.setSessionId`
   * @param messageId id of the message context
   * @param providerOverrides fields spread over the default provider fixture
   * @param requestMessage request body; an empty object when omitted
   * @returns the configured session
   */
  function createSession({
    originalModel,
    redirectedModel,
    sessionId,
    messageId,
    providerOverrides,
    requestMessage,
  }: {
    originalModel: string;
    redirectedModel: string;
    sessionId: string;
    messageId: number;
    providerOverrides?: Record<string, unknown>;
    requestMessage?: Record<string, unknown>;
  }): ProxySession {
    type SessionInit = {
      startTime: number;
      method: string;
      requestUrl: URL;
      headers: Headers;
      headerLog: string;
      request: { message: Record<string, unknown>; log: string; model: string | null };
      userAgent: string | null;
      context: unknown;
      clientAbortSignal: AbortSignal | null;
    };
    // The constructor is reached through a cast to an explicit signature.
    const SessionCtor = ProxySession as unknown as new (init: SessionInit) => ProxySession;

    // Partial fixtures; `as any` because the real entity types are not spelled out here.
    const testProvider = {
      id: 99,
      name: "test-provider",
      url: "https://api.anthropic.com",
      providerType: "claude",
      costMultiplier: 1.0,
      streamingIdleTimeoutMs: 0,
      ...providerOverrides,
    } as any;
    const testUser = {
      id: 123,
      name: "test-user",
      dailyResetTime: "00:00",
      dailyResetMode: "fixed",
    } as any;
    const testKey = {
      id: 456,
      name: "test-key",
      dailyResetTime: "00:00",
      dailyResetMode: "fixed",
    } as any;

    const proxySession = new SessionCtor({
      startTime: Date.now(),
      method: "POST",
      requestUrl: new URL("http://localhost/v1/messages"),
      headers: new Headers(),
      headerLog: "",
      request: { message: requestMessage ?? {}, log: "(test)", model: redirectedModel },
      userAgent: null,
      context: {},
      clientAbortSignal: null,
    });

    proxySession.setOriginalModel(originalModel);
    proxySession.setSessionId(sessionId);
    proxySession.setProvider(testProvider);
    proxySession.setAuthState({
      user: testUser,
      key: testKey,
      apiKey: "sk-test",
      success: true,
    });
    proxySession.setMessageContext({
      id: messageId,
      createdAt: new Date(),
      user: testUser,
      key: testKey,
      apiKey: "sk-test",
    });

    return proxySession;
  }
  /**
   * Builds a 200 JSON response whose body is `{ type: "message", usage, ...extras }`.
   *
   * @param usage token counts placed under the `usage` key
   * @param extras optional top-level fields merged in after `type` and `usage`
   * @returns a Response with content-type `application/json`
   */
  function createNonStreamResponse(
    usage: { input_tokens: number; output_tokens: number },
    extras?: Record<string, unknown>
  ): Response {
    // Spreading `undefined` adds no keys, so omitted extras leave the body untouched.
    const payload = { type: "message", usage, ...extras };
    const body = JSON.stringify(payload);
    return new Response(body, {
      status: 200,
      headers: { "content-type": "application/json" },
    });
  }
  /**
   * Builds a 200 `text/event-stream` response whose stream delivers a single
   * `message_delta` event carrying the usage, then closes.
   *
   * @param usage token counts serialized as `{ usage }` in the event's data line
   * @returns a Response backed by a one-chunk ReadableStream
   */
  function createStreamResponse(usage: { input_tokens: number; output_tokens: number }): Response {
    const eventData = JSON.stringify({ usage });
    const chunk = new TextEncoder().encode(`event: message_delta\ndata: ${eventData}\n\n`);
    const body = new ReadableStream<Uint8Array>({
      start: (controller) => {
        controller.enqueue(chunk);
        controller.close();
      },
    });
    return new Response(body, {
      status: 200,
      headers: { "content-type": "text/event-stream" },
    });
  }
  /**
   * Empties the shared `asyncTasks` list and waits for every task that was in it.
   * Rejects if any of those tasks rejects.
   */
  async function drainAsyncTasks(): Promise<void> {
    // splice(0) removes and returns all entries, leaving the shared array empty.
    const pending = asyncTasks.splice(0);
    await Promise.all(pending);
  }
  /**
   * Dispatches one response (usage: 2 input / 3 output tokens) through
   * ProxyResponseHandler for a session whose original model is priced at 1 per
   * token and whose redirected model is priced at 10 per token. Reports the first
   * cost seen by each of the three mocked sinks.
   *
   * @param billingModelSource value placed in the mocked system settings
   * @param isStream whether the upstream response is SSE (true) or JSON (false)
   * @returns the first cost passed to updateMessageRequestCost (stringified; "" if
   *   never called), the first string `costUsd` passed to
   *   SessionManager.updateSessionUsage ("" if none) and the first cost passed to
   *   RateLimitService.trackCost (NaN if never called)
   */
  async function runScenario({
    billingModelSource,
    isStream,
  }: {
    billingModelSource: SystemSettings["billingModelSource"];
    isStream: boolean;
  }): Promise<{ dbCostUsd: string; sessionCostUsd: string; rateLimitCost: number }> {
    const tokenUsage = { input_tokens: 2, output_tokens: 3 };
    const originalModel = "original-model";
    const redirectedModel = "redirected-model";

    // Price table keyed by model name; any other model has no price.
    const priceTable = new Map<string, ModelPriceData>([
      [originalModel, { input_cost_per_token: 1, output_cost_per_token: 1 }],
      [redirectedModel, { input_cost_per_token: 10, output_cost_per_token: 10 }],
    ]);

    vi.mocked(getSystemSettings).mockResolvedValue(makeSystemSettings(billingModelSource));
    vi.mocked(findLatestPriceByModel).mockImplementation(async (modelName: string) => {
      const priceData = priceTable.get(modelName);
      return priceData ? makePriceRecord(modelName, priceData) : null;
    });

    vi.mocked(updateMessageRequestDetails).mockResolvedValue(undefined);
    vi.mocked(updateMessageRequestDuration).mockResolvedValue(undefined);
    vi.mocked(SessionManager.storeSessionResponse).mockResolvedValue(undefined);
    vi.mocked(RateLimitService.trackUserDailyCost).mockResolvedValue(undefined);
    vi.mocked(SessionTracker.refreshSession).mockResolvedValue(undefined);

    // Collect what each cost sink receives.
    const recordedDbCosts: string[] = [];
    const recordedSessionCosts: string[] = [];
    const recordedRateLimitCosts: number[] = [];

    vi.mocked(updateMessageRequestCost).mockImplementation(async (_id: number, costUsd: unknown) => {
      recordedDbCosts.push(String(costUsd));
    });
    vi.mocked(SessionManager.updateSessionUsage).mockImplementation(
      async (_sessionId: string, payload: Record<string, unknown>) => {
        const { costUsd } = payload;
        // Only string costs are recorded.
        if (typeof costUsd === "string") {
          recordedSessionCosts.push(costUsd);
        }
      }
    );
    vi.mocked(RateLimitService.trackCost).mockImplementation(
      async (_keyId: number, _providerId: number, _sessionId: string, costUsd: number) => {
        recordedRateLimitCosts.push(costUsd);
      }
    );

    const streamTag = isStream ? "s" : "n";
    const session = createSession({
      originalModel,
      redirectedModel,
      sessionId: `sess-${billingModelSource}-${streamTag}`,
      messageId: isStream ? 2001 : 2000,
    });

    const upstream = isStream
      ? createStreamResponse(tokenUsage)
      : createNonStreamResponse(tokenUsage);
    const clientResponse = await ProxyResponseHandler.dispatch(session, upstream);

    // The client-facing body is read to the end only for streaming responses.
    if (isStream) {
      await clientResponse.text();
    }
    await drainAsyncTasks();

    return {
      dbCostUsd: recordedDbCosts[0] ?? "",
      sessionCostUsd: recordedSessionCosts[0] ?? "",
      rateLimitCost: recordedRateLimitCosts[0] ?? Number.NaN,
    };
  }
  describe("Billing model source - Redis session cost vs DB cost", () => {
    // Model name used by every nested-pricing / codex scenario in this suite.
    const codexModel = "gpt-5.4";

    // Price data with both standard and priority per-token rates under pricing.openai.
    const priorityPriceData: ModelPriceData = {
      mode: "responses",
      model_family: "gpt",
      litellm_provider: "chatgpt",
      pricing: {
        openai: {
          input_cost_per_token: 1,
          output_cost_per_token: 10,
          input_cost_per_token_priority: 2,
          output_cost_per_token_priority: 20,
        },
      },
    };

    /**
     * Dispatches one non-streaming response for a "gpt-5.4" session on a codex
     * provider named "ChatGPT", with billingModelSource set to "redirected".
     *
     * Every collaborator mock the suite relies on is wired here on each call, so
     * a scenario never depends on an implementation left behind by an earlier test.
     *
     * @param scenario.sessionId session id given to the created session
     * @param scenario.messageId message context id
     * @param scenario.priceData price data returned for "gpt-5.4" (other models get null)
     * @param scenario.usage token usage reported in the response body
     * @param scenario.requestMessage optional request body (e.g. a requested service_tier)
     * @param scenario.responseExtras optional extra top-level fields of the response body
     * @returns every cost passed to updateMessageRequestCost (stringified) and every
     *   string `costUsd` passed to SessionManager.updateSessionUsage, in call order
     */
    async function runCodexScenario(scenario: {
      sessionId: string;
      messageId: number;
      priceData: ModelPriceData;
      usage: { input_tokens: number; output_tokens: number };
      requestMessage?: Record<string, unknown>;
      responseExtras?: Record<string, unknown>;
    }): Promise<{ dbCosts: string[]; sessionCosts: string[] }> {
      const { sessionId, messageId, priceData, usage, requestMessage, responseExtras } = scenario;

      vi.mocked(getSystemSettings).mockResolvedValue(makeSystemSettings("redirected"));
      vi.mocked(updateMessageRequestDetails).mockResolvedValue(undefined);
      vi.mocked(updateMessageRequestDuration).mockResolvedValue(undefined);
      vi.mocked(SessionManager.storeSessionResponse).mockResolvedValue(undefined);
      vi.mocked(RateLimitService.trackUserDailyCost).mockResolvedValue(undefined);
      vi.mocked(SessionTracker.refreshSession).mockResolvedValue(undefined);

      vi.mocked(findLatestPriceByModel).mockImplementation(async (modelName: string) => {
        if (modelName === codexModel) {
          return makePriceRecord(modelName, priceData);
        }
        return null;
      });

      const dbCosts: string[] = [];
      vi.mocked(updateMessageRequestCost).mockImplementation(
        async (_id: number, costUsd: unknown) => {
          dbCosts.push(String(costUsd));
        }
      );

      const sessionCosts: string[] = [];
      vi.mocked(SessionManager.updateSessionUsage).mockImplementation(
        async (_sessionId: string, payload: Record<string, unknown>) => {
          if (typeof payload.costUsd === "string") {
            sessionCosts.push(payload.costUsd);
          }
        }
      );

      const session = createSession({
        originalModel: codexModel,
        redirectedModel: codexModel,
        sessionId,
        messageId,
        providerOverrides: {
          name: "ChatGPT",
          url: "https://chatgpt.com/backend-api/codex",
          providerType: "codex",
        },
        requestMessage,
      });

      const response = createNonStreamResponse(usage, responseExtras);
      await ProxyResponseHandler.dispatch(session, response);
      await drainAsyncTasks();

      return { dbCosts, sessionCosts };
    }

    // Prices: original model = 1 per token, redirected model = 10 per token;
    // usage is 2 input + 3 output tokens, hence 5 vs 50.
    it("非流式响应:配置 = original 时 Session 成本与数据库一致", async () => {
      const result = await runScenario({ billingModelSource: "original", isStream: false });

      expect(result.dbCostUsd).toBe("5");
      expect(result.sessionCostUsd).toBe("5");
      expect(result.rateLimitCost).toBe(5);
    });

    it("非流式响应:配置 = redirected 时 Session 成本与数据库一致", async () => {
      const result = await runScenario({ billingModelSource: "redirected", isStream: false });

      expect(result.dbCostUsd).toBe("50");
      expect(result.sessionCostUsd).toBe("50");
      expect(result.rateLimitCost).toBe(50);
    });

    it("流式响应:配置 = original 时 Session 成本与数据库一致", async () => {
      const result = await runScenario({ billingModelSource: "original", isStream: true });

      expect(result.dbCostUsd).toBe("5");
      expect(result.sessionCostUsd).toBe("5");
      expect(result.rateLimitCost).toBe(5);
    });

    it("流式响应:配置 = redirected 时 Session 成本与数据库一致", async () => {
      const result = await runScenario({ billingModelSource: "redirected", isStream: true });

      expect(result.dbCostUsd).toBe("50");
      expect(result.sessionCostUsd).toBe("50");
      expect(result.rateLimitCost).toBe(50);
    });

    it("从 original 切换到 redirected 后应生效", async () => {
      const original = await runScenario({ billingModelSource: "original", isStream: false });
      const redirected = await runScenario({ billingModelSource: "redirected", isStream: false });

      expect(original.sessionCostUsd).toBe("5");
      expect(redirected.sessionCostUsd).toBe("50");
      expect(original.sessionCostUsd).not.toBe(redirected.sessionCostUsd);
    });

    it("nested pricing: gpt-5.4 alias model should bill from pricing.openai when provider is chatgpt", async () => {
      const { dbCosts, sessionCosts } = await runCodexScenario({
        sessionId: "sess-gpt54-chatgpt",
        messageId: 3100,
        priceData: {
          mode: "responses",
          model_family: "gpt",
          litellm_provider: "chatgpt",
          pricing: {
            openai: {
              input_cost_per_token: 2.5,
              output_cost_per_token: 15,
            },
          },
        },
        usage: { input_tokens: 2, output_tokens: 3 },
      });

      // 2 * 2.5 + 3 * 15 = 50
      expect(dbCosts[0]).toBe("50");
      expect(sessionCosts[0]).toBe("50");
    });

    it("codex fast: uses priority pricing when response reports service_tier=priority", async () => {
      const { dbCosts, sessionCosts } = await runCodexScenario({
        sessionId: "sess-gpt54-priority-actual",
        messageId: 3200,
        priceData: priorityPriceData,
        usage: { input_tokens: 2, output_tokens: 3 },
        requestMessage: { service_tier: "default" },
        responseExtras: { service_tier: "priority" },
      });

      // 2 * 2 + 3 * 20 = 64
      expect(dbCosts[0]).toBe("64");
      expect(sessionCosts[0]).toBe("64");
    });

    it("codex fast: falls back to requested priority pricing when response omits service_tier", async () => {
      const { dbCosts } = await runCodexScenario({
        sessionId: "sess-gpt54-priority-requested",
        messageId: 3201,
        priceData: priorityPriceData,
        usage: { input_tokens: 2, output_tokens: 3 },
        requestMessage: { service_tier: "priority" },
      });

      // 2 * 2 + 3 * 20 = 64
      expect(dbCosts[0]).toBe("64");
    });

    it("codex fast: uses long-context priority pricing when request is priority and response omits service_tier", async () => {
      const { dbCosts, sessionCosts } = await runCodexScenario({
        sessionId: "sess-gpt54-priority-requested-long-context",
        messageId: 3203,
        priceData: {
          mode: "responses",
          model_family: "gpt",
          litellm_provider: "chatgpt",
          pricing: {
            openai: {
              input_cost_per_token: 1,
              output_cost_per_token: 10,
              input_cost_per_token_priority: 2,
              output_cost_per_token_priority: 20,
              input_cost_per_token_above_272k_tokens: 5,
              output_cost_per_token_above_272k_tokens: 50,
              input_cost_per_token_above_272k_tokens_priority: 7,
              output_cost_per_token_above_272k_tokens_priority: 70,
            },
          },
        },
        usage: { input_tokens: 272001, output_tokens: 2 },
        requestMessage: { service_tier: "priority" },
      });

      // 272001 * 7 + 2 * 70 = 1904147
      expect(dbCosts[0]).toBe("1904147");
      expect(sessionCosts[0]).toBe("1904147");
    });

    it("codex fast: does not use priority pricing when response explicitly reports non-priority tier", async () => {
      const { dbCosts } = await runCodexScenario({
        sessionId: "sess-gpt54-priority-downgraded",
        messageId: 3202,
        priceData: priorityPriceData,
        usage: { input_tokens: 2, output_tokens: 3 },
        requestMessage: { service_tier: "priority" },
        responseExtras: { service_tier: "default" },
      });

      // 2 * 1 + 3 * 10 = 32
      expect(dbCosts[0]).toBe("32");
    });
  });
  describe("价格表缺失/查询失败:不计费放行", () => {
    /**
     * Dispatches one response for a session whose models have no usable price and
     * reports how often the cost sinks were invoked during this scenario.
     *
     * @param options.billingModelSource value placed in the mocked system settings
     * @param options.isStream whether the upstream response is SSE (true) or JSON (false)
     * @param options.priceLookup "none": the price lookup resolves to null;
     *   "throws": the price lookup rejects with Error("db query failed")
     * @returns the number of calls made to updateMessageRequestCost and to
     *   RateLimitService.trackCost since the scenario started
     */
    async function runNoPriceScenario(options: {
      billingModelSource: SystemSettings["billingModelSource"];
      isStream: boolean;
      priceLookup: "none" | "throws";
    }): Promise<{ dbCostCalls: number; rateLimitCalls: number }> {
      const usage = { input_tokens: 2, output_tokens: 3 };
      const originalModel = "original-model";
      const redirectedModel = "redirected-model";

      const costWriter = vi.mocked(updateMessageRequestCost);
      const costTracker = vi.mocked(RateLimitService.trackCost);

      // The result is derived from `mock.calls.length`. Discard call history left
      // by earlier tests so the counts cover this scenario only, regardless of
      // whether the runner is configured to clear mocks between tests.
      costWriter.mockClear();
      costTracker.mockClear();

      vi.mocked(getSystemSettings).mockResolvedValue(makeSystemSettings(options.billingModelSource));

      if (options.priceLookup === "none") {
        vi.mocked(findLatestPriceByModel).mockResolvedValue(null);
      } else {
        vi.mocked(findLatestPriceByModel).mockImplementation(async () => {
          throw new Error("db query failed");
        });
      }

      vi.mocked(updateMessageRequestDetails).mockResolvedValue(undefined);
      vi.mocked(updateMessageRequestDuration).mockResolvedValue(undefined);
      vi.mocked(SessionManager.storeSessionResponse).mockResolvedValue(undefined);
      vi.mocked(RateLimitService.trackUserDailyCost).mockResolvedValue(undefined);
      vi.mocked(SessionTracker.refreshSession).mockResolvedValue(undefined);

      costWriter.mockResolvedValue(undefined);
      costTracker.mockResolvedValue(undefined);
      vi.mocked(SessionManager.updateSessionUsage).mockResolvedValue(undefined);

      const session = createSession({
        originalModel,
        redirectedModel,
        sessionId: `sess-no-price-${options.billingModelSource}-${options.isStream ? "s" : "n"}`,
        messageId: options.isStream ? 3001 : 3000,
      });

      const response = options.isStream
        ? createStreamResponse(usage)
        : createNonStreamResponse(usage);
      const clientResponse = await ProxyResponseHandler.dispatch(session, response);
      // Read the client-facing body to the end, then wait for registered background tasks.
      await clientResponse.text();

      await drainAsyncTasks();

      return {
        dbCostCalls: costWriter.mock.calls.length,
        rateLimitCalls: costTracker.mock.calls.length,
      };
    }

    it("无价格:不写入 DB cost,不追踪限流 cost,并触发一次异步同步", async () => {
      const result = await runNoPriceScenario({
        billingModelSource: "redirected",
        isStream: false,
        priceLookup: "none",
      });

      expect(result.dbCostCalls).toBe(0);
      expect(result.rateLimitCalls).toBe(0);
      expect(cloudPriceSyncRequests).toEqual([{ reason: "missing-model" }]);
    });

    it("价格查询抛错:不应影响响应,不写入 DB cost,不追踪限流 cost", async () => {
      const result = await runNoPriceScenario({
        billingModelSource: "original",
        isStream: true,
        priceLookup: "throws",
      });

      expect(result.dbCostCalls).toBe(0);
      expect(result.rateLimitCalls).toBe(0);
    });
  });