// Vitest suite: ProxyForwarder - first-byte hedge scheduling.
- import { beforeEach, describe, expect, test, vi } from "vitest";
- import { resolveEndpointPolicy } from "@/app/v1/_lib/proxy/endpoint-policy";
/**
 * Mock functions shared by the `vi.mock` factories in this file.
 *
 * They are created inside `vi.hoisted` so that they are defined before the
 * hoisted `vi.mock` factories reference them. Each entry is a `vi.fn` whose
 * default implementation is listed here; individual tests override them with
 * `mockResolvedValueOnce` / `mockRejectedValueOnce` as needed.
 */
const mocks = vi.hoisted(() => ({
  // Provider selection: no default implementation, tests queue results per call.
  pickRandomProviderWithExclusion: vi.fn(),

  // Provider-level circuit breaker.
  recordSuccess: vi.fn(),
  recordFailure: vi.fn(async () => {}),
  getCircuitState: vi.fn(() => "closed"),
  getProviderHealthInfo: vi.fn(async () => ({
    health: { failureCount: 0 },
    config: { failureThreshold: 3 },
  })),

  // Session manager bindings.
  updateSessionBindingSmart: vi.fn(async () => ({ updated: true, reason: "test" })),
  updateSessionProvider: vi.fn(async () => {}),
  clearSessionProvider: vi.fn(async () => {}),

  // Config lookups.
  isHttp2Enabled: vi.fn(async () => false),

  // Endpoint selection and endpoint-level circuit breaker.
  getPreferredProviderEndpoints: vi.fn(async () => []),
  getEndpointFilterStats: vi.fn(async () => null),
  recordEndpointSuccess: vi.fn(async () => {}),
  recordEndpointFailure: vi.fn(async () => {}),

  // Vendor-type circuit breaker.
  isVendorTypeCircuitOpen: vi.fn(async () => false),
  recordVendorTypeAllEndpointsTimeout: vi.fn(async () => {}),

  // Error categorisation: resolves to 0 unless a test queues another category.
  categorizeErrorAsync: vi.fn(async () => 0),

  // System settings: both thinking rectifiers are switched on by default.
  getCachedSystemSettings: vi.fn(async () => ({
    enableThinkingSignatureRectifier: true,
    enableThinkingBudgetRectifier: true,
  })),
  storeSessionSpecialSettings: vi.fn(async () => {}),
}));
// Replace the logger with spies for every log level used by the code under test.
vi.mock("@/lib/logger", () => ({
  logger: {
    debug: vi.fn(),
    info: vi.fn(),
    warn: vi.fn(),
    trace: vi.fn(),
    error: vi.fn(),
    fatal: vi.fn(),
  },
}));

// Partial mock: keep the real config module and override only the two lookups below.
vi.mock("@/lib/config", async (importOriginal) => {
  const actual = await importOriginal<typeof import("@/lib/config")>();
  return {
    ...actual,
    getCachedSystemSettings: mocks.getCachedSystemSettings,
    isHttp2Enabled: mocks.isHttp2Enabled,
  };
});

// Endpoint selection is fully replaced by the shared mocks.
vi.mock("@/lib/provider-endpoints/endpoint-selector", () => ({
  getPreferredProviderEndpoints: mocks.getPreferredProviderEndpoints,
  getEndpointFilterStats: mocks.getEndpointFilterStats,
}));

// Endpoint-level circuit breaker.
vi.mock("@/lib/endpoint-circuit-breaker", () => ({
  recordEndpointSuccess: mocks.recordEndpointSuccess,
  recordEndpointFailure: mocks.recordEndpointFailure,
}));

// Provider-level circuit breaker.
vi.mock("@/lib/circuit-breaker", () => ({
  getCircuitState: mocks.getCircuitState,
  getProviderHealthInfo: mocks.getProviderHealthInfo,
  recordFailure: mocks.recordFailure,
  recordSuccess: mocks.recordSuccess,
}));

// Vendor-type circuit breaker.
vi.mock("@/lib/vendor-type-circuit-breaker", () => ({
  isVendorTypeCircuitOpen: mocks.isVendorTypeCircuitOpen,
  recordVendorTypeAllEndpointsTimeout: mocks.recordVendorTypeAllEndpointsTimeout,
}));

// Session manager: only the static methods listed here are provided.
vi.mock("@/lib/session-manager", () => ({
  SessionManager: {
    updateSessionBindingSmart: mocks.updateSessionBindingSmart,
    updateSessionProvider: mocks.updateSessionProvider,
    clearSessionProvider: mocks.clearSessionProvider,
    storeSessionSpecialSettings: mocks.storeSessionSpecialSettings,
  },
}));

// Provider resolver: tests decide which alternative provider is handed out.
vi.mock("@/app/v1/_lib/proxy/provider-selector", () => ({
  ProxyProviderResolver: {
    pickRandomProviderWithExclusion: mocks.pickRandomProviderWithExclusion,
  },
}));

// Partial mock: keep the real error classes/enums, override only the categoriser.
vi.mock("@/app/v1/_lib/proxy/errors", async (importOriginal) => {
  const actual = await importOriginal<typeof import("@/app/v1/_lib/proxy/errors")>();
  return {
    ...actual,
    categorizeErrorAsync: mocks.categorizeErrorAsync,
  };
});
- import {
- ErrorCategory as ProxyErrorCategory,
- ProxyError as UpstreamProxyError,
- } from "@/app/v1/_lib/proxy/errors";
- import { ProxyForwarder } from "@/app/v1/_lib/proxy/forwarder";
- import { ProxySession } from "@/app/v1/_lib/proxy/session";
- import type { Provider } from "@/types/provider";
/**
 * Extra per-attempt fields that the `doForward` stubs in this file attach to
 * the session object they receive.
 */
type AttemptRuntime = {
  /** Assigned a `vi.fn()` by the stubs. */
  clearResponseTimeout?: () => void;
  /** Controller whose signal drives the fake upstream response of the attempt. */
  responseController?: AbortController;
};
/**
 * Builds a complete `Provider` fixture.
 *
 * @param overrides Fields that replace the defaults below; they are spread
 *   last, so any key present in `overrides` wins.
 * @returns A provider with id 1, name "p1", type "claude", one retry attempt
 *   and a 100 ms streaming first-byte timeout unless overridden.
 */
function createProvider(overrides: Partial<Provider> = {}): Provider {
  return {
    // Identity and routing.
    id: 1,
    name: "p1",
    url: "https://provider.example.com",
    key: "k",
    providerVendorId: null,
    isEnabled: true,
    weight: 1,
    priority: 0,
    groupPriorities: null,
    costMultiplier: 1,
    groupTag: null,
    providerType: "claude",
    preserveClientIp: false,
    modelRedirects: null,
    allowedModels: null,
    mcpPassthroughType: "none",
    mcpPassthroughUrl: null,

    // Spending limits.
    limit5hUsd: null,
    limitDailyUsd: null,
    dailyResetMode: "fixed",
    dailyResetTime: "00:00",
    limitWeeklyUsd: null,
    limitMonthlyUsd: null,
    limitTotalUsd: null,
    totalCostResetAt: null,
    limitConcurrentSessions: 0,

    // Retry and circuit-breaker settings.
    maxRetryAttempts: 1,
    circuitBreakerFailureThreshold: 5,
    circuitBreakerOpenDuration: 1_800_000,
    circuitBreakerHalfOpenSuccessThreshold: 2,

    // Network and timeouts.
    proxyUrl: null,
    proxyFallbackToDirect: false,
    firstByteTimeoutStreamingMs: 100,
    streamingIdleTimeoutMs: 0,
    requestTimeoutNonStreamingMs: 0,

    // Presentation and per-vendor preferences.
    websiteUrl: null,
    faviconUrl: null,
    cacheTtlPreference: null,
    context1mPreference: null,
    codexReasoningEffortPreference: null,
    codexReasoningSummaryPreference: null,
    codexTextVerbosityPreference: null,
    codexParallelToolCallsPreference: null,
    codexServiceTierPreference: null,
    anthropicMaxTokensPreference: null,
    anthropicThinkingBudgetPreference: null,
    anthropicAdaptiveThinking: null,
    geminiGoogleSearchPreference: null,

    // Rate counters.
    tpm: 0,
    rpm: 0,
    rpd: 0,
    cc: 0,

    // Timestamps.
    createdAt: new Date(),
    updatedAt: new Date(),
    deletedAt: null,

    ...overrides,
  };
}
/**
 * Builds a `ProxySession` fixture without running its constructor.
 *
 * The object is created from `ProxySession.prototype` (so prototype methods
 * remain available) and its fields are then assigned directly.
 *
 * @param clientAbortSignal Signal stored as the session's `clientAbortSignal`;
 *   defaults to `null`.
 * @returns A session for a streaming POST to `/v1/messages` with session id
 *   "sess-hedge", no provider selected and an empty provider chain.
 */
function createSession(clientAbortSignal: AbortSignal | null = null): ProxySession {
  const headers = new Headers();
  const session = Object.create(ProxySession.prototype);

  Object.assign(session, {
    startTime: Date.now(),
    method: "POST",
    requestUrl: new URL("https://example.com/v1/messages"),
    headers,
    // Independent copy, so changes to `headers` do not alter the original set.
    originalHeaders: new Headers(headers),
    headerLog: JSON.stringify(Object.fromEntries(headers.entries())),
    request: {
      model: "claude-test",
      log: "(test)",
      message: {
        model: "claude-test",
        stream: true,
        messages: [{ role: "user", content: "hi" }],
      },
    },
    userAgent: null,
    context: null,
    clientAbortSignal,
    userName: "test-user",
    authState: { success: true, user: null, key: null, apiKey: null },
    provider: null,
    messageContext: null,
    sessionId: "sess-hedge",
    requestSequence: 1,
    originalFormat: "claude",
    providerType: null,
    originalModelName: null,
    originalUrlPathname: null,
    providerChain: [],
    cacheTtlResolved: null,
    context1mApplied: false,
    specialSettings: [],
    cachedPriceData: undefined,
    cachedBillingModelSource: undefined,
    endpointPolicy: resolveEndpointPolicy("/v1/messages"),
    // Own property, so it takes precedence over any prototype method of the same name.
    isHeaderModified: () => false,
  });

  return session as ProxySession;
}
/**
 * Builds a fake upstream SSE `Response` (status 200, `text/event-stream`).
 *
 * The body emits a single chunk `data: {"provider":"<label>"}\n\n` after
 * `firstChunkDelayMs` and then closes. If `params.controller` is aborted
 * before the chunk is due (or is already aborted), the body closes without
 * emitting anything.
 *
 * The stream is finished at most once: the timer and the abort listener are
 * released as soon as the stream completes, is aborted, or is cancelled by
 * the consumer, so a late `abort()` is a no-op instead of closing an
 * already-closed stream.
 *
 * @param params.label Provider label embedded in the chunk payload.
 * @param params.firstChunkDelayMs Delay before the chunk is emitted.
 * @param params.controller Controller whose signal aborts the pending chunk.
 * @returns The streaming response.
 */
function createStreamingResponse(params: {
  label: string;
  firstChunkDelayMs: number;
  controller: AbortController;
}): Response {
  const encoder = new TextEncoder();
  const { signal } = params.controller;

  let timeoutId: ReturnType<typeof setTimeout> | null = null;
  let abortListener: (() => void) | null = null;
  let finished = false;

  // Drops the pending timer and the abort listener; safe to call repeatedly.
  const release = (): void => {
    if (timeoutId !== null) {
      clearTimeout(timeoutId);
      timeoutId = null;
    }
    if (abortListener !== null) {
      signal.removeEventListener("abort", abortListener);
      abortListener = null;
    }
  };

  const stream = new ReadableStream<Uint8Array>({
    start(streamController) {
      // Closes the stream exactly once, optionally emitting the chunk first.
      const finish = (emitChunk: boolean): void => {
        if (finished) {
          return;
        }
        finished = true;
        release();
        if (emitChunk) {
          streamController.enqueue(encoder.encode(`data: {"provider":"${params.label}"}\n\n`));
        }
        streamController.close();
      };

      if (signal.aborted) {
        finish(false);
        return;
      }

      abortListener = () => finish(false);
      signal.addEventListener("abort", abortListener, { once: true });
      timeoutId = setTimeout(() => finish(!signal.aborted), params.firstChunkDelayMs);
    },
    cancel() {
      // The consumer gave up: the stream is already closed, only clean up.
      finished = true;
      release();
    },
  });

  return new Response(stream, {
    status: 200,
    headers: { "content-type": "text/event-stream" },
  });
}
/**
 * Returns a promise that never resolves and rejects with `params.error`
 * either after `delayMs` or as soon as `params.controller` is aborted,
 * whichever happens first. An already-aborted controller rejects immediately.
 *
 * Note that the rejection value is always `params.error`, also on abort.
 *
 * @param params.delayMs Delay before the timed rejection.
 * @param params.error Error used as the rejection value.
 * @param params.controller Controller whose abort triggers an early rejection.
 */
function createDelayedFailure(params: {
  delayMs: number;
  error: Error;
  controller: AbortController;
}): Promise<Response> {
  return new Promise<Response>((_resolve, reject) => {
    const { signal } = params.controller;
    let timeoutId: ReturnType<typeof setTimeout> | null = null;

    // Abort path: cancel the pending timer, then fail with the configured error.
    const rejectWithError = (): void => {
      if (timeoutId) {
        clearTimeout(timeoutId);
      }
      reject(params.error);
    };

    if (signal.aborted) {
      rejectWithError();
      return;
    }

    signal.addEventListener("abort", rejectWithError, { once: true });

    // Timer path: detach the abort listener before failing.
    timeoutId = setTimeout(() => {
      signal.removeEventListener("abort", rejectWithError);
      reject(params.error);
    }, params.delayMs);
  });
}
/**
 * Replaces the session's request message with a streaming request whose only
 * message is an assistant turn made of three content blocks: `thinking`,
 * `text` and `redacted_thinking`, each carrying a `signature` field.
 *
 * @param session Session whose `request.message` is overwritten in place.
 */
function withThinkingBlocks(session: ProxySession): void {
  session.request.message = {
    model: "claude-test",
    stream: true,
    messages: [
      {
        role: "assistant",
        content: [
          { type: "thinking", thinking: "t", signature: "sig_thinking" },
          { type: "text", text: "hello", signature: "sig_text_should_remove" },
          { type: "redacted_thinking", data: "r", signature: "sig_redacted" },
        ],
      },
    ],
  };
}
- describe("ProxyForwarder - first-byte hedge scheduling", () => {
- beforeEach(() => {
- vi.clearAllMocks();
- });
- test("first provider exceeds first-byte threshold, second provider starts and wins by first chunk", async () => {
- vi.useFakeTimers();
- try {
- const provider1 = createProvider({ id: 1, name: "p1", firstByteTimeoutStreamingMs: 100 });
- const provider2 = createProvider({ id: 2, name: "p2", firstByteTimeoutStreamingMs: 100 });
- const session = createSession();
- session.setProvider(provider1);
- mocks.pickRandomProviderWithExclusion.mockResolvedValueOnce(provider2);
- const doForward = vi.spyOn(
- ProxyForwarder as unknown as {
- doForward: (...args: unknown[]) => Promise<Response>;
- },
- "doForward"
- );
- const controller1 = new AbortController();
- const controller2 = new AbortController();
- doForward.mockImplementationOnce(async (attemptSession) => {
- const runtime = attemptSession as ProxySession & AttemptRuntime;
- runtime.responseController = controller1;
- runtime.clearResponseTimeout = vi.fn();
- return createStreamingResponse({
- label: "p1",
- firstChunkDelayMs: 220,
- controller: controller1,
- });
- });
- doForward.mockImplementationOnce(async (attemptSession) => {
- const runtime = attemptSession as ProxySession & AttemptRuntime;
- runtime.responseController = controller2;
- runtime.clearResponseTimeout = vi.fn();
- return createStreamingResponse({
- label: "p2",
- firstChunkDelayMs: 40,
- controller: controller2,
- });
- });
- const responsePromise = ProxyForwarder.send(session);
- await vi.advanceTimersByTimeAsync(100);
- expect(doForward).toHaveBeenCalledTimes(2);
- await vi.advanceTimersByTimeAsync(50);
- const response = await responsePromise;
- expect(await response.text()).toContain('"provider":"p2"');
- expect(controller1.signal.aborted).toBe(true);
- expect(controller2.signal.aborted).toBe(false);
- expect(mocks.recordFailure).not.toHaveBeenCalled();
- expect(mocks.recordSuccess).not.toHaveBeenCalled();
- expect(session.provider?.id).toBe(2);
- expect(mocks.updateSessionBindingSmart).toHaveBeenCalledWith("sess-hedge", 2, 0, false, true);
- } finally {
- vi.useRealTimers();
- }
- });
- test("characterization: hedge still launches alternative provider when maxRetryAttempts > 1", async () => {
- vi.useFakeTimers();
- try {
- const provider1 = createProvider({
- id: 1,
- name: "p1",
- maxRetryAttempts: 3,
- firstByteTimeoutStreamingMs: 100,
- });
- const provider2 = createProvider({
- id: 2,
- name: "p2",
- maxRetryAttempts: 3,
- firstByteTimeoutStreamingMs: 100,
- });
- const session = createSession();
- session.setProvider(provider1);
- mocks.pickRandomProviderWithExclusion.mockResolvedValueOnce(provider2);
- const doForward = vi.spyOn(
- ProxyForwarder as unknown as {
- doForward: (...args: unknown[]) => Promise<Response>;
- },
- "doForward"
- );
- const controller1 = new AbortController();
- const controller2 = new AbortController();
- doForward.mockImplementationOnce(async (attemptSession) => {
- const runtime = attemptSession as ProxySession & AttemptRuntime;
- runtime.responseController = controller1;
- runtime.clearResponseTimeout = vi.fn();
- return createStreamingResponse({
- label: "p1",
- firstChunkDelayMs: 220,
- controller: controller1,
- });
- });
- doForward.mockImplementationOnce(async (attemptSession) => {
- const runtime = attemptSession as ProxySession & AttemptRuntime;
- runtime.responseController = controller2;
- runtime.clearResponseTimeout = vi.fn();
- return createStreamingResponse({
- label: "p2",
- firstChunkDelayMs: 40,
- controller: controller2,
- });
- });
- const responsePromise = ProxyForwarder.send(session);
- await vi.advanceTimersByTimeAsync(100);
- expect(doForward).toHaveBeenCalledTimes(2);
- expect(mocks.pickRandomProviderWithExclusion).toHaveBeenCalledTimes(1);
- const chainBeforeWinner = session.getProviderChain();
- expect(chainBeforeWinner).toEqual(
- expect.arrayContaining([
- expect.objectContaining({ reason: "hedge_triggered", id: 1 }),
- expect.objectContaining({ reason: "hedge_launched", id: 2 }),
- ])
- );
- await vi.advanceTimersByTimeAsync(50);
- const response = await responsePromise;
- expect(await response.text()).toContain('"provider":"p2"');
- expect(controller1.signal.aborted).toBe(true);
- expect(session.provider?.id).toBe(2);
- } finally {
- vi.useRealTimers();
- }
- });
- test("first provider can still win after hedge started if it emits first chunk earlier than fallback", async () => {
- vi.useFakeTimers();
- try {
- const provider1 = createProvider({ id: 1, name: "p1", firstByteTimeoutStreamingMs: 100 });
- const provider2 = createProvider({ id: 2, name: "p2", firstByteTimeoutStreamingMs: 100 });
- const session = createSession();
- session.setProvider(provider1);
- mocks.pickRandomProviderWithExclusion.mockResolvedValueOnce(provider2);
- const doForward = vi.spyOn(
- ProxyForwarder as unknown as {
- doForward: (...args: unknown[]) => Promise<Response>;
- },
- "doForward"
- );
- const controller1 = new AbortController();
- const controller2 = new AbortController();
- doForward.mockImplementationOnce(async (attemptSession) => {
- const runtime = attemptSession as ProxySession & AttemptRuntime;
- runtime.responseController = controller1;
- runtime.clearResponseTimeout = vi.fn();
- return createStreamingResponse({
- label: "p1",
- firstChunkDelayMs: 140,
- controller: controller1,
- });
- });
- doForward.mockImplementationOnce(async (attemptSession) => {
- const runtime = attemptSession as ProxySession & AttemptRuntime;
- runtime.responseController = controller2;
- runtime.clearResponseTimeout = vi.fn();
- return createStreamingResponse({
- label: "p2",
- firstChunkDelayMs: 120,
- controller: controller2,
- });
- });
- const responsePromise = ProxyForwarder.send(session);
- await vi.advanceTimersByTimeAsync(100);
- expect(doForward).toHaveBeenCalledTimes(2);
- await vi.advanceTimersByTimeAsync(45);
- const response = await responsePromise;
- expect(await response.text()).toContain('"provider":"p1"');
- expect(controller1.signal.aborted).toBe(false);
- expect(controller2.signal.aborted).toBe(true);
- expect(mocks.recordFailure).not.toHaveBeenCalled();
- expect(mocks.recordSuccess).not.toHaveBeenCalled();
- expect(session.provider?.id).toBe(1);
- } finally {
- vi.useRealTimers();
- }
- });
- test("when multiple providers all exceed threshold, hedge scheduler keeps expanding until a later provider wins", async () => {
- vi.useFakeTimers();
- try {
- const provider1 = createProvider({ id: 1, name: "p1", firstByteTimeoutStreamingMs: 100 });
- const provider2 = createProvider({ id: 2, name: "p2", firstByteTimeoutStreamingMs: 100 });
- const provider3 = createProvider({ id: 3, name: "p3", firstByteTimeoutStreamingMs: 100 });
- const session = createSession();
- session.setProvider(provider1);
- mocks.pickRandomProviderWithExclusion
- .mockResolvedValueOnce(provider2)
- .mockResolvedValueOnce(provider3);
- const doForward = vi.spyOn(
- ProxyForwarder as unknown as {
- doForward: (...args: unknown[]) => Promise<Response>;
- },
- "doForward"
- );
- const controller1 = new AbortController();
- const controller2 = new AbortController();
- const controller3 = new AbortController();
- doForward.mockImplementationOnce(async (attemptSession) => {
- const runtime = attemptSession as ProxySession & AttemptRuntime;
- runtime.responseController = controller1;
- runtime.clearResponseTimeout = vi.fn();
- return createStreamingResponse({
- label: "p1",
- firstChunkDelayMs: 400,
- controller: controller1,
- });
- });
- doForward.mockImplementationOnce(async (attemptSession) => {
- const runtime = attemptSession as ProxySession & AttemptRuntime;
- runtime.responseController = controller2;
- runtime.clearResponseTimeout = vi.fn();
- return createStreamingResponse({
- label: "p2",
- firstChunkDelayMs: 400,
- controller: controller2,
- });
- });
- doForward.mockImplementationOnce(async (attemptSession) => {
- const runtime = attemptSession as ProxySession & AttemptRuntime;
- runtime.responseController = controller3;
- runtime.clearResponseTimeout = vi.fn();
- return createStreamingResponse({
- label: "p3",
- firstChunkDelayMs: 20,
- controller: controller3,
- });
- });
- const responsePromise = ProxyForwarder.send(session);
- await vi.advanceTimersByTimeAsync(200);
- expect(doForward).toHaveBeenCalledTimes(3);
- await vi.advanceTimersByTimeAsync(25);
- const response = await responsePromise;
- expect(await response.text()).toContain('"provider":"p3"');
- expect(controller1.signal.aborted).toBe(true);
- expect(controller2.signal.aborted).toBe(true);
- expect(controller3.signal.aborted).toBe(false);
- expect(mocks.recordFailure).not.toHaveBeenCalled();
- expect(mocks.recordSuccess).not.toHaveBeenCalled();
- expect(session.provider?.id).toBe(3);
- } finally {
- vi.useRealTimers();
- }
- });
- test("client abort before any winner should abort all in-flight attempts, return 499, and clear sticky provider binding", async () => {
- vi.useFakeTimers();
- try {
- const provider1 = createProvider({ id: 1, name: "p1", firstByteTimeoutStreamingMs: 100 });
- const provider2 = createProvider({ id: 2, name: "p2", firstByteTimeoutStreamingMs: 100 });
- const clientAbortController = new AbortController();
- const session = createSession(clientAbortController.signal);
- session.setProvider(provider1);
- mocks.pickRandomProviderWithExclusion.mockResolvedValueOnce(provider2);
- const doForward = vi.spyOn(
- ProxyForwarder as unknown as {
- doForward: (...args: unknown[]) => Promise<Response>;
- },
- "doForward"
- );
- const controller1 = new AbortController();
- const controller2 = new AbortController();
- doForward.mockImplementationOnce(async (attemptSession) => {
- const runtime = attemptSession as ProxySession & AttemptRuntime;
- runtime.responseController = controller1;
- runtime.clearResponseTimeout = vi.fn();
- return createStreamingResponse({
- label: "p1",
- firstChunkDelayMs: 500,
- controller: controller1,
- });
- });
- doForward.mockImplementationOnce(async (attemptSession) => {
- const runtime = attemptSession as ProxySession & AttemptRuntime;
- runtime.responseController = controller2;
- runtime.clearResponseTimeout = vi.fn();
- return createStreamingResponse({
- label: "p2",
- firstChunkDelayMs: 500,
- controller: controller2,
- });
- });
- const responsePromise = ProxyForwarder.send(session);
- const rejection = expect(responsePromise).rejects.toMatchObject({
- statusCode: 499,
- });
- await vi.advanceTimersByTimeAsync(100);
- expect(doForward).toHaveBeenCalledTimes(2);
- clientAbortController.abort(new Error("client_cancelled"));
- await vi.runAllTimersAsync();
- await rejection;
- expect(controller1.signal.aborted).toBe(true);
- expect(controller2.signal.aborted).toBe(true);
- expect(mocks.clearSessionProvider).toHaveBeenCalledWith("sess-hedge");
- expect(mocks.recordFailure).not.toHaveBeenCalled();
- expect(mocks.recordSuccess).not.toHaveBeenCalled();
- } finally {
- vi.useRealTimers();
- }
- });
- test("hedge launcher rejection should settle request instead of hanging", async () => {
- vi.useFakeTimers();
- try {
- const provider1 = createProvider({ id: 1, name: "p1", firstByteTimeoutStreamingMs: 100 });
- const session = createSession();
- session.setProvider(provider1);
- mocks.pickRandomProviderWithExclusion.mockRejectedValueOnce(new Error("selector down"));
- const doForward = vi.spyOn(
- ProxyForwarder as unknown as {
- doForward: (...args: unknown[]) => Promise<Response>;
- },
- "doForward"
- );
- const controller1 = new AbortController();
- doForward.mockImplementationOnce(async (attemptSession) => {
- const runtime = attemptSession as ProxySession & AttemptRuntime;
- runtime.responseController = controller1;
- runtime.clearResponseTimeout = vi.fn();
- return createStreamingResponse({
- label: "p1",
- firstChunkDelayMs: 500,
- controller: controller1,
- });
- });
- const responsePromise = ProxyForwarder.send(session);
- const rejection = expect(responsePromise).rejects.toMatchObject({
- statusCode: 503,
- });
- await vi.advanceTimersByTimeAsync(100);
- await vi.runAllTimersAsync();
- await rejection;
- expect(controller1.signal.aborted).toBe(true);
- } finally {
- vi.useRealTimers();
- }
- });
- test("strict endpoint pool exhaustion should converge to terminal fallback instead of provider-specific error", async () => {
- vi.useFakeTimers();
- try {
- const provider1 = createProvider({
- id: 1,
- name: "p1",
- providerType: "claude",
- providerVendorId: 123,
- firstByteTimeoutStreamingMs: 100,
- });
- const session = createSession();
- session.requestUrl = new URL("https://example.com/v1/messages");
- session.setProvider(provider1);
- mocks.getPreferredProviderEndpoints.mockRejectedValueOnce(new Error("Redis connection lost"));
- mocks.pickRandomProviderWithExclusion.mockResolvedValueOnce(null);
- const responsePromise = ProxyForwarder.send(session);
- const errorPromise = responsePromise.catch((rejection) => rejection as UpstreamProxyError);
- await vi.runAllTimersAsync();
- const error = await errorPromise;
- expect(mocks.pickRandomProviderWithExclusion).toHaveBeenCalled();
- expect(error).toBeInstanceOf(UpstreamProxyError);
- expect(error.statusCode).toBe(503);
- expect(error.message).toBe("所有供应商暂时不可用,请稍后重试");
- } finally {
- vi.useRealTimers();
- }
- });
- test.each([
- {
- name: "provider error",
- category: ProxyErrorCategory.PROVIDER_ERROR,
- errorFactory: (provider: Provider) =>
- new UpstreamProxyError("Provider returned 401: invalid key", 401, {
- body: '{"error":"invalid_api_key"}',
- providerId: provider.id,
- providerName: provider.name,
- }),
- },
- {
- name: "resource not found",
- category: ProxyErrorCategory.RESOURCE_NOT_FOUND,
- errorFactory: (provider: Provider) =>
- new UpstreamProxyError("Provider returned 404: model not found", 404, {
- body: '{"error":"model_not_found"}',
- providerId: provider.id,
- providerName: provider.name,
- }),
- },
- {
- name: "system error",
- category: ProxyErrorCategory.SYSTEM_ERROR,
- errorFactory: () => new Error("fetch failed"),
- },
- ])("when a real hedge race ends with only $name, terminal error should be generic fallback", async ({
- category,
- errorFactory,
- }) => {
- vi.useFakeTimers();
- try {
- const provider1 = createProvider({ id: 1, name: "p1", firstByteTimeoutStreamingMs: 100 });
- const provider2 = createProvider({ id: 2, name: "p2", firstByteTimeoutStreamingMs: 100 });
- const session = createSession();
- session.setProvider(provider1);
- mocks.pickRandomProviderWithExclusion
- .mockResolvedValueOnce(provider2)
- .mockResolvedValueOnce(null);
- mocks.categorizeErrorAsync.mockResolvedValueOnce(category).mockResolvedValueOnce(category);
- const doForward = vi.spyOn(
- ProxyForwarder as unknown as {
- doForward: (...args: unknown[]) => Promise<Response>;
- },
- "doForward"
- );
- const controller1 = new AbortController();
- const controller2 = new AbortController();
- doForward.mockImplementationOnce(async (attemptSession) => {
- const runtime = attemptSession as ProxySession & AttemptRuntime;
- runtime.responseController = controller1;
- runtime.clearResponseTimeout = vi.fn();
- return createDelayedFailure({
- delayMs: 150,
- error: errorFactory(provider1),
- controller: controller1,
- });
- });
- doForward.mockImplementationOnce(async (attemptSession) => {
- const runtime = attemptSession as ProxySession & AttemptRuntime;
- runtime.responseController = controller2;
- runtime.clearResponseTimeout = vi.fn();
- return createDelayedFailure({
- delayMs: 160,
- error: errorFactory(provider2),
- controller: controller2,
- });
- });
- const responsePromise = ProxyForwarder.send(session);
- const errorPromise = responsePromise.catch((rejection) => rejection as UpstreamProxyError);
- await vi.advanceTimersByTimeAsync(100);
- expect(doForward).toHaveBeenCalledTimes(2);
- await vi.runAllTimersAsync();
- const error = await errorPromise;
- expect(error).toBeInstanceOf(UpstreamProxyError);
- expect(error.statusCode).toBe(503);
- expect(error.message).toBe("所有供应商暂时不可用,请稍后重试");
- expect(error.message).not.toContain("invalid key");
- expect(error.message).not.toContain("model not found");
- expect(mocks.clearSessionProvider).toHaveBeenCalledWith("sess-hedge");
- } finally {
- vi.useRealTimers();
- }
- });
- test("non-retryable client errors should stop hedge immediately and preserve original error", async () => {
- const provider1 = createProvider({ id: 1, name: "p1", firstByteTimeoutStreamingMs: 100 });
- const provider2 = createProvider({ id: 2, name: "p2", firstByteTimeoutStreamingMs: 100 });
- const session = createSession();
- session.setProvider(provider1);
- const originalError = new UpstreamProxyError("prompt too long", 400, {
- body: '{"error":"prompt_too_long"}',
- providerId: provider1.id,
- providerName: provider1.name,
- });
- mocks.pickRandomProviderWithExclusion.mockResolvedValueOnce(provider2);
- mocks.categorizeErrorAsync.mockResolvedValueOnce(ProxyErrorCategory.NON_RETRYABLE_CLIENT_ERROR);
- const doForward = vi.spyOn(
- ProxyForwarder as unknown as {
- doForward: (...args: unknown[]) => Promise<Response>;
- },
- "doForward"
- );
- doForward.mockRejectedValueOnce(originalError);
- const error = await ProxyForwarder.send(session).catch(
- (rejection) => rejection as UpstreamProxyError
- );
- expect(error).toBe(originalError);
- expect(error.message).toBe("prompt too long");
- expect(doForward).toHaveBeenCalledTimes(1);
- expect(mocks.pickRandomProviderWithExclusion).not.toHaveBeenCalled();
- expect(mocks.clearSessionProvider).toHaveBeenCalledWith("sess-hedge");
- expect(session.getProviderChain()).toEqual(
- expect.arrayContaining([
- expect.objectContaining({
- reason: "client_error_non_retryable",
- statusCode: 400,
- }),
- ])
- );
- });
- test("hedge 备选供应商命中 thinking signature 错误时,应整流后在同供应商重试并保留审计", async () => {
- vi.useFakeTimers();
- try {
- const provider1 = createProvider({ id: 1, name: "p1", firstByteTimeoutStreamingMs: 100 });
- const provider2 = createProvider({ id: 2, name: "p2", firstByteTimeoutStreamingMs: 100 });
- const session = createSession();
- session.setProvider(provider1);
- withThinkingBlocks(session);
- mocks.pickRandomProviderWithExclusion.mockResolvedValueOnce(provider2);
- mocks.categorizeErrorAsync.mockResolvedValue(ProxyErrorCategory.NON_RETRYABLE_CLIENT_ERROR);
- const signatureError = new UpstreamProxyError(
- "Invalid `signature` in `thinking` block",
- 400,
- {
- body: '{"error":"invalid_signature"}',
- providerId: provider2.id,
- providerName: provider2.name,
- }
- );
- const doForward = vi.spyOn(
- ProxyForwarder as unknown as {
- doForward: (...args: unknown[]) => Promise<Response>;
- },
- "doForward"
- );
- const controller1 = new AbortController();
- const controller2First = new AbortController();
- const controller2Retry = new AbortController();
- doForward.mockImplementationOnce(async (attemptSession) => {
- const runtime = attemptSession as ProxySession & AttemptRuntime;
- runtime.responseController = controller1;
- runtime.clearResponseTimeout = vi.fn();
- return createStreamingResponse({
- label: "p1",
- firstChunkDelayMs: 600,
- controller: controller1,
- });
- });
- doForward.mockImplementationOnce(async (attemptSession) => {
- const runtime = attemptSession as ProxySession & AttemptRuntime;
- runtime.responseController = controller2First;
- runtime.clearResponseTimeout = vi.fn();
- return createDelayedFailure({
- delayMs: 50,
- error: signatureError,
- controller: controller2First,
- });
- });
- doForward.mockImplementationOnce(async (attemptSession) => {
- const runtime = attemptSession as ProxySession & AttemptRuntime;
- const body = runtime.request.message as {
- messages: Array<{ content: Array<Record<string, unknown>> }>;
- };
- const blocks = body.messages[0].content;
- expect(blocks.some((block) => block.type === "thinking")).toBe(false);
- expect(blocks.some((block) => block.type === "redacted_thinking")).toBe(false);
- expect(blocks.some((block) => "signature" in block)).toBe(false);
- runtime.responseController = controller2Retry;
- runtime.clearResponseTimeout = vi.fn();
- return createStreamingResponse({
- label: "p2-rectified",
- firstChunkDelayMs: 180,
- controller: controller2Retry,
- });
- });
- const responsePromise = ProxyForwarder.send(session);
- await vi.advanceTimersByTimeAsync(100);
- expect(doForward).toHaveBeenCalledTimes(2);
- await vi.advanceTimersByTimeAsync(55);
- expect(doForward).toHaveBeenCalledTimes(3);
- await vi.advanceTimersByTimeAsync(200);
- const response = await responsePromise;
- expect(await response.text()).toContain('"provider":"p2-rectified"');
- expect(session.provider?.id).toBe(2);
- expect(controller1.signal.aborted).toBe(true);
- expect(mocks.pickRandomProviderWithExclusion).toHaveBeenCalled();
- expect(mocks.storeSessionSpecialSettings).toHaveBeenCalledWith(
- "sess-hedge",
- expect.arrayContaining([
- expect.objectContaining({
- type: "thinking_signature_rectifier",
- hit: true,
- providerId: 2,
- }),
- ]),
- 1
- );
- } finally {
- vi.useRealTimers();
- }
- });
- test("hedge 路径命中 thinking budget 错误时,应整流后在同供应商重试", async () => { // Title in English: "when the hedge path hits a thinking-budget error, rectify and retry on the same provider".
- vi.useFakeTimers(); // Fake timers let the test step through the attempt timeline deterministically; real timers are restored in the finally block.
- try {
- const provider1 = createProvider({ id: 1, name: "p1", firstByteTimeoutStreamingMs: 100 }); // Both providers are created with a 100 ms streaming first-byte timeout.
- const provider2 = createProvider({ id: 2, name: "p2", firstByteTimeoutStreamingMs: 100 });
- const session = createSession();
- session.setProvider(provider1); // The request starts on provider1.
- session.request.message = { // Streaming request whose thinking budget (500) is below the 1024 minimum quoted in budgetError's message.
- model: "claude-test",
- stream: true,
- max_tokens: 1000,
- thinking: { type: "enabled", budget_tokens: 500 },
- messages: [{ role: "user", content: "hi" }],
- };
- mocks.pickRandomProviderWithExclusion.mockResolvedValueOnce(provider2); // The single alternative-provider pick resolves to provider2.
- mocks.categorizeErrorAsync.mockResolvedValue(ProxyErrorCategory.NON_RETRYABLE_CLIENT_ERROR); // Every error is categorized as a non-retryable client error in this test.
- const budgetError = new UpstreamProxyError( // HTTP 400 budget error attributed to provider1.
- "thinking.enabled.budget_tokens: Input should be greater than or equal to 1024",
- 400,
- {
- body: '{"error":"budget_too_low"}',
- providerId: provider1.id,
- providerName: provider1.name,
- }
- );
- const doForward = vi.spyOn( // Spy on doForward; the cast exposes it to the spy API (presumably it is not part of the public type; confirm).
- ProxyForwarder as unknown as {
- doForward: (...args: unknown[]) => Promise<Response>;
- },
- "doForward"
- );
- const controller1First = new AbortController(); // One controller per expected doForward call: provider1 first try, provider1 retry, provider2.
- const controller1Retry = new AbortController();
- const controller2 = new AbortController();
- doForward.mockImplementationOnce(async (attemptSession) => { // 1st call: provider1's initial attempt.
- const runtime = attemptSession as ProxySession & AttemptRuntime;
- runtime.responseController = controller1First;
- runtime.clearResponseTimeout = vi.fn();
- return createDelayedFailure({ // Presumably rejects with budgetError after 140 ms, i.e. after the 100 ms first-byte timeout; confirm against the helper.
- delayMs: 140,
- error: budgetError,
- controller: controller1First,
- });
- });
- doForward.mockImplementationOnce(async (attemptSession) => { // 2nd call: the attempt on provider2.
- const runtime = attemptSession as ProxySession & AttemptRuntime;
- runtime.responseController = controller2;
- runtime.clearResponseTimeout = vi.fn();
- return createStreamingResponse({ // First chunk is configured for 500 ms, later than the total time this test advances (195 ms).
- label: "p2",
- firstChunkDelayMs: 500,
- controller: controller2,
- });
- });
- doForward.mockImplementationOnce(async (attemptSession) => { // 3rd call: the retry after rectification.
- const runtime = attemptSession as ProxySession & AttemptRuntime;
- const body = runtime.request.message as {
- max_tokens: number;
- thinking: { type: string; budget_tokens: number };
- };
- expect(body.max_tokens).toBe(64000); // The retry body must carry the rectified values rather than the original 1000 / 500.
- expect(body.thinking.type).toBe("enabled");
- expect(body.thinking.budget_tokens).toBe(32000);
- runtime.responseController = controller1Retry;
- runtime.clearResponseTimeout = vi.fn();
- return createStreamingResponse({
- label: "p1-budget-rectified",
- firstChunkDelayMs: 40,
- controller: controller1Retry,
- });
- });
- const responsePromise = ProxyForwarder.send(session); // Not awaited yet: the fake clock must be advanced first.
- await vi.advanceTimersByTimeAsync(100); // t = 100 ms: the first-byte timeout value configured for both providers.
- expect(doForward).toHaveBeenCalledTimes(2); // A second attempt must have been launched by now.
- await vi.advanceTimersByTimeAsync(45); // t = 145 ms: past the 140 ms delay configured for the first attempt's failure.
- expect(doForward).toHaveBeenCalledTimes(3); // The rectified retry must have been issued.
- await vi.advanceTimersByTimeAsync(50); // t = 195 ms: covers the retry's 40 ms first-chunk delay.
- const response = await responsePromise;
- expect(await response.text()).toContain('"provider":"p1-budget-rectified"'); // The rectified retry's stream is the one returned.
- expect(session.provider?.id).toBe(1); // The session ends bound to provider1, not provider2.
- expect(mocks.pickRandomProviderWithExclusion).toHaveBeenCalledTimes(1); // Only one alternative-provider pick happened; the retry did not trigger another.
- expect(session.getSpecialSettings()).toEqual( // The rectifier hit must be recorded on the session for provider 1.
- expect.arrayContaining([
- expect.objectContaining({
- type: "thinking_budget_rectifier",
- hit: true,
- providerId: 1,
- }),
- ])
- );
- } finally {
- vi.useRealTimers(); // Always restore real timers, even if an assertion above throws.
- }
- });
- test("endpoint resolution failure should not inflate launchedProviderCount, winner gets request_success not hedge_winner", async () => { // Checks the provider-chain reason when provider1 fails before forwarding and provider2 serves the request.
- vi.useFakeTimers(); // Fake timers drive the streaming delay deterministically; real timers are restored in the finally block.
- try {
- const provider1 = createProvider({ // provider1 has a vendor id (123); provider2 below has none (null).
- id: 1,
- name: "p1",
- providerVendorId: 123,
- firstByteTimeoutStreamingMs: 100,
- });
- const provider2 = createProvider({
- id: 2,
- name: "p2",
- providerVendorId: null,
- firstByteTimeoutStreamingMs: 100,
- });
- const session = createSession();
- session.requestUrl = new URL("https://example.com/v1/messages");
- session.setProvider(provider1); // The request starts on provider1.
- // Provider 1's strict endpoint resolution will fail
- mocks.getPreferredProviderEndpoints.mockRejectedValueOnce( // Only the first endpoint lookup rejects.
- new Error("Endpoint resolution failed")
- );
- // After provider 1 fails, pick provider 2 as alternative
- mocks.pickRandomProviderWithExclusion.mockResolvedValueOnce(provider2);
- const doForward = vi.spyOn( // Spy on doForward; the cast exposes it to the spy API (presumably it is not part of the public type; confirm).
- ProxyForwarder as unknown as {
- doForward: (...args: unknown[]) => Promise<Response>;
- },
- "doForward"
- );
- const controller2 = new AbortController();
- // Only provider 2 reaches doForward (provider 1 fails at endpoint resolution)
- doForward.mockImplementationOnce(async (attemptSession) => {
- const runtime = attemptSession as ProxySession & AttemptRuntime;
- runtime.responseController = controller2;
- runtime.clearResponseTimeout = vi.fn();
- return createStreamingResponse({ // First chunk is configured for 10 ms, well inside the 200 ms advanced below.
- label: "p2",
- firstChunkDelayMs: 10,
- controller: controller2,
- });
- });
- const responsePromise = ProxyForwarder.send(session); // Not awaited yet: the fake clock must be advanced first.
- await vi.advanceTimersByTimeAsync(200);
- const response = await responsePromise;
- expect(await response.text()).toContain('"provider":"p2"'); // provider2's stream is the one returned.
- expect(session.provider?.id).toBe(2); // The session ends bound to provider2.
- // Key assertion: since only provider 2 actually launched (provider 1 failed at
- // endpoint resolution before incrementing launchedProviderCount), the winner
- // should be classified as "request_success" not "hedge_winner".
- const chain = session.getProviderChain();
- const winnerEntry = chain.find( // First chain entry carrying either of the two winner reasons.
- (entry) => entry.reason === "request_success" || entry.reason === "hedge_winner"
- );
- expect(winnerEntry).toBeDefined();
- expect(winnerEntry!.reason).toBe("request_success"); // Non-null assertion is backed by the toBeDefined() check on the previous line.
- } finally {
- vi.useRealTimers(); // Always restore real timers, even if an assertion above throws.
- }
- });
- });
|