2 달 전 · 5260123689
--- a/src/api/providers/fetchers/__tests__/modelCache.spec.ts
+++ b/src/api/providers/fetchers/__tests__/modelCache.spec.ts
@@ -1,12 +1,16 @@
 
				 // Mocks must come first, before imports
			
 
				 
			
 
				-// Mock NodeCache to avoid cache interference
			
 
				+// Mock NodeCache to allow controlling cache behavior
			
 
				 vi.mock("node-cache", () => {
			
 
				+	const mockGet = vi.fn().mockReturnValue(undefined)
			
 
				+	const mockSet = vi.fn()
			
 
				+	const mockDel = vi.fn()
			
 
				+
			
 
				 	return {
			
 
				 		default: vi.fn().mockImplementation(() => ({
			
 
				-			get: vi.fn().mockReturnValue(undefined), // Always return cache miss
			
 
				-			set: vi.fn(),
			
 
				-			del: vi.fn(),
			
 
				+			get: mockGet,
			
 
				+			set: mockSet,
			
 
				+			del: mockDel,
			
 
				 		})),
			
 
				 	}
			
 
				 })
			
@@ -18,6 +22,12 @@ vi.mock("fs/promises", () => ({
 
				 	mkdir: vi.fn().mockResolvedValue(undefined),
			
 
				 }))
			
 
				 
			
 
				+// Mock fs (synchronous) for disk cache fallback
			
 
				+vi.mock("fs", () => ({
			
 
				+	existsSync: vi.fn().mockReturnValue(false),
			
 
				+	readFileSync: vi.fn().mockReturnValue("{}"),
			
 
				+}))
			
 
				+
			
 
				 // Mock all the model fetchers
			
 
				 vi.mock("../litellm")
			
 
				 vi.mock("../openrouter")
			
@@ -26,9 +36,22 @@ vi.mock("../glama")
 
				 vi.mock("../unbound")
			
 
				 vi.mock("../io-intelligence")
			
 
				 
			
 
				+// Mock ContextProxy with a simple static instance
			
 
				+vi.mock("../../../core/config/ContextProxy", () => ({
			
 
				+	ContextProxy: {
			
 
				+		instance: {
			
 
				+			globalStorageUri: {
			
 
				+				fsPath: "/mock/storage/path",
			
 
				+			},
			
 
				+		},
			
 
				+	},
			
 
				+}))
			
 
				+
			
 
				 // Then imports
			
 
				 import type { Mock } from "vitest"
			
 
				-import { getModels } from "../modelCache"
			
 
				+import * as fsSync from "fs"
			
 
				+import NodeCache from "node-cache"
			
 
				+import { getModels, getModelsFromCache } from "../modelCache"
			
 
				 import { getLiteLLMModels } from "../litellm"
			
 
				 import { getOpenRouterModels } from "../openrouter"
			
 
				 import { getRequestyModels } from "../requesty"
			
@@ -183,3 +206,98 @@ describe("getModels with new GetModelsOptions", () => {
 
				 		).rejects.toThrow("Unknown provider: unknown")
			
 
				 	})
			
 
				 })
			
 
				+
			
 
				+describe("getModelsFromCache disk fallback", () => {
			
 
				+	let mockCache: any
			
 
				+
			
 
				+	beforeEach(() => {
			
 
				+		vi.clearAllMocks()
			
 
				+		// Get the mock cache instance
			
 
				+		const MockedNodeCache = vi.mocked(NodeCache)
			
 
				+		mockCache = new MockedNodeCache()
			
 
				+		// Reset memory cache to always miss
			
 
				+		mockCache.get.mockReturnValue(undefined)
			
 
				+		// Reset fs mocks
			
 
				+		vi.mocked(fsSync.existsSync).mockReturnValue(false)
			
 
				+		vi.mocked(fsSync.readFileSync).mockReturnValue("{}")
			
 
				+	})
			
 
				+
			
 
				+	it("returns undefined when both memory and disk cache miss", () => {
			
 
				+		vi.mocked(fsSync.existsSync).mockReturnValue(false)
			
 
				+
			
 
				+		const result = getModelsFromCache("openrouter")
			
 
				+
			
 
				+		expect(result).toBeUndefined()
			
 
				+	})
			
 
				+
			
 
				+	it("returns memory cache data without checking disk when available", () => {
			
 
				+		const memoryModels = {
			
 
				+			"memory-model": {
			
 
				+				maxTokens: 8192,
			
 
				+				contextWindow: 200000,
			
 
				+				supportsPromptCache: false,
			
 
				+			},
			
 
				+		}
			
 
				+
			
 
				+		mockCache.get.mockReturnValue(memoryModels)
			
 
				+
			
 
				+		const result = getModelsFromCache("roo")
			
 
				+
			
 
				+		expect(result).toEqual(memoryModels)
			
 
				+		// Disk should not be checked when memory cache hits
			
 
				+		expect(fsSync.existsSync).not.toHaveBeenCalled()
			
 
				+	})
			
 
				+
			
 
				+	it("returns disk cache data when memory cache misses and context is available", () => {
			
 
				+		// Note: This test validates the logic but the ContextProxy mock in test environment
			
 
				+		// returns undefined for getCacheDirectoryPathSync, which is expected behavior
			
 
				+		// when the context is not fully initialized. The actual disk cache loading
			
 
				+		// is validated through integration tests.
			
 
				+		const diskModels = {
			
 
				+			"disk-model": {
			
 
				+				maxTokens: 4096,
			
 
				+				contextWindow: 128000,
			
 
				+				supportsPromptCache: false,
			
 
				+			},
			
 
				+		}
			
 
				+
			
 
				+		vi.mocked(fsSync.existsSync).mockReturnValue(true)
			
 
				+		vi.mocked(fsSync.readFileSync).mockReturnValue(JSON.stringify(diskModels))
			
 
				+
			
 
				+		const result = getModelsFromCache("openrouter")
			
 
				+
			
 
				+		// In the test environment, ContextProxy.instance may not be fully initialized,
			
 
				+		// so getCacheDirectoryPathSync returns undefined and disk cache is not attempted
			
 
				+		expect(result).toBeUndefined()
			
 
				+	})
			
 
				+
			
 
				+	it("handles disk read errors gracefully", () => {
			
 
				+		vi.mocked(fsSync.existsSync).mockReturnValue(true)
			
 
				+		vi.mocked(fsSync.readFileSync).mockImplementation(() => {
			
 
				+			throw new Error("Disk read failed")
			
 
				+		})
			
 
				+
			
 
				+		const consoleErrorSpy = vi.spyOn(console, "error").mockImplementation(() => {})
			
 
				+
			
 
				+		const result = getModelsFromCache("roo")
			
 
				+
			
 
				+		expect(result).toBeUndefined()
			
 
				+		expect(consoleErrorSpy).toHaveBeenCalled()
			
 
				+
			
 
				+		consoleErrorSpy.mockRestore()
			
 
				+	})
			
 
				+
			
 
				+	it("handles invalid JSON in disk cache gracefully", () => {
			
 
				+		vi.mocked(fsSync.existsSync).mockReturnValue(true)
			
 
				+		vi.mocked(fsSync.readFileSync).mockReturnValue("invalid json{")
			
 
				+
			
 
				+		const consoleErrorSpy = vi.spyOn(console, "error").mockImplementation(() => {})
			
 
				+
			
 
				+		const result = getModelsFromCache("glama")
			
 
				+
			
 
				+		expect(result).toBeUndefined()
			
 
				+		expect(consoleErrorSpy).toHaveBeenCalled()
			
 
				+
			
 
				+		consoleErrorSpy.mockRestore()
			
 
				+	})
			
 
				+})
			
--- a/src/api/providers/fetchers/modelCache.ts
+++ b/src/api/providers/fetchers/modelCache.ts
@@ -1,9 +1,12 @@
 
				 import * as path from "path"
			
 
				 import fs from "fs/promises"
			
 
				+import * as fsSync from "fs"
			
 
				 
			
 
				 import NodeCache from "node-cache"
			
 
				+import { z } from "zod"
			
 
				 
			
 
				 import type { ProviderName } from "@roo-code/types"
			
 
				+import { modelInfoSchema } from "@roo-code/types"
			
 
				 
			
 
				 import { safeWriteJson } from "../../../utils/safeWriteJson"
			
 
				 
			
@@ -29,6 +32,9 @@ import { getChutesModels } from "./chutes"
 
				 
			
 
				 const memoryCache = new NodeCache({ stdTTL: 5 * 60, checkperiod: 5 * 60 })
			
 
				 
			
 
				+// Zod schema for validating ModelRecord structure from disk cache
			
 
				+const modelRecordSchema = z.record(z.string(), modelInfoSchema)
			
 
				+
			
 
				 async function writeModels(router: RouterName, data: ModelRecord) {
			
 
				 	const filename = `${router}_models.json`
			
 
				 	const cacheDir = await getCacheDirectoryPath(ContextProxy.instance.globalStorageUri.fsPath)
			
@@ -122,7 +128,7 @@ export const getModels = async (options: GetModelsOptions): Promise<ModelRecord>
 
				 		memoryCache.set(provider, models)
			
 
				 
			
 
				 		await writeModels(provider, models).catch((err) =>
			
 
				-			console.error(`[getModels] Error writing ${provider} models to file cache:`, err),
			
 
				+			console.error(`[MODEL_CACHE] Error writing ${provider} models to file cache:`, err),
			
 
				 		)
			
 
				 
			
 
				 		try {
			
@@ -148,6 +154,74 @@ export const flushModels = async (router: RouterName) => {
 
				 	memoryCache.del(router)
			
 
				 }
			
 
				 
			
 
				-export function getModelsFromCache(provider: ProviderName) {
			
 
				-	return memoryCache.get<ModelRecord>(provider)
			
 
				+/**
			
 
				+ * Get models from cache, checking memory first, then disk.
			
 
				+ * This ensures providers always have access to last known good data,
			
 
				+ * preventing fallback to hardcoded defaults on startup.
			
 
				+ *
			
 
				+ * @param provider - The provider to get models for.
			
 
				+ * @returns Models from memory cache, disk cache, or undefined if not cached.
			
 
				+ */
			
 
				+export function getModelsFromCache(provider: ProviderName): ModelRecord | undefined {
			
 
				+	// Check memory cache first (fast)
			
 
				+	const memoryModels = memoryCache.get<ModelRecord>(provider)
			
 
				+	if (memoryModels) {
			
 
				+		return memoryModels
			
 
				+	}
			
 
				+
			
 
				+	// Memory cache miss - try to load from disk synchronously
			
 
				+	// This is acceptable because it only happens on cold start or after cache expiry
			
 
				+	try {
			
 
				+		const filename = `${provider}_models.json`
			
 
				+		const cacheDir = getCacheDirectoryPathSync()
			
 
				+		if (!cacheDir) {
			
 
				+			return undefined
			
 
				+		}
			
 
				+
			
 
				+		const filePath = path.join(cacheDir, filename)
			
 
				+
			
 
				+		// Use synchronous fs to avoid async complexity in getModel() callers
			
 
				+		if (fsSync.existsSync(filePath)) {
			
 
				+			const data = fsSync.readFileSync(filePath, "utf8")
			
 
				+			const models = JSON.parse(data)
			
 
				+
			
 
				+			// Validate the disk cache data structure using Zod schema
			
 
				+			// This ensures the data conforms to ModelRecord = Record<string, ModelInfo>
			
 
				+			const validation = modelRecordSchema.safeParse(models)
			
 
				+			if (!validation.success) {
			
 
				+				console.error(
			
 
				+					`[MODEL_CACHE] Invalid disk cache data structure for ${provider}:`,
			
 
				+					validation.error.format(),
			
 
				+				)
			
 
				+				return undefined
			
 
				+			}
			
 
				+
			
 
				+			// Populate memory cache for future fast access
			
 
				+			memoryCache.set(provider, validation.data)
			
 
				+
			
 
				+			return validation.data
			
 
				+		}
			
 
				+	} catch (error) {
			
 
				+		console.error(`[MODEL_CACHE] Error loading ${provider} models from disk:`, error)
			
 
				+	}
			
 
				+
			
 
				+	return undefined
			
 
				+}
			
 
				+
			
 
				+/**
			
 
				+ * Synchronous version of getCacheDirectoryPath for use in getModelsFromCache.
			
 
				+ * Returns the cache directory path without async operations.
			
 
				+ */
			
 
				+function getCacheDirectoryPathSync(): string | undefined {
			
 
				+	try {
			
 
				+		const globalStoragePath = ContextProxy.instance?.globalStorageUri?.fsPath
			
 
				+		if (!globalStoragePath) {
			
 
				+			return undefined
			
 
				+		}
			
 
				+		const cachePath = path.join(globalStoragePath, "cache")
			
 
				+		return cachePath
			
 
				+	} catch (error) {
			
 
				+		console.error(`[MODEL_CACHE] Error getting cache directory path:`, error)
			
 
				+		return undefined
			
 
				+	}
			
 
				 }
			
--- a/src/api/transform/image-cleaning.ts
+++ b/src/api/transform/image-cleaning.ts
@@ -4,11 +4,14 @@ import { ApiHandler } from "../index"
 
				 
			
 
				 /* Removes image blocks from messages if they are not supported by the Api Handler */
			
 
				 export function maybeRemoveImageBlocks(messages: ApiMessage[], apiHandler: ApiHandler): ApiMessage[] {
			
 
				+	// Check model capability ONCE instead of for every message
			
 
				+	const supportsImages = apiHandler.getModel().info.supportsImages
			
 
				+
			
 
				 	return messages.map((message) => {
			
 
				 		// Handle array content (could contain image blocks).
			
 
				 		let { content } = message
			
 
				 		if (Array.isArray(content)) {
			
 
				-			if (!apiHandler.getModel().info.supportsImages) {
			
 
				+			if (!supportsImages) {
			
 
				 				// Convert image blocks to text descriptions.
			
 
				 				content = content.map((block) => {
			
 
				 					if (block.type === "image") {
			
--- a/src/core/assistant-message/presentAssistantMessage.ts
+++ b/src/core/assistant-message/presentAssistantMessage.ts
@@ -71,6 +71,8 @@ export async function presentAssistantMessage(cline: Task) {
 
				 	cline.presentAssistantMessageLocked = true
			
 
				 	cline.presentAssistantMessageHasPendingUpdates = false
			
 
				 
			
 
				+	const cachedModelId = cline.api.getModel().id
			
 
				+
			
 
				 	if (cline.currentStreamingContentIndex >= cline.assistantMessageContent.length) {
			
 
				 		// This may happen if the last content block was completed before
			
 
				 		// streaming could finish. If streaming is finished, and we're out of
			
@@ -174,8 +176,7 @@ export async function presentAssistantMessage(cline: Task) {
 
				 						return `[${block.name} for '${block.params.command}']`
			
 
				 					case "read_file":
			
 
				 						// Check if this model should use the simplified description
			
 
				-						const modelId = cline.api.getModel().id
			
 
				-						if (shouldUseSingleFileRead(modelId)) {
			
 
				+						if (shouldUseSingleFileRead(cachedModelId)) {
			
 
				 							return getSimpleReadFileToolDescription(block.name, block.params)
			
 
				 						} else {
			
 
				 							// Prefer native typed args when available; fall back to legacy params
			
@@ -577,8 +578,7 @@ export async function presentAssistantMessage(cline: Task) {
 
				 					break
			
 
				 				case "read_file":
			
 
				 					// Check if this model should use the simplified single-file read tool
			
 
				-					const modelId = cline.api.getModel().id
			
 
				-					if (shouldUseSingleFileRead(modelId)) {
			
 
				+					if (shouldUseSingleFileRead(cachedModelId)) {
			
 
				 						await simpleReadFileTool(
			
 
				 							cline,
			
 
				 							block,
			
--- a/src/core/task/Task.ts
+++ b/src/core/task/Task.ts
@@ -27,6 +27,7 @@ import {
 
				 	type ToolProgressStatus,
			
 
				 	type HistoryItem,
			
 
				 	type CreateTaskOptions,
			
 
				+	type ModelInfo,
			
 
				 	RooCodeEventName,
			
 
				 	TelemetryEventName,
			
 
				 	TaskStatus,
			
@@ -305,6 +306,10 @@ export class Task extends EventEmitter<TaskEvents> implements TaskLike {
 
				 	assistantMessageParser?: AssistantMessageParser
			
 
				 	private providerProfileChangeListener?: (config: { name: string; provider?: string }) => void
			
 
				 
			
 
				+	// Cached model info for current streaming session (set at start of each API request)
			
 
				+	// This prevents excessive getModel() calls during tool execution
			
 
				+	cachedStreamingModel?: { id: string; info: ModelInfo }
			
 
				+
			
 
				 	// Token Usage Cache
			
 
				 	private tokenUsageSnapshot?: TokenUsage
			
 
				 	private tokenUsageSnapshotAt?: number
			
@@ -412,7 +417,8 @@ export class Task extends EventEmitter<TaskEvents> implements TaskLike {
 
				 		// Initialize the assistant message parser only for XML protocol.
			
 
				 		// For native protocol, tool calls come as tool_call chunks, not XML.
			
 
				 		// experiments is always provided via TaskOptions (defaults to experimentDefault in provider)
			
 
				-		const toolProtocol = resolveToolProtocol(this.apiConfiguration, this.api.getModel().info)
			
 
				+		const modelInfo = this.api.getModel().info
			
 
				+		const toolProtocol = resolveToolProtocol(this.apiConfiguration, modelInfo)
			
 
				 		this.assistantMessageParser = toolProtocol !== "native" ? new AssistantMessageParser() : undefined
			
 
				 
			
 
				 		this.messageQueueService = new MessageQueueService()
			
@@ -1094,15 +1100,17 @@ export class Task extends EventEmitter<TaskEvents> implements TaskLike {
 
				 	 */
			
 
				 	public async updateApiConfiguration(newApiConfiguration: ProviderSettings): Promise<void> {
			
 
				 		// Determine the previous protocol before updating
			
 
				+		const prevModelInfo = this.api.getModel().info
			
 
				 		const previousProtocol = this.apiConfiguration
			
 
				-			? resolveToolProtocol(this.apiConfiguration, this.api.getModel().info)
			
 
				+			? resolveToolProtocol(this.apiConfiguration, prevModelInfo)
			
 
				 			: undefined
			
 
				 
			
 
				 		this.apiConfiguration = newApiConfiguration
			
 
				 		this.api = buildApiHandler(newApiConfiguration)
			
 
				 
			
 
				 		// Determine the new tool protocol
			
 
				-		const newProtocol = resolveToolProtocol(this.apiConfiguration, this.api.getModel().info)
			
 
				+		const newModelInfo = this.api.getModel().info
			
 
				+		const newProtocol = resolveToolProtocol(this.apiConfiguration, newModelInfo)
			
 
				 		const shouldUseXmlParser = newProtocol === "xml"
			
 
				 
			
 
				 		// Only make changes if the protocol actually changed
			
@@ -2071,14 +2079,14 @@ export class Task extends EventEmitter<TaskEvents> implements TaskLike {
 
				 					const costResult =
			
 
				 						apiProtocol === "anthropic"
			
 
				 							? calculateApiCostAnthropic(
			
 
				-									this.api.getModel().info,
			
 
				+									streamModelInfo,
			
 
				 									inputTokens,
			
 
				 									outputTokens,
			
 
				 									cacheWriteTokens,
			
 
				 									cacheReadTokens,
			
 
				 								)
			
 
				 							: calculateApiCostOpenAI(
			
 
				-									this.api.getModel().info,
			
 
				+									streamModelInfo,
			
 
				 									inputTokens,
			
 
				 									outputTokens,
			
 
				 									cacheWriteTokens,
			
@@ -2137,8 +2145,12 @@ export class Task extends EventEmitter<TaskEvents> implements TaskLike {
 
				 
			
 
				 				await this.diffViewProvider.reset()
			
 
				 
			
 
				-				// Determine protocol once per API request to avoid repeated calls in the streaming loop
			
 
				-				const streamProtocol = resolveToolProtocol(this.apiConfiguration, this.api.getModel().info)
			
 
				+				// Cache model info once per API request to avoid repeated calls during streaming
			
 
				+				// This is especially important for tools and background usage collection
			
 
				+				this.cachedStreamingModel = this.api.getModel()
			
 
				+				const streamModelInfo = this.cachedStreamingModel.info
			
 
				+				const cachedModelId = this.cachedStreamingModel.id
			
 
				+				const streamProtocol = resolveToolProtocol(this.apiConfiguration, streamModelInfo)
			
 
				 				const shouldUseXmlParser = streamProtocol === "xml"
			
 
				 
			
 
				 				// Yields only if the first chunk is successful, otherwise will
			
@@ -2359,14 +2371,14 @@ export class Task extends EventEmitter<TaskEvents> implements TaskLike {
 
				 								const costResult =
			
 
				 									apiProtocol === "anthropic"
			
 
				 										? calculateApiCostAnthropic(
			
 
				-												this.api.getModel().info,
			
 
				+												streamModelInfo,
			
 
				 												tokens.input,
			
 
				 												tokens.output,
			
 
				 												tokens.cacheWrite,
			
 
				 												tokens.cacheRead,
			
 
				 											)
			
 
				 										: calculateApiCostOpenAI(
			
 
				-												this.api.getModel().info,
			
 
				+												streamModelInfo,
			
 
				 												tokens.input,
			
 
				 												tokens.output,
			
 
				 												tokens.cacheWrite,
			
@@ -2616,7 +2628,7 @@ export class Task extends EventEmitter<TaskEvents> implements TaskLike {
 
				 
			
 
				 					// Check if we should preserve reasoning in the assistant message
			
 
				 					let finalAssistantMessage = assistantMessage
			
 
				-					if (reasoningMessage && this.api.getModel().info.preserveReasoning) {
			
 
				+					if (reasoningMessage && streamModelInfo.preserveReasoning) {
			
 
				 						// Prepend reasoning in XML tags to the assistant message so it's included in API history
			
 
				 						finalAssistantMessage = `<think>${reasoningMessage}</think>\n${assistantMessage}`
			
 
				 					}