|
|
@@ -3387,6 +3387,33 @@
|
|
|
],
|
|
|
"source": "https://devblogs.microsoft.com/foundry/whats-new-in-azure-ai-foundry-august-2025/#mistral-document-ai-(ocr)-%E2%80%94-serverless-in-foundry"
|
|
|
},
|
|
|
+ "azure_ai/doc-intelligence/prebuilt-read": {
|
|
|
+ "litellm_provider": "azure_ai",
|
|
|
+ "ocr_cost_per_page": 1.5e-3,
|
|
|
+ "mode": "ocr",
|
|
|
+ "supported_endpoints": [
|
|
|
+ "/v1/ocr"
|
|
|
+ ],
|
|
|
+ "source": "https://azure.microsoft.com/en-us/pricing/details/ai-document-intelligence/"
|
|
|
+ },
|
|
|
+ "azure_ai/doc-intelligence/prebuilt-layout": {
|
|
|
+ "litellm_provider": "azure_ai",
|
|
|
+ "ocr_cost_per_page": 1e-2,
|
|
|
+ "mode": "ocr",
|
|
|
+ "supported_endpoints": [
|
|
|
+ "/v1/ocr"
|
|
|
+ ],
|
|
|
+ "source": "https://azure.microsoft.com/en-us/pricing/details/ai-document-intelligence/"
|
|
|
+ },
|
|
|
+ "azure_ai/doc-intelligence/prebuilt-document": {
|
|
|
+ "litellm_provider": "azure_ai",
|
|
|
+ "ocr_cost_per_page": 1e-2,
|
|
|
+ "mode": "ocr",
|
|
|
+ "supported_endpoints": [
|
|
|
+ "/v1/ocr"
|
|
|
+ ],
|
|
|
+ "source": "https://azure.microsoft.com/en-us/pricing/details/ai-document-intelligence/"
|
|
|
+ },
|
|
|
"azure_ai/MAI-DS-R1": {
|
|
|
"input_cost_per_token": 1.35e-06,
|
|
|
"litellm_provider": "azure_ai",
|
|
|
@@ -10042,6 +10069,96 @@
|
|
|
"supports_vision": true,
|
|
|
"supports_web_search": true
|
|
|
},
|
|
|
+ "gemini-live-2.5-flash-preview-native-audio-09-2025": {
|
|
|
+ "cache_read_input_token_cost": 7.5e-08,
|
|
|
+ "input_cost_per_audio_token": 3e-06,
|
|
|
+ "input_cost_per_token": 3e-07,
|
|
|
+ "litellm_provider": "vertex_ai-language-models",
|
|
|
+ "max_audio_length_hours": 8.4,
|
|
|
+ "max_audio_per_prompt": 1,
|
|
|
+ "max_images_per_prompt": 3000,
|
|
|
+ "max_input_tokens": 1048576,
|
|
|
+ "max_output_tokens": 65535,
|
|
|
+ "max_pdf_size_mb": 30,
|
|
|
+ "max_tokens": 65535,
|
|
|
+ "max_video_length": 1,
|
|
|
+ "max_videos_per_prompt": 10,
|
|
|
+ "mode": "chat",
|
|
|
+ "output_cost_per_audio_token": 1.2e-05,
|
|
|
+ "output_cost_per_token": 2e-06,
|
|
|
+ "source": "https://ai.google.dev/gemini-api/docs/pricing",
|
|
|
+ "supported_endpoints": [
|
|
|
+ "/v1/chat/completions",
|
|
|
+ "/v1/completions"
|
|
|
+ ],
|
|
|
+ "supported_modalities": [
|
|
|
+ "text",
|
|
|
+ "image",
|
|
|
+ "audio",
|
|
|
+ "video"
|
|
|
+ ],
|
|
|
+ "supported_output_modalities": [
|
|
|
+ "text",
|
|
|
+ "audio"
|
|
|
+ ],
|
|
|
+ "supports_audio_input": true,
|
|
|
+ "supports_audio_output": true,
|
|
|
+ "supports_function_calling": true,
|
|
|
+ "supports_parallel_function_calling": true,
|
|
|
+ "supports_pdf_input": true,
|
|
|
+ "supports_prompt_caching": true,
|
|
|
+ "supports_response_schema": true,
|
|
|
+ "supports_system_messages": true,
|
|
|
+ "supports_tool_choice": true,
|
|
|
+ "supports_url_context": true,
|
|
|
+ "supports_vision": true,
|
|
|
+ "supports_web_search": true
|
|
|
+ },
|
|
|
+ "gemini/gemini-live-2.5-flash-preview-native-audio-09-2025": {
|
|
|
+ "cache_read_input_token_cost": 7.5e-08,
|
|
|
+ "input_cost_per_audio_token": 3e-06,
|
|
|
+ "input_cost_per_token": 3e-07,
|
|
|
+ "litellm_provider": "gemini",
|
|
|
+ "max_audio_length_hours": 8.4,
|
|
|
+ "max_audio_per_prompt": 1,
|
|
|
+ "max_images_per_prompt": 3000,
|
|
|
+ "max_input_tokens": 1048576,
|
|
|
+ "max_output_tokens": 65535,
|
|
|
+ "max_pdf_size_mb": 30,
|
|
|
+ "max_tokens": 65535,
|
|
|
+ "max_video_length": 1,
|
|
|
+ "max_videos_per_prompt": 10,
|
|
|
+ "mode": "chat",
|
|
|
+ "output_cost_per_audio_token": 1.2e-05,
|
|
|
+ "output_cost_per_token": 2e-06,
|
|
|
+ "source": "https://ai.google.dev/gemini-api/docs/pricing",
|
|
|
+ "supported_endpoints": [
|
|
|
+ "/v1/chat/completions",
|
|
|
+ "/v1/completions"
|
|
|
+ ],
|
|
|
+ "supported_modalities": [
|
|
|
+ "text",
|
|
|
+ "image",
|
|
|
+ "audio",
|
|
|
+ "video"
|
|
|
+ ],
|
|
|
+ "supported_output_modalities": [
|
|
|
+ "text",
|
|
|
+ "audio"
|
|
|
+ ],
|
|
|
+ "supports_audio_input": true,
|
|
|
+ "supports_audio_output": true,
|
|
|
+ "supports_function_calling": true,
|
|
|
+ "supports_parallel_function_calling": true,
|
|
|
+ "supports_pdf_input": true,
|
|
|
+ "supports_prompt_caching": true,
|
|
|
+ "supports_response_schema": true,
|
|
|
+ "supports_system_messages": true,
|
|
|
+ "supports_tool_choice": true,
|
|
|
+ "supports_url_context": true,
|
|
|
+ "supports_vision": true,
|
|
|
+ "supports_web_search": true
|
|
|
+ },
|
|
|
"gemini-2.5-flash-lite-preview-06-17": {
|
|
|
"cache_read_input_token_cost": 2.5e-08,
|
|
|
"input_cost_per_audio_token": 5e-07,
|
|
|
@@ -18211,15 +18328,6 @@
|
|
|
"output_cost_per_token": 2e-07,
|
|
|
"supports_tool_choice": true
|
|
|
},
|
|
|
- "openrouter/nvidia/nemotron-nano-9b-v2:free": {
|
|
|
- "input_cost_per_token": 0,
|
|
|
- "litellm_provider": "openrouter",
|
|
|
- "max_tokens": 128000,
|
|
|
- "mode": "chat",
|
|
|
- "output_cost_per_token": 0,
|
|
|
- "source": "https://openrouter.ai/nvidia/nemotron-nano-9b-v2:free",
|
|
|
- "supports_tool_choice": true
|
|
|
- },
|
|
|
"openrouter/openai/gpt-3.5-turbo": {
|
|
|
"input_cost_per_token": 1.5e-06,
|
|
|
"litellm_provider": "openrouter",
|
|
|
@@ -22910,6 +23018,15 @@
|
|
|
"supports_function_calling": true,
|
|
|
"supports_tool_choice": true
|
|
|
},
|
|
|
+ "vertex_ai/mistral-ocr-2505": {
|
|
|
+ "litellm_provider": "vertex_ai",
|
|
|
+ "mode": "ocr",
|
|
|
+ "ocr_cost_per_page": 5e-4,
|
|
|
+ "supported_endpoints": [
|
|
|
+ "/v1/ocr"
|
|
|
+ ],
|
|
|
+ "source": "https://cloud.google.com/generative-ai-app-builder/pricing"
|
|
|
+ },
|
|
|
"vertex_ai/openai/gpt-oss-120b-maas": {
|
|
|
"input_cost_per_token": 1.5e-07,
|
|
|
"litellm_provider": "vertex_ai-openai_models",
|
|
|
@@ -24081,16 +24198,6 @@
|
|
|
"1280x720"
|
|
|
]
|
|
|
},
|
|
|
- "openai/container": {
|
|
|
- "code_interpreter_cost_per_session": 0.03,
|
|
|
- "litellm_provider": "openai",
|
|
|
- "mode": "container"
|
|
|
- },
|
|
|
- "azure/container": {
|
|
|
- "code_interpreter_cost_per_session": 0.03,
|
|
|
- "litellm_provider": "azure",
|
|
|
- "mode": "container"
|
|
|
- },
|
|
|
"azure/sora-2": {
|
|
|
"litellm_provider": "azure",
|
|
|
"mode": "video_generation",
|