|
|
@@ -11773,10 +11773,12 @@
|
|
|
"supports_web_search": true
|
|
|
},
|
|
|
"gemini-3-pro-preview": {
|
|
|
- "cache_read_input_token_cost": 1.25e-07,
|
|
|
+ "cache_read_input_token_cost": 2e-07,
|
|
|
+ "cache_read_input_token_cost_above_200k_tokens": 4e-07,
|
|
|
"cache_creation_input_token_cost_above_200k_tokens": 2.5e-07,
|
|
|
"input_cost_per_token": 2e-06,
|
|
|
"input_cost_per_token_above_200k_tokens": 4e-06,
|
|
|
+ "input_cost_per_token_batches": 1e-06,
|
|
|
"litellm_provider": "vertex_ai-language-models",
|
|
|
"max_audio_length_hours": 8.4,
|
|
|
"max_audio_per_prompt": 1,
|
|
|
@@ -11790,10 +11792,60 @@
|
|
|
"mode": "chat",
|
|
|
"output_cost_per_token": 1.2e-05,
|
|
|
"output_cost_per_token_above_200k_tokens": 1.8e-05,
|
|
|
+ "output_cost_per_token_batches": 6e-06,
|
|
|
"source": "https://cloud.google.com/vertex-ai/generative-ai/pricing",
|
|
|
"supported_endpoints": [
|
|
|
"/v1/chat/completions",
|
|
|
- "/v1/completions"
|
|
|
+ "/v1/completions",
|
|
|
+ "/v1/batch"
|
|
|
+ ],
|
|
|
+ "supported_modalities": [
|
|
|
+ "text",
|
|
|
+ "image",
|
|
|
+ "audio",
|
|
|
+ "video"
|
|
|
+ ],
|
|
|
+ "supported_output_modalities": [
|
|
|
+ "text"
|
|
|
+ ],
|
|
|
+ "supports_audio_input": true,
|
|
|
+ "supports_function_calling": true,
|
|
|
+ "supports_pdf_input": true,
|
|
|
+ "supports_prompt_caching": true,
|
|
|
+ "supports_reasoning": true,
|
|
|
+ "supports_response_schema": true,
|
|
|
+ "supports_system_messages": true,
|
|
|
+ "supports_tool_choice": true,
|
|
|
+ "supports_video_input": true,
|
|
|
+ "supports_vision": true,
|
|
|
+ "supports_web_search": true
|
|
|
+ },
|
|
|
+ "vertex_ai/gemini-3-pro-preview": {
|
|
|
+ "cache_read_input_token_cost": 2e-07,
|
|
|
+ "cache_read_input_token_cost_above_200k_tokens": 4e-07,
|
|
|
+ "cache_creation_input_token_cost_above_200k_tokens": 2.5e-07,
|
|
|
+ "input_cost_per_token": 2e-06,
|
|
|
+ "input_cost_per_token_above_200k_tokens": 4e-06,
|
|
|
+ "input_cost_per_token_batches": 1e-06,
|
|
|
+ "litellm_provider": "vertex_ai",
|
|
|
+ "max_audio_length_hours": 8.4,
|
|
|
+ "max_audio_per_prompt": 1,
|
|
|
+ "max_images_per_prompt": 3000,
|
|
|
+ "max_input_tokens": 1048576,
|
|
|
+ "max_output_tokens": 65535,
|
|
|
+ "max_pdf_size_mb": 30,
|
|
|
+ "max_tokens": 65535,
|
|
|
+ "max_video_length": 1,
|
|
|
+ "max_videos_per_prompt": 10,
|
|
|
+ "mode": "chat",
|
|
|
+ "output_cost_per_token": 1.2e-05,
|
|
|
+ "output_cost_per_token_above_200k_tokens": 1.8e-05,
|
|
|
+ "output_cost_per_token_batches": 6e-06,
|
|
|
+ "source": "https://cloud.google.com/vertex-ai/generative-ai/pricing",
|
|
|
+ "supported_endpoints": [
|
|
|
+ "/v1/chat/completions",
|
|
|
+ "/v1/completions",
|
|
|
+ "/v1/batch"
|
|
|
],
|
|
|
"supported_modalities": [
|
|
|
"text",
|
|
|
@@ -13476,9 +13528,11 @@
|
|
|
"tpm": 800000
|
|
|
},
|
|
|
"gemini/gemini-3-pro-preview": {
|
|
|
- "cache_read_input_token_cost": 3.125e-07,
|
|
|
+ "cache_read_input_token_cost": 2e-07,
|
|
|
+ "cache_read_input_token_cost_above_200k_tokens": 4e-07,
|
|
|
"input_cost_per_token": 2e-06,
|
|
|
"input_cost_per_token_above_200k_tokens": 4e-06,
|
|
|
+ "input_cost_per_token_batches": 1e-06,
|
|
|
"litellm_provider": "gemini",
|
|
|
"max_audio_length_hours": 8.4,
|
|
|
"max_audio_per_prompt": 1,
|
|
|
@@ -13492,11 +13546,13 @@
|
|
|
"mode": "chat",
|
|
|
"output_cost_per_token": 1.2e-05,
|
|
|
"output_cost_per_token_above_200k_tokens": 1.8e-05,
|
|
|
+ "output_cost_per_token_batches": 6e-06,
|
|
|
"rpm": 2000,
|
|
|
"source": "https://cloud.google.com/vertex-ai/generative-ai/pricing",
|
|
|
"supported_endpoints": [
|
|
|
"/v1/chat/completions",
|
|
|
- "/v1/completions"
|
|
|
+ "/v1/completions",
|
|
|
+ "/v1/batch"
|
|
|
],
|
|
|
"supported_modalities": [
|
|
|
"text",
|