diff --git a/model_cost_data/model_prices_and_context_window.json b/model_cost_data/model_prices_and_context_window.json index e345815f..4795c6d8 100644 --- a/model_cost_data/model_prices_and_context_window.json +++ b/model_cost_data/model_prices_and_context_window.json @@ -15,6 +15,7 @@ "supports_prompt_caching": true, "supports_response_schema": true, "supports_system_messages": true, + "supports_reasoning": true, "supports_web_search": true, "search_context_cost_per_query": { "search_context_size_low": 0.0000, @@ -379,7 +380,9 @@ "supports_response_schema": true, "supports_tool_choice": true, "supports_native_streaming": false, + "supports_reasoning": true, "supported_modalities": ["text", "image"], + "supported_output_modalities": ["text"], "supported_endpoints": ["/v1/responses", "/v1/batch"] }, "o1-pro-2025-03-19": { @@ -400,7 +403,9 @@ "supports_response_schema": true, "supports_tool_choice": true, "supports_native_streaming": false, + "supports_reasoning": true, "supported_modalities": ["text", "image"], + "supported_output_modalities": ["text"], "supported_endpoints": ["/v1/responses", "/v1/batch"] }, "o1": { @@ -418,6 +423,7 @@ "supports_prompt_caching": true, "supports_system_messages": true, "supports_response_schema": true, + "supports_reasoning": true, "supports_tool_choice": true }, "o1-mini": { @@ -446,6 +452,7 @@ "supports_vision": false, "supports_prompt_caching": true, "supports_response_schema": true, + "supports_reasoning": true, "supports_tool_choice": true }, "o3-mini-2025-01-31": { @@ -462,6 +469,7 @@ "supports_vision": false, "supports_prompt_caching": true, "supports_response_schema": true, + "supports_reasoning": true, "supports_tool_choice": true }, "o1-mini-2024-09-12": { @@ -474,6 +482,7 @@ "litellm_provider": "openai", "mode": "chat", "supports_vision": true, + "supports_reasoning": true, "supports_prompt_caching": true }, "o1-preview": { @@ -486,6 +495,7 @@ "litellm_provider": "openai", "mode": "chat", "supports_vision": true, + 
"supports_reasoning": true, "supports_prompt_caching": true }, "o1-preview-2024-09-12": { @@ -498,6 +508,7 @@ "litellm_provider": "openai", "mode": "chat", "supports_vision": true, + "supports_reasoning": true, "supports_prompt_caching": true }, "o1-2024-12-17": { @@ -515,6 +526,7 @@ "supports_prompt_caching": true, "supports_system_messages": true, "supports_response_schema": true, + "supports_reasoning": true, "supports_tool_choice": true }, "chatgpt-4o-latest": { @@ -1286,6 +1298,68 @@ "supports_system_messages": true, "supports_tool_choice": true }, + "azure/gpt-4o-realtime-preview-2024-12-17": { + "max_tokens": 4096, + "max_input_tokens": 128000, + "max_output_tokens": 4096, + "input_cost_per_token": 0.000005, + "input_cost_per_audio_token": 0.00004, + "cache_read_input_token_cost": 0.0000025, + "output_cost_per_token": 0.00002, + "output_cost_per_audio_token": 0.00008, + "litellm_provider": "azure", + "mode": "chat", + "supported_modalities": ["text", "audio"], + "supported_output_modalities": ["text", "audio"], + "supports_function_calling": true, + "supports_parallel_function_calling": true, + "supports_audio_input": true, + "supports_audio_output": true, + "supports_system_messages": true, + "supports_tool_choice": true + }, + "azure/us/gpt-4o-realtime-preview-2024-12-17": { + "max_tokens": 4096, + "max_input_tokens": 128000, + "max_output_tokens": 4096, + "input_cost_per_token": 5.5e-6, + "input_cost_per_audio_token": 44e-6, + "cache_read_input_token_cost": 2.75e-6, + "cache_read_input_audio_token_cost": 2.5e-6, + "output_cost_per_token": 22e-6, + "output_cost_per_audio_token": 80e-6, + "litellm_provider": "azure", + "mode": "chat", + "supported_modalities": ["text", "audio"], + "supported_output_modalities": ["text", "audio"], + "supports_function_calling": true, + "supports_parallel_function_calling": true, + "supports_audio_input": true, + "supports_audio_output": true, + "supports_system_messages": true, + "supports_tool_choice": true + }, + 
"azure/eu/gpt-4o-realtime-preview-2024-12-17": { + "max_tokens": 4096, + "max_input_tokens": 128000, + "max_output_tokens": 4096, + "input_cost_per_token": 5.5e-6, + "input_cost_per_audio_token": 44e-6, + "cache_read_input_token_cost": 2.75e-6, + "cache_read_input_audio_token_cost": 2.5e-6, + "output_cost_per_token": 22e-6, + "output_cost_per_audio_token": 80e-6, + "litellm_provider": "azure", + "mode": "chat", + "supported_modalities": ["text", "audio"], + "supported_output_modalities": ["text", "audio"], + "supports_function_calling": true, + "supports_parallel_function_calling": true, + "supports_audio_input": true, + "supports_audio_output": true, + "supports_system_messages": true, + "supports_tool_choice": true + }, "azure/gpt-4o-realtime-preview-2024-10-01": { "max_tokens": 4096, "max_input_tokens": 128000, @@ -1352,6 +1426,7 @@ "cache_read_input_token_cost": 0.00000055, "litellm_provider": "azure", "mode": "chat", + "supports_reasoning": true, "supports_vision": false, "supports_prompt_caching": true, "supports_tool_choice": true @@ -1368,6 +1443,7 @@ "litellm_provider": "azure", "mode": "chat", "supports_vision": false, + "supports_reasoning": true, "supports_prompt_caching": true, "supports_tool_choice": true }, @@ -1383,6 +1459,7 @@ "litellm_provider": "azure", "mode": "chat", "supports_vision": false, + "supports_reasoning": true, "supports_prompt_caching": true, "supports_tool_choice": true }, @@ -1413,6 +1490,7 @@ "mode": "chat", "supports_vision": false, "supports_prompt_caching": true, + "supports_reasoning": true, "supports_response_schema": true, "supports_tool_choice": true }, @@ -1428,6 +1506,7 @@ "supports_function_calling": true, "supports_parallel_function_calling": true, "supports_vision": false, + "supports_reasoning": true, "supports_prompt_caching": true }, "azure/o1-mini-2024-09-12": { @@ -1442,6 +1521,7 @@ "supports_function_calling": true, "supports_parallel_function_calling": true, "supports_vision": false, + "supports_reasoning": 
true, "supports_prompt_caching": true }, "azure/us/o1-mini-2024-09-12": { @@ -1488,6 +1568,7 @@ "supports_function_calling": true, "supports_parallel_function_calling": true, "supports_vision": true, + "supports_reasoning": true, "supports_prompt_caching": true, "supports_tool_choice": true }, @@ -1503,6 +1584,7 @@ "supports_function_calling": true, "supports_parallel_function_calling": true, "supports_vision": true, + "supports_reasoning": true, "supports_prompt_caching": true, "supports_tool_choice": true }, @@ -1548,6 +1630,7 @@ "supports_function_calling": true, "supports_parallel_function_calling": true, "supports_vision": false, + "supports_reasoning": true, "supports_prompt_caching": true }, "azure/o1-preview-2024-09-12": { @@ -1562,6 +1645,7 @@ "supports_function_calling": true, "supports_parallel_function_calling": true, "supports_vision": false, + "supports_reasoning": true, "supports_prompt_caching": true }, "azure/us/o1-preview-2024-09-12": { @@ -2220,6 +2304,7 @@ "litellm_provider": "azure_ai", "mode": "chat", "supports_tool_choice": true, + "supports_reasoning": true, "source": "https://techcommunity.microsoft.com/blog/machinelearningblog/deepseek-r1-improved-performance-higher-limits-and-transparent-pricing/4386367" }, "azure_ai/deepseek-v3": { @@ -2300,6 +2385,18 @@ "source": "https://azuremarketplace.microsoft.com/en/marketplace/apps/000-000.mistral-ai-large-2407-offer?tab=Overview", "supports_tool_choice": true }, + "azure_ai/mistral-large-latest": { + "max_tokens": 4096, + "max_input_tokens": 128000, + "max_output_tokens": 4096, + "input_cost_per_token": 0.000002, + "output_cost_per_token": 0.000006, + "litellm_provider": "azure_ai", + "supports_function_calling": true, + "mode": "chat", + "source": "https://azuremarketplace.microsoft.com/en/marketplace/apps/000-000.mistral-ai-large-2407-offer?tab=Overview", + "supports_tool_choice": true + }, "azure_ai/ministral-3b": { "max_tokens": 4096, "max_input_tokens": 128000, @@ -2397,25 +2494,26 @@ 
"max_tokens": 4096, "max_input_tokens": 131072, "max_output_tokens": 4096, - "input_cost_per_token": 0, - "output_cost_per_token": 0, + "input_cost_per_token": 0.000000075, + "output_cost_per_token": 0.0000003, "litellm_provider": "azure_ai", "mode": "chat", "supports_function_calling": true, - "source": "https://learn.microsoft.com/en-us/azure/ai-foundry/concepts/models-featured#microsoft" + "source": "https://techcommunity.microsoft.com/blog/Azure-AI-Services-blog/announcing-new-phi-pricing-empowering-your-business-with-small-language-models/4395112" }, "azure_ai/Phi-4-multimodal-instruct": { "max_tokens": 4096, "max_input_tokens": 131072, "max_output_tokens": 4096, - "input_cost_per_token": 0, - "output_cost_per_token": 0, + "input_cost_per_token": 0.00000008, + "input_cost_per_audio_token": 0.000004, + "output_cost_per_token": 0.00000032, "litellm_provider": "azure_ai", "mode": "chat", "supports_audio_input": true, "supports_function_calling": true, "supports_vision": true, - "source": "https://learn.microsoft.com/en-us/azure/ai-foundry/concepts/models-featured#microsoft" + "source": "https://techcommunity.microsoft.com/blog/Azure-AI-Services-blog/announcing-new-phi-pricing-empowering-your-business-with-small-language-models/4395112" }, "azure_ai/Phi-4": { "max_tokens": 16384, @@ -2907,6 +3005,7 @@ "supports_function_calling": true, "supports_assistant_prefill": true, "supports_tool_choice": true, + "supports_reasoning": true, "supports_prompt_caching": true }, "deepseek/deepseek-chat": { @@ -3020,6 +3119,87 @@ "supports_vision": true, "supports_tool_choice": true }, + "xai/grok-3-beta": { + "max_tokens": 131072, + "max_input_tokens": 131072, + "max_output_tokens": 131072, + "input_cost_per_token": 0.000003, + "output_cost_per_token": 0.000015, + "litellm_provider": "xai", + "mode": "chat", + "supports_function_calling": true, + "supports_tool_choice": true, + "supports_response_schema": false, + "source": "https://x.ai/api#pricing" + }, + "xai/grok-3-fast-beta": 
{ + "max_tokens": 131072, + "max_input_tokens": 131072, + "max_output_tokens": 131072, + "input_cost_per_token": 0.000005, + "output_cost_per_token": 0.000025, + "litellm_provider": "xai", + "mode": "chat", + "supports_function_calling": true, + "supports_tool_choice": true, + "supports_response_schema": false, + "source": "https://x.ai/api#pricing" + }, + "xai/grok-3-fast-latest": { + "max_tokens": 131072, + "max_input_tokens": 131072, + "max_output_tokens": 131072, + "input_cost_per_token": 0.000005, + "output_cost_per_token": 0.000025, + "litellm_provider": "xai", + "mode": "chat", + "supports_function_calling": true, + "supports_tool_choice": true, + "supports_response_schema": false, + "source": "https://x.ai/api#pricing" + }, + "xai/grok-3-mini-beta": { + "max_tokens": 131072, + "max_input_tokens": 131072, + "max_output_tokens": 131072, + "input_cost_per_token": 0.0000003, + "output_cost_per_token": 0.0000005, + "litellm_provider": "xai", + "mode": "chat", + "supports_function_calling": true, + "supports_tool_choice": true, + "supports_reasoning": true, + "supports_response_schema": false, + "source": "https://x.ai/api#pricing" + }, + "xai/grok-3-mini-fast-beta": { + "max_tokens": 131072, + "max_input_tokens": 131072, + "max_output_tokens": 131072, + "input_cost_per_token": 0.0000006, + "output_cost_per_token": 0.000004, + "litellm_provider": "xai", + "mode": "chat", + "supports_function_calling": true, + "supports_tool_choice": true, + "supports_reasoning": true, + "supports_response_schema": false, + "source": "https://x.ai/api#pricing" + }, + "xai/grok-3-mini-fast-latest": { + "max_tokens": 131072, + "max_input_tokens": 131072, + "max_output_tokens": 131072, + "input_cost_per_token": 0.0000006, + "output_cost_per_token": 0.000004, + "litellm_provider": "xai", + "mode": "chat", + "supports_reasoning": true, + "supports_function_calling": true, + "supports_tool_choice": true, + "supports_response_schema": false, + "source": "https://x.ai/api#pricing" + }, 
"xai/grok-vision-beta": { "max_tokens": 8192, "max_input_tokens": 8192, @@ -3090,6 +3270,7 @@ "mode": "chat", "supports_system_messages": false, "supports_function_calling": false, + "supports_reasoning": true, "supports_response_schema": false, "supports_tool_choice": true }, @@ -3455,7 +3636,7 @@ "input_cost_per_token": 0.0000008, "output_cost_per_token": 0.000004, "cache_creation_input_token_cost": 0.000001, - "cache_read_input_token_cost": 0.0000008, + "cache_read_input_token_cost": 0.00000008, "litellm_provider": "anthropic", "mode": "chat", "supports_function_calling": true, @@ -3601,7 +3782,8 @@ "supports_prompt_caching": true, "supports_response_schema": true, "deprecation_date": "2025-06-01", - "supports_tool_choice": true + "supports_tool_choice": true, + "supports_reasoning": true }, "claude-3-7-sonnet-20250219": { "max_tokens": 128000, @@ -3621,7 +3803,8 @@ "supports_prompt_caching": true, "supports_response_schema": true, "deprecation_date": "2026-02-01", - "supports_tool_choice": true + "supports_tool_choice": true, + "supports_reasoning": true }, "claude-3-5-sonnet-20241022": { "max_tokens": 8192, @@ -4499,20 +4682,10 @@ "max_audio_length_hours": 8.4, "max_audio_per_prompt": 1, "max_pdf_size_mb": 30, - "input_cost_per_image": 0, - "input_cost_per_video_per_second": 0, - "input_cost_per_audio_per_second": 0, - "input_cost_per_token": 0, - "input_cost_per_character": 0, - "input_cost_per_token_above_128k_tokens": 0, - "input_cost_per_character_above_128k_tokens": 0, - "input_cost_per_image_above_128k_tokens": 0, - "input_cost_per_video_per_second_above_128k_tokens": 0, - "input_cost_per_audio_per_second_above_128k_tokens": 0, - "output_cost_per_token": 0, - "output_cost_per_character": 0, - "output_cost_per_token_above_128k_tokens": 0, - "output_cost_per_character_above_128k_tokens": 0, + "input_cost_per_token": 0.00000125, + "input_cost_per_token_above_200k_tokens": 0.0000025, + "output_cost_per_token": 0.00001, + 
"output_cost_per_token_above_200k_tokens": 0.000015, "litellm_provider": "vertex_ai-language-models", "mode": "chat", "supports_system_messages": true, @@ -4523,6 +4696,9 @@ "supports_pdf_input": true, "supports_response_schema": true, "supports_tool_choice": true, + "supported_endpoints": ["/v1/chat/completions", "/v1/completions"], + "supported_modalities": ["text", "image", "audio", "video"], + "supported_output_modalities": ["text"], "source": "https://cloud.google.com/vertex-ai/generative-ai/pricing" }, "gemini-2.0-pro-exp-02-05": { @@ -4535,20 +4711,10 @@ "max_audio_length_hours": 8.4, "max_audio_per_prompt": 1, "max_pdf_size_mb": 30, - "input_cost_per_image": 0, - "input_cost_per_video_per_second": 0, - "input_cost_per_audio_per_second": 0, - "input_cost_per_token": 0, - "input_cost_per_character": 0, - "input_cost_per_token_above_128k_tokens": 0, - "input_cost_per_character_above_128k_tokens": 0, - "input_cost_per_image_above_128k_tokens": 0, - "input_cost_per_video_per_second_above_128k_tokens": 0, - "input_cost_per_audio_per_second_above_128k_tokens": 0, - "output_cost_per_token": 0, - "output_cost_per_character": 0, - "output_cost_per_token_above_128k_tokens": 0, - "output_cost_per_character_above_128k_tokens": 0, + "input_cost_per_token": 0.00000125, + "input_cost_per_token_above_200k_tokens": 0.0000025, + "output_cost_per_token": 0.00001, + "output_cost_per_token_above_200k_tokens": 0.000015, "litellm_provider": "vertex_ai-language-models", "mode": "chat", "supports_system_messages": true, @@ -4559,6 +4725,9 @@ "supports_pdf_input": true, "supports_response_schema": true, "supports_tool_choice": true, + "supported_endpoints": ["/v1/chat/completions", "/v1/completions"], + "supported_modalities": ["text", "image", "audio", "video"], + "supported_output_modalities": ["text"], "source": "https://cloud.google.com/vertex-ai/generative-ai/pricing" }, "gemini-2.0-flash-exp": { @@ -4592,6 +4761,8 @@ "supports_vision": true, "supports_response_schema": true, 
"supports_audio_output": true, + "supported_modalities": ["text", "image", "audio", "video"], + "supported_output_modalities": ["text", "image"], "source": "https://cloud.google.com/vertex-ai/generative-ai/pricing", "supports_tool_choice": true }, @@ -4616,6 +4787,8 @@ "supports_response_schema": true, "supports_audio_output": true, "supports_tool_choice": true, + "supported_modalities": ["text", "image", "audio", "video"], + "supported_output_modalities": ["text", "image"], "source": "https://cloud.google.com/vertex-ai/generative-ai/pricing" }, "gemini-2.0-flash-thinking-exp": { @@ -4649,6 +4822,8 @@ "supports_vision": true, "supports_response_schema": true, "supports_audio_output": true, + "supported_modalities": ["text", "image", "audio", "video"], + "supported_output_modalities": ["text", "image"], "source": "https://cloud.google.com/vertex-ai/generative-ai/docs/learn/models#gemini-2.0-flash", "supports_tool_choice": true }, @@ -4683,6 +4858,8 @@ "supports_vision": true, "supports_response_schema": false, "supports_audio_output": false, + "supported_modalities": ["text", "image", "audio", "video"], + "supported_output_modalities": ["text", "image"], "source": "https://cloud.google.com/vertex-ai/generative-ai/docs/learn/models#gemini-2.0-flash", "supports_tool_choice": true }, @@ -4708,6 +4885,7 @@ "supports_audio_output": true, "supports_audio_input": true, "supported_modalities": ["text", "image", "audio", "video"], + "supported_output_modalities": ["text", "image"], "supports_tool_choice": true, "source": "https://ai.google.dev/pricing#2_0flash" }, @@ -4730,6 +4908,32 @@ "supports_vision": true, "supports_response_schema": true, "supports_audio_output": true, + "supported_modalities": ["text", "image", "audio", "video"], + "supported_output_modalities": ["text"], + "source": "https://cloud.google.com/vertex-ai/generative-ai/docs/learn/models#gemini-2.0-flash", + "supports_tool_choice": true + }, + "gemini-2.0-flash-lite-001": { + "max_input_tokens": 1048576, 
+ "max_output_tokens": 8192, + "max_images_per_prompt": 3000, + "max_videos_per_prompt": 10, + "max_video_length": 1, + "max_audio_length_hours": 8.4, + "max_audio_per_prompt": 1, + "max_pdf_size_mb": 50, + "input_cost_per_audio_token": 0.000000075, + "input_cost_per_token": 0.000000075, + "output_cost_per_token": 0.0000003, + "litellm_provider": "vertex_ai-language-models", + "mode": "chat", + "supports_system_messages": true, + "supports_function_calling": true, + "supports_vision": true, + "supports_response_schema": true, + "supports_audio_output": true, + "supported_modalities": ["text", "image", "audio", "video"], + "supported_output_modalities": ["text"], "source": "https://cloud.google.com/vertex-ai/generative-ai/docs/learn/models#gemini-2.0-flash", "supports_tool_choice": true }, @@ -4795,6 +4999,7 @@ "supports_audio_output": true, "supports_audio_input": true, "supported_modalities": ["text", "image", "audio", "video"], + "supported_output_modalities": ["text", "image"], "supports_tool_choice": true, "source": "https://ai.google.dev/pricing#2_0flash" }, @@ -4820,6 +5025,8 @@ "supports_response_schema": true, "supports_audio_output": true, "supports_tool_choice": true, + "supported_modalities": ["text", "image", "audio", "video"], + "supported_output_modalities": ["text"], "source": "https://ai.google.dev/gemini-api/docs/pricing#gemini-2.0-flash-lite" }, "gemini/gemini-2.0-flash-001": { @@ -4845,6 +5052,8 @@ "supports_response_schema": true, "supports_audio_output": false, "supports_tool_choice": true, + "supported_modalities": ["text", "image", "audio", "video"], + "supported_output_modalities": ["text", "image"], "source": "https://ai.google.dev/pricing#2_0flash" }, "gemini/gemini-2.5-pro-preview-03-25": { @@ -4859,9 +5068,9 @@ "max_pdf_size_mb": 30, "input_cost_per_audio_token": 0.0000007, "input_cost_per_token": 0.00000125, - "input_cost_per_token_above_128k_tokens": 0.0000025, - "output_cost_per_token": 0.0000010, - 
"output_cost_per_token_above_128k_tokens": 0.000015, + "input_cost_per_token_above_200k_tokens": 0.0000025, + "output_cost_per_token": 0.00001, + "output_cost_per_token_above_200k_tokens": 0.000015, "litellm_provider": "gemini", "mode": "chat", "rpm": 10000, @@ -4872,6 +5081,8 @@ "supports_response_schema": true, "supports_audio_output": false, "supports_tool_choice": true, + "supported_modalities": ["text", "image", "audio", "video"], + "supported_output_modalities": ["text"], "source": "https://ai.google.dev/gemini-api/docs/pricing#gemini-2.5-pro-preview" }, "gemini/gemini-2.0-flash-exp": { @@ -4907,6 +5118,8 @@ "supports_audio_output": true, "tpm": 4000000, "rpm": 10, + "supported_modalities": ["text", "image", "audio", "video"], + "supported_output_modalities": ["text", "image"], "source": "https://cloud.google.com/vertex-ai/generative-ai/docs/learn/models#gemini-2.0-flash", "supports_tool_choice": true }, @@ -4933,6 +5146,8 @@ "supports_response_schema": true, "supports_audio_output": false, "supports_tool_choice": true, + "supported_modalities": ["text", "image", "audio", "video"], + "supported_output_modalities": ["text"], "source": "https://cloud.google.com/vertex-ai/generative-ai/docs/learn/models#gemini-2.0-flash-lite" }, "gemini/gemini-2.0-flash-thinking-exp": { @@ -4968,6 +5183,8 @@ "supports_audio_output": true, "tpm": 4000000, "rpm": 10, + "supported_modalities": ["text", "image", "audio", "video"], + "supported_output_modalities": ["text", "image"], "source": "https://cloud.google.com/vertex-ai/generative-ai/docs/learn/models#gemini-2.0-flash", "supports_tool_choice": true }, @@ -5004,6 +5221,8 @@ "supports_audio_output": true, "tpm": 4000000, "rpm": 10, + "supported_modalities": ["text", "image", "audio", "video"], + "supported_output_modalities": ["text", "image"], "source": "https://cloud.google.com/vertex-ai/generative-ai/docs/learn/models#gemini-2.0-flash", "supports_tool_choice": true }, @@ -5163,6 +5382,7 @@ "supports_prompt_caching": true, 
"supports_response_schema": true, "deprecation_date": "2025-06-01", + "supports_reasoning": true, "supports_tool_choice": true }, "vertex_ai/claude-3-haiku": { @@ -6480,6 +6700,7 @@ "mode": "chat", "supports_function_calling": true, "supports_assistant_prefill": true, + "supports_reasoning": true, "supports_tool_choice": true, "supports_prompt_caching": true }, @@ -6655,6 +6876,7 @@ "mode": "chat", "supports_function_calling": true, "supports_vision": true, + "supports_reasoning": true, "tool_use_system_prompt_tokens": 159, "supports_assistant_prefill": true, "supports_tool_choice": true @@ -6670,6 +6892,7 @@ "mode": "chat", "supports_function_calling": true, "supports_vision": true, + "supports_reasoning": true, "tool_use_system_prompt_tokens": 159, "supports_tool_choice": true }, @@ -6837,6 +7060,7 @@ "litellm_provider": "openrouter", "mode": "chat", "supports_function_calling": true, + "supports_reasoning": true, "supports_parallel_function_calling": true, "supports_vision": false, "supports_tool_choice": true @@ -6850,6 +7074,7 @@ "litellm_provider": "openrouter", "mode": "chat", "supports_function_calling": true, + "supports_reasoning": true, "supports_parallel_function_calling": true, "supports_vision": false, "supports_tool_choice": true @@ -7667,6 +7892,7 @@ "supports_assistant_prefill": true, "supports_prompt_caching": true, "supports_response_schema": true, + "supports_reasoning": true, "supports_tool_choice": true }, "anthropic.claude-3-5-sonnet-20241022-v2:0": { @@ -7784,7 +8010,8 @@ "supports_assistant_prefill": true, "supports_prompt_caching": true, "supports_response_schema": true, - "supports_tool_choice": true + "supports_tool_choice": true, + "supports_reasoning": true }, "us.anthropic.claude-3-haiku-20240307-v1:0": { "max_tokens": 4096, @@ -8444,7 +8671,8 @@ "input_cost_per_token": 0.0000015, "output_cost_per_token": 0.0000020, "litellm_provider": "bedrock", - "mode": "chat" + "mode": "chat", + "supports_tool_choice": true }, 
"bedrock/*/1-month-commitment/cohere.command-text-v14": { "max_tokens": 4096, @@ -8453,7 +8681,8 @@ "input_cost_per_second": 0.011, "output_cost_per_second": 0.011, "litellm_provider": "bedrock", - "mode": "chat" + "mode": "chat", + "supports_tool_choice": true }, "bedrock/*/6-month-commitment/cohere.command-text-v14": { "max_tokens": 4096, @@ -8462,7 +8691,8 @@ "input_cost_per_second": 0.0066027, "output_cost_per_second": 0.0066027, "litellm_provider": "bedrock", - "mode": "chat" + "mode": "chat", + "supports_tool_choice": true }, "cohere.command-light-text-v14": { "max_tokens": 4096, @@ -8471,7 +8701,8 @@ "input_cost_per_token": 0.0000003, "output_cost_per_token": 0.0000006, "litellm_provider": "bedrock", - "mode": "chat" + "mode": "chat", + "supports_tool_choice": true }, "bedrock/*/1-month-commitment/cohere.command-light-text-v14": { "max_tokens": 4096, @@ -8480,7 +8711,8 @@ "input_cost_per_second": 0.001902, "output_cost_per_second": 0.001902, "litellm_provider": "bedrock", - "mode": "chat" + "mode": "chat", + "supports_tool_choice": true }, "bedrock/*/6-month-commitment/cohere.command-light-text-v14": { "max_tokens": 4096, @@ -8489,7 +8721,8 @@ "input_cost_per_second": 0.0011416, "output_cost_per_second": 0.0011416, "litellm_provider": "bedrock", - "mode": "chat" + "mode": "chat", + "supports_tool_choice": true }, "cohere.command-r-plus-v1:0": { "max_tokens": 4096, @@ -8498,7 +8731,8 @@ "input_cost_per_token": 0.0000030, "output_cost_per_token": 0.000015, "litellm_provider": "bedrock", - "mode": "chat" + "mode": "chat", + "supports_tool_choice": true }, "cohere.command-r-v1:0": { "max_tokens": 4096, @@ -8507,7 +8741,8 @@ "input_cost_per_token": 0.0000005, "output_cost_per_token": 0.0000015, "litellm_provider": "bedrock", - "mode": "chat" + "mode": "chat", + "supports_tool_choice": true }, "cohere.embed-english-v3": { "max_tokens": 512, @@ -8535,6 +8770,7 @@ "output_cost_per_token": 0.0000054, "litellm_provider": "bedrock_converse", "mode": "chat", + 
"supports_reasoning": true, "supports_function_calling": false, "supports_tool_choice": false @@ -10361,7 +10597,8 @@ "metadata": {"notes": "Input/output cost per token is dbu cost * $0.070, based on databricks Claude 3.7 conversion. Number provided for reference, '*_dbu_cost_per_token' used in actual calculation."}, "supports_assistant_prefill": true, "supports_function_calling": true, - "supports_tool_choice": true + "supports_tool_choice": true, + "supports_reasoning": true }, "databricks/databricks-meta-llama-3-1-405b-instruct": { "max_tokens": 128000, @@ -10619,6 +10856,7 @@ "max_input_tokens": 32768, "max_output_tokens": 8192, "litellm_provider": "snowflake", + "supports_reasoning": true, "mode": "chat" }, "snowflake/snowflake-arctic": {