diff --git a/model_prices_and_context_window.json b/model_prices_and_context_window.json index 43dc57c3..fa493052 100644 --- a/model_prices_and_context_window.json +++ b/model_prices_and_context_window.json @@ -24431,6 +24431,300 @@ "output_cost_per_token": 1e-06, "supports_tool_choice": true }, + "replicate/openai/gpt-5": { + "input_cost_per_token": 1.25e-06, + "output_cost_per_token": 1.0e-05, + "litellm_provider": "replicate", + "mode": "chat", + "supports_function_calling": true, + "supports_parallel_function_calling": true, + "supports_vision": true, + "supports_system_messages": true, + "supports_tool_choice": true, + "supports_response_schema": true + }, + "replicate/openai/gpt-oss-20b": { + "input_cost_per_token": 9.0e-08, + "output_cost_per_token": 3.6e-07, + "litellm_provider": "replicate", + "mode": "chat", + "supports_function_calling": true, + "supports_system_messages": true + }, + "replicate/anthropic/claude-4.5-haiku": { + "input_cost_per_token": 1.0e-06, + "output_cost_per_token": 5.0e-06, + "litellm_provider": "replicate", + "mode": "chat", + "supports_function_calling": true, + "supports_parallel_function_calling": true, + "supports_vision": true, + "supports_system_messages": true, + "supports_tool_choice": true, + "supports_response_schema": true, + "supports_prompt_caching": true + }, + "replicate/ibm-granite/granite-3.3-8b-instruct": { + "input_cost_per_token": 3.0e-08, + "output_cost_per_token": 2.5e-07, + "litellm_provider": "replicate", + "mode": "chat", + "supports_function_calling": true, + "supports_system_messages": true + }, + "replicate/openai/gpt-4o": { + "input_cost_per_token": 2.5e-06, + "output_cost_per_token": 1.0e-05, + "litellm_provider": "replicate", + "mode": "chat", + "supports_function_calling": true, + "supports_parallel_function_calling": true, + "supports_vision": true, + "supports_system_messages": true, + "supports_tool_choice": true, + "supports_response_schema": true, + "supports_audio_input": true, + 
"supports_audio_output": true + }, + "replicate/openai/o4-mini": { + "input_cost_per_token": 1.0e-06, + "output_cost_per_token": 4.0e-06, + "output_cost_per_reasoning_token": 4.0e-06, + "litellm_provider": "replicate", + "mode": "chat", + "supports_reasoning": true, + "supports_system_messages": true + }, + "replicate/openai/o1-mini": { + "input_cost_per_token": 1.1e-06, + "output_cost_per_token": 4.4e-06, + "output_cost_per_reasoning_token": 4.4e-06, + "litellm_provider": "replicate", + "mode": "chat", + "supports_reasoning": true, + "supports_system_messages": true + }, + "replicate/openai/o1": { + "input_cost_per_token": 1.5e-05, + "output_cost_per_token": 6.0e-05, + "output_cost_per_reasoning_token": 6.0e-05, + "litellm_provider": "replicate", + "mode": "chat", + "supports_reasoning": true, + "supports_system_messages": true + }, + "replicate/openai/gpt-4o-mini": { + "input_cost_per_token": 1.5e-07, + "output_cost_per_token": 6.0e-07, + "litellm_provider": "replicate", + "mode": "chat", + "supports_function_calling": true, + "supports_parallel_function_calling": true, + "supports_vision": true, + "supports_system_messages": true, + "supports_tool_choice": true, + "supports_response_schema": true + }, + "replicate/qwen/qwen3-235b-a22b-instruct-2507": { + "input_cost_per_token": 2.64e-07, + "output_cost_per_token": 1.06e-06, + "litellm_provider": "replicate", + "mode": "chat", + "supports_function_calling": true, + "supports_system_messages": true + }, + "replicate/anthropic/claude-4-sonnet": { + "input_cost_per_token": 3.0e-06, + "output_cost_per_token": 1.5e-05, + "litellm_provider": "replicate", + "mode": "chat", + "supports_function_calling": true, + "supports_parallel_function_calling": true, + "supports_vision": true, + "supports_system_messages": true, + "supports_tool_choice": true, + "supports_response_schema": true, + "supports_prompt_caching": true + }, + "replicate/deepseek-ai/deepseek-v3": { + "input_cost_per_token": 1.45e-06, + 
"output_cost_per_token": 1.45e-06, + "litellm_provider": "replicate", + "mode": "chat", + "max_input_tokens": 65536, + "max_output_tokens": 8192, + "max_tokens": 8192, + "supports_function_calling": true, + "supports_system_messages": true + }, + "replicate/anthropic/claude-3.7-sonnet": { + "input_cost_per_token": 3.0e-06, + "output_cost_per_token": 1.5e-05, + "litellm_provider": "replicate", + "mode": "chat", + "supports_function_calling": true, + "supports_parallel_function_calling": true, + "supports_vision": true, + "supports_system_messages": true, + "supports_tool_choice": true, + "supports_response_schema": true, + "supports_prompt_caching": true + }, + "replicate/anthropic/claude-3.5-haiku": { + "input_cost_per_token": 1.0e-06, + "output_cost_per_token": 5.0e-06, + "litellm_provider": "replicate", + "mode": "chat", + "supports_function_calling": true, + "supports_parallel_function_calling": true, + "supports_vision": true, + "supports_system_messages": true, + "supports_tool_choice": true, + "supports_response_schema": true, + "supports_prompt_caching": true + }, + "replicate/anthropic/claude-3.5-sonnet": { + "input_cost_per_token": 3.75e-06, + "output_cost_per_token": 1.875e-05, + "litellm_provider": "replicate", + "mode": "chat", + "supports_function_calling": true, + "supports_parallel_function_calling": true, + "supports_vision": true, + "supports_system_messages": true, + "supports_tool_choice": true, + "supports_response_schema": true, + "supports_prompt_caching": true + }, + "replicate/google/gemini-3-pro": { + "input_cost_per_token": 2.0e-06, + "output_cost_per_token": 1.2e-05, + "litellm_provider": "replicate", + "mode": "chat", + "supports_function_calling": true, + "supports_parallel_function_calling": true, + "supports_vision": true, + "supports_system_messages": true, + "supports_tool_choice": true, + "supports_response_schema": true + }, + "replicate/anthropic/claude-4.5-sonnet": { + "input_cost_per_token": 3.0e-06, + "output_cost_per_token": 
1.5e-05, + "litellm_provider": "replicate", + "mode": "chat", + "supports_function_calling": true, + "supports_parallel_function_calling": true, + "supports_vision": true, + "supports_system_messages": true, + "supports_tool_choice": true, + "supports_response_schema": true, + "supports_prompt_caching": true + }, + "replicate/openai/gpt-4.1": { + "input_cost_per_token": 2.0e-06, + "output_cost_per_token": 8.0e-06, + "litellm_provider": "replicate", + "mode": "chat", + "supports_function_calling": true, + "supports_parallel_function_calling": true, + "supports_vision": true, + "supports_system_messages": true, + "supports_tool_choice": true, + "supports_response_schema": true + }, + "replicate/openai/gpt-4.1-nano": { + "input_cost_per_token": 1.0e-07, + "output_cost_per_token": 4.0e-07, + "litellm_provider": "replicate", + "mode": "chat", + "supports_function_calling": true, + "supports_system_messages": true + }, + "replicate/openai/gpt-4.1-mini": { + "input_cost_per_token": 4.0e-07, + "output_cost_per_token": 1.6e-06, + "litellm_provider": "replicate", + "mode": "chat", + "supports_function_calling": true, + "supports_parallel_function_calling": true, + "supports_vision": true, + "supports_system_messages": true, + "supports_tool_choice": true, + "supports_response_schema": true + }, + "replicate/openai/gpt-5-nano": { + "input_cost_per_token": 5.0e-08, + "output_cost_per_token": 4.0e-07, + "litellm_provider": "replicate", + "mode": "chat", + "supports_function_calling": true, + "supports_system_messages": true + }, + "replicate/openai/gpt-5-mini": { + "input_cost_per_token": 2.5e-07, + "output_cost_per_token": 2.0e-06, + "litellm_provider": "replicate", + "mode": "chat", + "supports_function_calling": true, + "supports_parallel_function_calling": true, + "supports_vision": true, + "supports_system_messages": true, + "supports_tool_choice": true, + "supports_response_schema": true + }, + "replicate/google/gemini-2.5-flash": { + "input_cost_per_token": 2.5e-06, + 
"output_cost_per_token": 2.5e-06, + "litellm_provider": "replicate", + "mode": "chat", + "supports_function_calling": true, + "supports_parallel_function_calling": true, + "supports_vision": true, + "supports_system_messages": true, + "supports_tool_choice": true, + "supports_response_schema": true + }, + "replicate/openai/gpt-oss-120b": { + "input_cost_per_token": 1.8e-07, + "output_cost_per_token": 7.2e-07, + "litellm_provider": "replicate", + "mode": "chat", + "supports_function_calling": true, + "supports_system_messages": true + }, + "replicate/deepseek-ai/deepseek-v3.1": { + "input_cost_per_token": 6.72e-07, + "output_cost_per_token": 2.016e-06, + "litellm_provider": "replicate", + "mode": "chat", + "max_input_tokens": 163840, + "max_output_tokens": 163840, + "max_tokens": 163840, + "supports_function_calling": true, + "supports_reasoning": true, + "supports_system_messages": true + }, + "replicate/xai/grok-4": { + "input_cost_per_token": 7.2e-06, + "output_cost_per_token": 3.6e-05, + "litellm_provider": "replicate", + "mode": "chat", + "supports_function_calling": true, + "supports_system_messages": true + }, + "replicate/deepseek-ai/deepseek-r1": { + "input_cost_per_token": 3.75e-06, + "output_cost_per_token": 1.0e-05, + "output_cost_per_reasoning_token": 1.0e-05, + "litellm_provider": "replicate", + "mode": "chat", + "max_input_tokens": 65536, + "max_output_tokens": 8192, + "max_tokens": 8192, + "supports_reasoning": true, + "supports_system_messages": true + }, "rerank-english-v2.0": { "input_cost_per_query": 0.002, "input_cost_per_token": 0.0, diff --git a/model_prices_and_context_window.sha256 b/model_prices_and_context_window.sha256 index b7566f76..a38dbc2e 100644 --- a/model_prices_and_context_window.sha256 +++ b/model_prices_and_context_window.sha256 @@ -1 +1 @@ -ca27fe3d359323d7ed94397dac12fa51ead323473e576a88be967f4224801d78 +80ee19a79e02446d2e4d7052244de03033566c89b76130ce9f62991eac1c18e6