From c5069a06a4ec609ee62f3165aa12dcd09c4447bb Mon Sep 17 00:00:00 2001 From: "github-actions[bot]" <41898282+github-actions[bot]@users.noreply.github.com> Date: Tue, 13 Jan 2026 22:05:38 +0000 Subject: [PATCH] =?UTF-8?q?chore:=20=E5=90=8C=E6=AD=A5=E6=A8=A1=E5=9E=8B?= =?UTF-8?q?=E4=BB=B7=E6=A0=BC=E6=95=B0=E6=8D=AE=20(f12fec3516e45adc1566fd3?= =?UTF-8?q?05e063b03f3b3c2bcd97cb84be1a1c61f3df9d0ca)?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit --- model_prices_and_context_window.json | 444 +++++++++++++------------ model_prices_and_context_window.sha256 | 2 +- 2 files changed, 240 insertions(+), 206 deletions(-) diff --git a/model_prices_and_context_window.json b/model_prices_and_context_window.json index f818a2c8..0b97d876 100644 --- a/model_prices_and_context_window.json +++ b/model_prices_and_context_window.json @@ -32552,8 +32552,8 @@ "novita/deepseek/deepseek-v3.2": { "litellm_provider": "novita", "mode": "chat", - "input_cost_per_token": 2.69e-03, - "output_cost_per_token": 4e-03, + "input_cost_per_token": 2.69e-7, + "output_cost_per_token": 4e-7, "max_input_tokens": 163840, "max_output_tokens": 65536, "max_tokens": 65536, @@ -32562,15 +32562,15 @@ "supports_tool_choice": true, "supports_system_messages": true, "supports_response_schema": true, - "cache_read_input_token_cost": 1.345e-03, - "input_cost_per_token_cache_hit": 1.345e-03, + "cache_read_input_token_cost": 1.345e-7, + "input_cost_per_token_cache_hit": 1.345e-7, "supports_reasoning": true }, "novita/minimax/minimax-m2.1": { "litellm_provider": "novita", "mode": "chat", - "input_cost_per_token": 3e-03, - "output_cost_per_token": 1.2e-02, + "input_cost_per_token": 3e-7, + "output_cost_per_token": 1.2e-06, "max_input_tokens": 204800, "max_output_tokens": 131072, "max_tokens": 131072, @@ -32579,15 +32579,14 @@ "supports_tool_choice": true, "supports_system_messages": true, "supports_response_schema": true, - "cache_read_input_token_cost": 3e-04, - "input_cost_per_token_cache_hit": 3e-04, - "supports_reasoning": true + "cache_read_input_token_cost": 3e-8, + "input_cost_per_token_cache_hit": 3e-8 }, "novita/zai-org/glm-4.7": { "litellm_provider": "novita", "mode": "chat", - "input_cost_per_token": 6e-03, - "output_cost_per_token": 2.2e-02, + "input_cost_per_token": 6e-7, + "output_cost_per_token": 2.2e-06, "max_input_tokens": 204800, "max_output_tokens": 131072, "max_tokens": 131072, @@ -32596,15 +32595,15 @@ "supports_tool_choice": true, "supports_system_messages": true, "supports_response_schema": true, - "cache_read_input_token_cost": 1.1e-03, - "input_cost_per_token_cache_hit": 1.1e-03, + "cache_read_input_token_cost": 1.1e-7, + "input_cost_per_token_cache_hit": 1.1e-7, "supports_reasoning": true }, "novita/xiaomimimo/mimo-v2-flash": { "litellm_provider": "novita", "mode": "chat", - "input_cost_per_token": 1e-03, - "output_cost_per_token": 3e-03, + "input_cost_per_token": 1e-7, + "output_cost_per_token": 3e-7, "max_input_tokens": 262144, "max_output_tokens": 32000, "max_tokens": 32000, @@ -32613,15 +32612,15 @@ "supports_tool_choice": true, "supports_system_messages": true, "supports_response_schema": true, - "cache_read_input_token_cost": 2e-04, - "input_cost_per_token_cache_hit": 2e-04, + "cache_read_input_token_cost": 2e-8, + "input_cost_per_token_cache_hit": 2e-8, "supports_reasoning": true }, "novita/zai-org/autoglm-phone-9b-multilingual": { "litellm_provider": "novita", "mode": "chat", - "input_cost_per_token": 3.5e-04, - "output_cost_per_token": 1.38e-03, + "input_cost_per_token": 3.5e-8, + "output_cost_per_token": 1.38e-7, "max_input_tokens": 65536, "max_output_tokens": 65536, "max_tokens": 65536, @@ -32631,8 +32630,8 @@ "novita/moonshotai/kimi-k2-thinking": { "litellm_provider": "novita", "mode": "chat", - "input_cost_per_token": 4.8e-03, - "output_cost_per_token": 2e-02, + "input_cost_per_token": 6e-7, + "output_cost_per_token": 2.5e-06, "max_input_tokens": 262144, "max_output_tokens": 262144, "max_tokens": 262144, @@ -32646,8 +32645,8 @@ "novita/minimax/minimax-m2": { "litellm_provider": "novita", "mode": "chat", - "input_cost_per_token": 2.4e-03, - "output_cost_per_token": 9.6e-03, + "input_cost_per_token": 3e-7, + "output_cost_per_token": 1.2e-06, "max_input_tokens": 204800, "max_output_tokens": 131072, "max_tokens": 131072, @@ -32655,15 +32654,15 @@ "supports_parallel_function_calling": true, "supports_tool_choice": true, "supports_system_messages": true, - "cache_read_input_token_cost": 2.4e-04, - "input_cost_per_token_cache_hit": 2.4e-04, + "cache_read_input_token_cost": 3e-8, + "input_cost_per_token_cache_hit": 3e-8, "supports_reasoning": true }, "novita/paddlepaddle/paddleocr-vl": { "litellm_provider": "novita", "mode": "chat", - "input_cost_per_token": 1.6e-04, - "output_cost_per_token": 1.6e-04, + "input_cost_per_token": 2e-8, + "output_cost_per_token": 2e-8, "max_input_tokens": 16384, "max_output_tokens": 16384, "max_tokens": 16384, @@ -32673,8 +32672,8 @@ "novita/deepseek/deepseek-v3.2-exp": { "litellm_provider": "novita", "mode": "chat", - "input_cost_per_token": 2.16e-03, - "output_cost_per_token": 3.28e-03, + "input_cost_per_token": 2.7e-7, + "output_cost_per_token": 4.1e-7, "max_input_tokens": 163840, "max_output_tokens": 65536, "max_tokens": 65536, @@ -32688,8 +32687,8 @@ "novita/qwen/qwen3-vl-235b-a22b-thinking": { "litellm_provider": "novita", "mode": "chat", - "input_cost_per_token": 7.84e-03, - "output_cost_per_token": 3.16e-02, + "input_cost_per_token": 9.8e-7, + "output_cost_per_token": 3.95e-06, "max_input_tokens": 131072, "max_output_tokens": 32768, "max_tokens": 32768, @@ -32700,8 +32699,8 @@ "novita/zai-org/glm-4.6v": { "litellm_provider": "novita", "mode": "chat", - "input_cost_per_token": 3e-03, - "output_cost_per_token": 9e-03, + "input_cost_per_token": 3e-7, + "output_cost_per_token": 9e-7, "max_input_tokens": 131072, "max_output_tokens": 32768, "max_tokens": 32768, @@ -32711,15 +32710,15 @@ "supports_vision": true, "supports_system_messages": true, "supports_response_schema": true, - "cache_read_input_token_cost": 5.5e-04, - "input_cost_per_token_cache_hit": 5.5e-04, + "cache_read_input_token_cost": 5.5e-8, + "input_cost_per_token_cache_hit": 5.5e-8, "supports_reasoning": true }, "novita/zai-org/glm-4.6": { "litellm_provider": "novita", "mode": "chat", - "input_cost_per_token": 4.4e-03, - "output_cost_per_token": 1.76e-02, + "input_cost_per_token": 5.5e-7, + "output_cost_per_token": 2.2e-06, "max_input_tokens": 204800, "max_output_tokens": 131072, "max_tokens": 131072, @@ -32728,15 +32727,31 @@ "supports_tool_choice": true, "supports_system_messages": true, "supports_response_schema": true, - "cache_read_input_token_cost": 8.8e-04, - "input_cost_per_token_cache_hit": 8.8e-04, + "cache_read_input_token_cost": 1.1e-7, + "input_cost_per_token_cache_hit": 1.1e-7, "supports_reasoning": true }, + "novita/kwaipilot/kat-coder-pro": { + "litellm_provider": "novita", + "mode": "chat", + "input_cost_per_token": 3e-7, + "output_cost_per_token": 1.2e-06, + "max_input_tokens": 256000, + "max_output_tokens": 128000, + "max_tokens": 128000, + "supports_function_calling": true, + "supports_parallel_function_calling": true, + "supports_tool_choice": true, + "supports_system_messages": true, + "supports_response_schema": true, + "cache_read_input_token_cost": 6e-8, + "input_cost_per_token_cache_hit": 6e-8 + }, "novita/qwen/qwen3-next-80b-a3b-instruct": { "litellm_provider": "novita", "mode": "chat", - "input_cost_per_token": 1.2e-03, - "output_cost_per_token": 1.2e-02, + "input_cost_per_token": 1.5e-7, + "output_cost_per_token": 1.5e-06, "max_input_tokens": 131072, "max_output_tokens": 32768, "max_tokens": 32768, @@ -32749,8 +32764,8 @@ "novita/qwen/qwen3-next-80b-a3b-thinking": { "litellm_provider": "novita", "mode": "chat", - "input_cost_per_token": 1.2e-03, - "output_cost_per_token": 1.2e-02, + "input_cost_per_token": 1.5e-7, + "output_cost_per_token": 1.5e-06, "max_input_tokens": 131072, "max_output_tokens": 32768, "max_tokens": 32768, @@ -32764,8 +32779,8 @@ "novita/deepseek/deepseek-ocr": { "litellm_provider": "novita", "mode": "chat", - "input_cost_per_token": 2.4e-04, - "output_cost_per_token": 2.4e-04, + "input_cost_per_token": 3e-8, + "output_cost_per_token": 3e-8, "max_input_tokens": 8192, "max_output_tokens": 8192, "max_tokens": 8192, @@ -32777,8 +32792,8 @@ "novita/deepseek/deepseek-v3.1-terminus": { "litellm_provider": "novita", "mode": "chat", - "input_cost_per_token": 2.16e-03, - "output_cost_per_token": 8e-03, + "input_cost_per_token": 2.7e-7, + "output_cost_per_token": 1e-06, "max_input_tokens": 131072, "max_output_tokens": 32768, "max_tokens": 32768, @@ -32787,15 +32802,15 @@ "supports_tool_choice": true, "supports_system_messages": true, "supports_response_schema": true, - "cache_read_input_token_cost": 1.08e-03, - "input_cost_per_token_cache_hit": 1.08e-03, + "cache_read_input_token_cost": 1.35e-7, + "input_cost_per_token_cache_hit": 1.35e-7, "supports_reasoning": true }, "novita/qwen/qwen3-vl-235b-a22b-instruct": { "litellm_provider": "novita", "mode": "chat", - "input_cost_per_token": 2.4e-03, - "output_cost_per_token": 1.2e-02, + "input_cost_per_token": 3e-7, + "output_cost_per_token": 1.5e-06, "max_input_tokens": 131072, "max_output_tokens": 32768, "max_tokens": 32768, @@ -32809,8 +32824,8 @@ "novita/qwen/qwen3-max": { "litellm_provider": "novita", "mode": "chat", - "input_cost_per_token": 1.688e-02, - "output_cost_per_token": 6.76e-02, + "input_cost_per_token": 2.11e-06, + "output_cost_per_token": 8.45e-06, "max_input_tokens": 262144, "max_output_tokens": 65536, "max_tokens": 65536, @@ -32823,8 +32838,8 @@ "novita/skywork/r1v4-lite": { "litellm_provider": "novita", "mode": "chat", - "input_cost_per_token": 2e-03, - "output_cost_per_token": 6e-03, + "input_cost_per_token": 2e-7, + "output_cost_per_token": 6e-7, "max_input_tokens": 262144, "max_output_tokens": 65536, "max_tokens": 65536, @@ -32836,8 +32851,8 @@ "novita/deepseek/deepseek-v3.1": { "litellm_provider": "novita", "mode": "chat", - "input_cost_per_token": 2.16e-03, - "output_cost_per_token": 8e-03, + "input_cost_per_token": 2.7e-7, + "output_cost_per_token": 1e-06, "max_input_tokens": 131072, "max_output_tokens": 32768, "max_tokens": 32768, @@ -32846,15 +32861,15 @@ "supports_tool_choice": true, "supports_system_messages": true, "supports_response_schema": true, - "cache_read_input_token_cost": 1.08e-03, - "input_cost_per_token_cache_hit": 1.08e-03, + "cache_read_input_token_cost": 1.35e-7, + "input_cost_per_token_cache_hit": 1.35e-7, "supports_reasoning": true }, "novita/moonshotai/kimi-k2-0905": { "litellm_provider": "novita", "mode": "chat", - "input_cost_per_token": 4.8e-03, - "output_cost_per_token": 2e-02, + "input_cost_per_token": 6e-7, + "output_cost_per_token": 2.5e-06, "max_input_tokens": 262144, "max_output_tokens": 262144, "max_tokens": 262144, @@ -32867,8 +32882,8 @@ "novita/qwen/qwen3-coder-480b-a35b-instruct": { "litellm_provider": "novita", "mode": "chat", - "input_cost_per_token": 2.4e-03, - "output_cost_per_token": 1.04e-02, + "input_cost_per_token": 3e-7, + "output_cost_per_token": 1.3e-06, "max_input_tokens": 262144, "max_output_tokens": 65536, "max_tokens": 65536, @@ -32881,8 +32896,8 @@ "novita/qwen/qwen3-coder-30b-a3b-instruct": { "litellm_provider": "novita", "mode": "chat", - "input_cost_per_token": 7e-04, - "output_cost_per_token": 2.7e-03, + "input_cost_per_token": 7e-8, + "output_cost_per_token": 2.7e-7, "max_input_tokens": 160000, "max_output_tokens": 32768, "max_tokens": 32768, @@ -32895,8 +32910,8 @@ "novita/openai/gpt-oss-120b": { "litellm_provider": "novita", "mode": "chat", - "input_cost_per_token": 4e-04, - "output_cost_per_token": 2e-03, + "input_cost_per_token": 5e-8, + "output_cost_per_token": 2.5e-7, "max_input_tokens": 131072, "max_output_tokens": 32768, "max_tokens": 32768, @@ -32911,8 +32926,8 @@ "novita/moonshotai/kimi-k2-instruct": { "litellm_provider": "novita", "mode": "chat", - "input_cost_per_token": 4.56e-03, - "output_cost_per_token": 1.84e-02, + "input_cost_per_token": 5.7e-7, + "output_cost_per_token": 2.3e-06, "max_input_tokens": 131072, "max_output_tokens": 131072, "max_tokens": 131072, @@ -32925,8 +32940,8 @@ "novita/deepseek/deepseek-v3-0324": { "litellm_provider": "novita", "mode": "chat", - "input_cost_per_token": 2.16e-03, - "output_cost_per_token": 8.96e-03, + "input_cost_per_token": 2.7e-7, + "output_cost_per_token": 1.12e-06, "max_input_tokens": 163840, "max_output_tokens": 163840, "max_tokens": 163840, @@ -32935,14 +32950,14 @@ "supports_tool_choice": true, "supports_system_messages": true, "supports_response_schema": true, - "cache_read_input_token_cost": 1.08e-03, - "input_cost_per_token_cache_hit": 1.08e-03 + "cache_read_input_token_cost": 1.35e-7, + "input_cost_per_token_cache_hit": 1.35e-7 }, "novita/zai-org/glm-4.5": { "litellm_provider": "novita", "mode": "chat", - "input_cost_per_token": 4.8e-03, - "output_cost_per_token": 1.76e-02, + "input_cost_per_token": 6e-7, + "output_cost_per_token": 2.2e-06, "max_input_tokens": 131072, "max_output_tokens": 98304, "max_tokens": 98304, @@ -32950,15 +32965,15 @@ "supports_parallel_function_calling": true, "supports_tool_choice": true, "supports_system_messages": true, - "cache_read_input_token_cost": 8.8e-04, - "input_cost_per_token_cache_hit": 8.8e-04, + "cache_read_input_token_cost": 1.1e-7, + "input_cost_per_token_cache_hit": 1.1e-7, "supports_reasoning": true }, "novita/qwen/qwen3-235b-a22b-thinking-2507": { "litellm_provider": "novita", "mode": "chat", - "input_cost_per_token": 2.4e-03, - "output_cost_per_token": 2.4e-02, + "input_cost_per_token": 3e-7, + "output_cost_per_token": 3e-06, "max_input_tokens": 131072, "max_output_tokens": 32768, "max_tokens": 32768, @@ -32971,8 +32986,8 @@ "novita/meta-llama/llama-3.1-8b-instruct": { "litellm_provider": "novita", "mode": "chat", - "input_cost_per_token": 2e-04, - "output_cost_per_token": 5e-04, + "input_cost_per_token": 2e-8, + "output_cost_per_token": 5e-8, "max_input_tokens": 16384, "max_output_tokens": 16384, "max_tokens": 16384, @@ -32981,8 +32996,8 @@ "novita/google/gemma-3-12b-it": { "litellm_provider": "novita", "mode": "chat", - "input_cost_per_token": 4e-04, - "output_cost_per_token": 8e-04, + "input_cost_per_token": 5e-8, + "output_cost_per_token": 1e-7, "max_input_tokens": 131072, "max_output_tokens": 8192, "max_tokens": 8192, @@ -32994,8 +33009,8 @@ "novita/zai-org/glm-4.5v": { "litellm_provider": "novita", "mode": "chat", - "input_cost_per_token": 4.8e-03, - "output_cost_per_token": 1.44e-02, + "input_cost_per_token": 6e-7, + "output_cost_per_token": 1.8e-06, "max_input_tokens": 65536, "max_output_tokens": 16384, "max_tokens": 16384, @@ -33005,15 +33020,15 @@ "supports_vision": true, "supports_system_messages": true, "supports_response_schema": true, - "cache_read_input_token_cost": 8.8e-04, - "input_cost_per_token_cache_hit": 8.8e-04, + "cache_read_input_token_cost": 1.1e-7, + "input_cost_per_token_cache_hit": 1.1e-7, "supports_reasoning": true }, "novita/openai/gpt-oss-20b": { "litellm_provider": "novita", "mode": "chat", - "input_cost_per_token": 3.2e-04, - "output_cost_per_token": 1.2e-03, + "input_cost_per_token": 4e-8, + "output_cost_per_token": 1.5e-7, "max_input_tokens": 131072, "max_output_tokens": 32768, "max_tokens": 32768, @@ -33026,8 +33041,8 @@ "novita/qwen/qwen3-235b-a22b-instruct-2507": { "litellm_provider": "novita", "mode": "chat", - "input_cost_per_token": 7.2e-04, - "output_cost_per_token": 4.64e-03, + "input_cost_per_token": 9e-8, + "output_cost_per_token": 5.8e-7, "max_input_tokens": 131072, "max_output_tokens": 16384, "max_tokens": 16384, @@ -33040,8 +33055,8 @@ "novita/deepseek/deepseek-r1-distill-qwen-14b": { "litellm_provider": "novita", "mode": "chat", - "input_cost_per_token": 1.2e-03, - "output_cost_per_token": 1.2e-03, + "input_cost_per_token": 1.5e-7, + "output_cost_per_token": 1.5e-7, "max_input_tokens": 32768, "max_output_tokens": 16384, "max_tokens": 16384, @@ -33053,8 +33068,8 @@ "novita/meta-llama/llama-3.3-70b-instruct": { "litellm_provider": "novita", "mode": "chat", - "input_cost_per_token": 1.08e-03, - "output_cost_per_token": 3.2e-03, + "input_cost_per_token": 1.35e-7, + "output_cost_per_token": 4e-7, "max_input_tokens": 131072, "max_output_tokens": 120000, "max_tokens": 120000, @@ -33066,8 +33081,8 @@ "novita/qwen/qwen-2.5-72b-instruct": { "litellm_provider": "novita", "mode": "chat", - "input_cost_per_token": 3.04e-03, - "output_cost_per_token": 3.2e-03, + "input_cost_per_token": 3.8e-7, + "output_cost_per_token": 4e-7, "max_input_tokens": 32000, "max_output_tokens": 8192, "max_tokens": 8192, @@ -33080,8 +33095,8 @@ "novita/mistralai/mistral-nemo": { "litellm_provider": "novita", "mode": "chat", - "input_cost_per_token": 3.2e-04, - "output_cost_per_token": 1.36e-03, + "input_cost_per_token": 4e-8, + "output_cost_per_token": 1.7e-7, "max_input_tokens": 60288, "max_output_tokens": 16000, "max_tokens": 16000, @@ -33092,8 +33107,8 @@ "novita/minimaxai/minimax-m1-80k": { "litellm_provider": "novita", "mode": "chat", - "input_cost_per_token": 4.4e-03, - "output_cost_per_token": 1.76e-02, + "input_cost_per_token": 5.5e-7, + "output_cost_per_token": 2.2e-06, "max_input_tokens": 1000000, "max_output_tokens": 40000, "max_tokens": 40000, @@ -33106,8 +33121,8 @@ "novita/deepseek/deepseek-r1-0528": { "litellm_provider": "novita", "mode": "chat", - "input_cost_per_token": 5.6e-03, - "output_cost_per_token": 2e-02, + "input_cost_per_token": 7e-7, + "output_cost_per_token": 2.5e-06, "max_input_tokens": 163840, "max_output_tokens": 32768, "max_tokens": 32768, @@ -33116,15 +33131,15 @@ "supports_tool_choice": true, "supports_system_messages": true, "supports_response_schema": true, - "cache_read_input_token_cost": 2.8e-03, - "input_cost_per_token_cache_hit": 2.8e-03, + "cache_read_input_token_cost": 3.5e-7, + "input_cost_per_token_cache_hit": 3.5e-7, "supports_reasoning": true }, "novita/deepseek/deepseek-r1-distill-qwen-32b": { "litellm_provider": "novita", "mode": "chat", - "input_cost_per_token": 2.4e-03, - "output_cost_per_token": 2.4e-03, + "input_cost_per_token": 3e-7, + "output_cost_per_token": 3e-7, "max_input_tokens": 64000, "max_output_tokens": 32000, "max_tokens": 32000, @@ -33136,8 +33151,8 @@ "novita/meta-llama/llama-3-8b-instruct": { "litellm_provider": "novita", "mode": "chat", - "input_cost_per_token": 3.2e-04, - "output_cost_per_token": 3.2e-04, + "input_cost_per_token": 4e-8, + "output_cost_per_token": 4e-8, "max_input_tokens": 8192, "max_output_tokens": 8192, "max_tokens": 8192, @@ -33146,8 +33161,8 @@ "novita/microsoft/wizardlm-2-8x22b": { "litellm_provider": "novita", "mode": "chat", - "input_cost_per_token": 4.96e-03, - "output_cost_per_token": 4.96e-03, + "input_cost_per_token": 6.2e-7, + "output_cost_per_token": 6.2e-7, "max_input_tokens": 65535, "max_output_tokens": 8000, "max_tokens": 8000, @@ -33156,8 +33171,8 @@ "novita/deepseek/deepseek-r1-0528-qwen3-8b": { "litellm_provider": "novita", "mode": "chat", - "input_cost_per_token": 4.8e-04, - "output_cost_per_token": 7.2e-04, + "input_cost_per_token": 6e-8, + "output_cost_per_token": 9e-8, "max_input_tokens": 128000, "max_output_tokens": 32000, "max_tokens": 32000, @@ -33167,8 +33182,8 @@ "novita/deepseek/deepseek-r1-distill-llama-70b": { "litellm_provider": "novita", "mode": "chat", - "input_cost_per_token": 6.4e-03, - "output_cost_per_token": 6.4e-03, + "input_cost_per_token": 8e-7, + "output_cost_per_token": 8e-7, "max_input_tokens": 8192, "max_output_tokens": 8192, "max_tokens": 8192, @@ -33180,8 +33195,8 @@ "novita/meta-llama/llama-3-70b-instruct": { "litellm_provider": "novita", "mode": "chat", - "input_cost_per_token": 5.1e-03, - "output_cost_per_token": 7.4e-03, + "input_cost_per_token": 5.1e-7, + "output_cost_per_token": 7.4e-7, "max_input_tokens": 8192, "max_output_tokens": 8000, "max_tokens": 8000, @@ -33192,8 +33207,8 @@ "novita/qwen/qwen3-235b-a22b-fp8": { "litellm_provider": "novita", "mode": "chat", - "input_cost_per_token": 1.6e-03, - "output_cost_per_token": 6.4e-03, + "input_cost_per_token": 2e-7, + "output_cost_per_token": 8e-7, "max_input_tokens": 40960, "max_output_tokens": 20000, "max_tokens": 20000, @@ -33203,8 +33218,8 @@ "novita/meta-llama/llama-4-maverick-17b-128e-instruct-fp8": { "litellm_provider": "novita", "mode": "chat", - "input_cost_per_token": 1.6e-03, - "output_cost_per_token": 7.2e-03, + "input_cost_per_token": 2.7e-7, + "output_cost_per_token": 8.5e-7, "max_input_tokens": 1048576, "max_output_tokens": 8192, "max_tokens": 8192, @@ -33214,8 +33229,8 @@ "novita/meta-llama/llama-4-scout-17b-16e-instruct": { "litellm_provider": "novita", "mode": "chat", - "input_cost_per_token": 8e-04, - "output_cost_per_token": 4e-03, + "input_cost_per_token": 1.8e-7, + "output_cost_per_token": 5.9e-7, "max_input_tokens": 131072, "max_output_tokens": 131072, "max_tokens": 131072, @@ -33225,8 +33240,8 @@ "novita/nousresearch/hermes-2-pro-llama-3-8b": { "litellm_provider": "novita", "mode": "chat", - "input_cost_per_token": 1.4e-03, - "output_cost_per_token": 1.4e-03, + "input_cost_per_token": 1.4e-7, + "output_cost_per_token": 1.4e-7, "max_input_tokens": 8192, "max_output_tokens": 8192, "max_tokens": 8192, @@ -33237,8 +33252,8 @@ "novita/qwen/qwen2.5-vl-72b-instruct": { "litellm_provider": "novita", "mode": "chat", - "input_cost_per_token": 6.4e-03, - "output_cost_per_token": 6.4e-03, + "input_cost_per_token": 8e-7, + "output_cost_per_token": 8e-7, "max_input_tokens": 32768, "max_output_tokens": 32768, "max_tokens": 32768, @@ -33248,8 +33263,8 @@ "novita/sao10k/l3-70b-euryale-v2.1": { "litellm_provider": "novita", "mode": "chat", - "input_cost_per_token": 1.48e-02, - "output_cost_per_token": 1.48e-02, + "input_cost_per_token": 1.48e-06, + "output_cost_per_token": 1.48e-06, "max_input_tokens": 8192, "max_output_tokens": 8192, "max_tokens": 8192, @@ -33261,8 +33276,8 @@ "novita/baidu/ernie-4.5-21B-a3b-thinking": { "litellm_provider": "novita", "mode": "chat", - "input_cost_per_token": 5.6e-04, - "output_cost_per_token": 2.24e-03, + "input_cost_per_token": 7e-8, + "output_cost_per_token": 2.8e-7, "max_input_tokens": 131072, "max_output_tokens": 65536, "max_tokens": 65536, @@ -33272,8 +33287,8 @@ "novita/sao10k/l3-8b-lunaris": { "litellm_provider": "novita", "mode": "chat", - "input_cost_per_token": 5e-04, - "output_cost_per_token": 5e-04, + "input_cost_per_token": 5e-8, + "output_cost_per_token": 5e-8, "max_input_tokens": 8192, "max_output_tokens": 8192, "max_tokens": 8192, @@ -33284,33 +33299,18 @@ "novita/baichuan/baichuan-m2-32b": { "litellm_provider": "novita", "mode": "chat", - "input_cost_per_token": 5.6e-04, - "output_cost_per_token": 5.6e-04, + "input_cost_per_token": 7e-8, + "output_cost_per_token": 7e-8, "max_input_tokens": 131072, "max_output_tokens": 131072, "max_tokens": 131072, - "supports_tool_choice": true, - "supports_system_messages": true, - "supports_response_schema": true, - "supports_reasoning": true - }, - "novita/thudm/glm-4.1v-9b-thinking": { - "litellm_provider": "novita", - "mode": "chat", - "input_cost_per_token": 2.8e-04, - "output_cost_per_token": 1.104e-03, - "max_input_tokens": 65536, - "max_output_tokens": 8000, - "max_tokens": 8000, - "supports_vision": true, - "supports_system_messages": true, - "supports_reasoning": true + "supports_system_messages": true }, "novita/baidu/ernie-4.5-vl-424b-a47b": { "litellm_provider": "novita", "mode": "chat", - "input_cost_per_token": 3.36e-03, - "output_cost_per_token": 1e-02, + "input_cost_per_token": 4.2e-7, + "output_cost_per_token": 1.25e-06, "max_input_tokens": 123000, "max_output_tokens": 16000, "max_tokens": 16000, @@ -33321,8 +33321,8 @@ "novita/baidu/ernie-4.5-300b-a47b-paddle": { "litellm_provider": "novita", "mode": "chat", - "input_cost_per_token": 2.24e-03, - "output_cost_per_token": 8.8e-03, + "input_cost_per_token": 2.8e-7, + "output_cost_per_token": 1.1e-06, "max_input_tokens": 123000, "max_output_tokens": 12000, "max_tokens": 12000, @@ -33333,8 +33333,8 @@ "novita/deepseek/deepseek-prover-v2-671b": { "litellm_provider": "novita", "mode": "chat", - "input_cost_per_token": 5.6e-03, - "output_cost_per_token": 2e-02, + "input_cost_per_token": 7e-7, + "output_cost_per_token": 2.5e-06, "max_input_tokens": 160000, "max_output_tokens": 160000, "max_tokens": 160000, @@ -33343,8 +33343,8 @@ "novita/qwen/qwen3-32b-fp8": { "litellm_provider": "novita", "mode": "chat", - "input_cost_per_token": 8e-04, - "output_cost_per_token": 3.6e-03, + "input_cost_per_token": 1e-7, + "output_cost_per_token": 4.5e-7, "max_input_tokens": 40960, "max_output_tokens": 20000, "max_tokens": 20000, @@ -33354,8 +33354,8 @@ "novita/qwen/qwen3-30b-a3b-fp8": { "litellm_provider": "novita", "mode": "chat", - "input_cost_per_token": 7.2e-04, - "output_cost_per_token": 3.6e-03, + "input_cost_per_token": 9e-8, + "output_cost_per_token": 4.5e-7, "max_input_tokens": 40960, "max_output_tokens": 20000, "max_tokens": 20000, @@ -33365,8 +33365,8 @@ "novita/google/gemma-3-27b-it": { "litellm_provider": "novita", "mode": "chat", - "input_cost_per_token": 9.52e-04, - "output_cost_per_token": 1.6e-03, + "input_cost_per_token": 1.19e-7, + "output_cost_per_token": 2e-7, "max_input_tokens": 98304, "max_output_tokens": 16384, "max_tokens": 16384, @@ -33376,8 +33376,8 @@ "novita/deepseek/deepseek-v3-turbo": { "litellm_provider": "novita", "mode": "chat", - "input_cost_per_token": 3.2e-03, - "output_cost_per_token": 1.04e-02, + "input_cost_per_token": 4e-7, + "output_cost_per_token": 1.3e-06, "max_input_tokens": 64000, "max_output_tokens": 16000, "max_tokens": 16000, @@ -33389,8 +33389,8 @@ "novita/deepseek/deepseek-r1-turbo": { "litellm_provider": "novita", "mode": "chat", - "input_cost_per_token": 5.6e-03, - "output_cost_per_token": 2e-02, + "input_cost_per_token": 7e-7, + "output_cost_per_token": 2.5e-06, "max_input_tokens": 64000, "max_output_tokens": 16000, "max_tokens": 16000, @@ -33403,8 +33403,8 @@ "novita/Sao10K/L3-8B-Stheno-v3.2": { "litellm_provider": "novita", "mode": "chat", - "input_cost_per_token": 5e-04, - "output_cost_per_token": 5e-04, + "input_cost_per_token": 5e-8, + "output_cost_per_token": 5e-8, "max_input_tokens": 8192, "max_output_tokens": 32000, "max_tokens": 32000, @@ -33416,8 +33416,8 @@ "novita/gryphe/mythomax-l2-13b": { "litellm_provider": "novita", "mode": "chat", - "input_cost_per_token": 7.2e-04, - "output_cost_per_token": 7.2e-04, + "input_cost_per_token": 9e-8, + "output_cost_per_token": 9e-8, "max_input_tokens": 4096, "max_output_tokens": 3200, "max_tokens": 3200, @@ -33426,8 +33426,8 @@ "novita/baidu/ernie-4.5-vl-28b-a3b-thinking": { "litellm_provider": "novita", "mode": "chat", - "input_cost_per_token": 3.9e-03, - "output_cost_per_token": 3.9e-03, + "input_cost_per_token": 3.9e-7, + "output_cost_per_token": 3.9e-7, "max_input_tokens": 131072, "max_output_tokens": 65536, "max_tokens": 65536, @@ -33442,8 +33442,8 @@ "novita/qwen/qwen3-vl-8b-instruct": { "litellm_provider": "novita", "mode": "chat", - "input_cost_per_token": 6.4e-04, - "output_cost_per_token": 4e-03, + "input_cost_per_token": 8e-8, + "output_cost_per_token": 5e-7, "max_input_tokens": 131072, "max_output_tokens": 32768, "max_tokens": 32768, @@ -33457,8 +33457,8 @@ "novita/zai-org/glm-4.5-air": { "litellm_provider": "novita", "mode": "chat", - "input_cost_per_token": 1.04e-03, - "output_cost_per_token": 6.8e-03, + "input_cost_per_token": 1.3e-7, + "output_cost_per_token": 8.5e-7, "max_input_tokens": 131072, "max_output_tokens": 98304, "max_tokens": 98304, @@ -33471,8 +33471,8 @@ "novita/qwen/qwen3-vl-30b-a3b-instruct": { "litellm_provider": "novita", "mode": "chat", - "input_cost_per_token": 1.6e-03, - "output_cost_per_token": 5.6e-03, + "input_cost_per_token": 2e-7, + "output_cost_per_token": 7e-7, "max_input_tokens": 131072, "max_output_tokens": 32768, "max_tokens": 32768, @@ -33486,8 +33486,8 @@ "novita/qwen/qwen3-vl-30b-a3b-thinking": { "litellm_provider": "novita", "mode": "chat", - "input_cost_per_token": 1.6e-03, - "output_cost_per_token": 8e-03, + "input_cost_per_token": 2e-7, + "output_cost_per_token": 1e-06, "max_input_tokens": 131072, "max_output_tokens": 32768, "max_tokens": 32768, @@ -33498,11 +33498,45 @@ "supports_system_messages": true, "supports_response_schema": true }, + "novita/qwen/qwen3-omni-30b-a3b-thinking": { + "litellm_provider": "novita", + "mode": "chat", + "input_cost_per_token": 2.5e-7, + "output_cost_per_token": 9.7e-7, + "max_input_tokens": 65536, + "max_output_tokens": 16384, + "max_tokens": 16384, + "supports_function_calling": true, + "supports_parallel_function_calling": true, + "supports_tool_choice": true, + "supports_vision": true, + "supports_system_messages": true, + "supports_response_schema": true, + "supports_reasoning": true, + "supports_audio_input": true + }, + "novita/qwen/qwen3-omni-30b-a3b-instruct": { + "litellm_provider": "novita", + "mode": "chat", + "input_cost_per_token": 2.5e-7, + "output_cost_per_token": 9.7e-7, + "max_input_tokens": 65536, + "max_output_tokens": 16384, + "max_tokens": 16384, + "supports_function_calling": true, + "supports_parallel_function_calling": true, + "supports_tool_choice": true, + "supports_vision": true, + "supports_system_messages": true, + "supports_response_schema": true, + "supports_audio_input": true, + "supports_audio_output": true + }, "novita/qwen/qwen-mt-plus": { "litellm_provider": "novita", "mode": "chat", - "input_cost_per_token": 2e-03, - "output_cost_per_token": 6e-03, + "input_cost_per_token": 2.5e-7, + "output_cost_per_token": 7.5e-7, "max_input_tokens": 16384, "max_output_tokens": 8192, "max_tokens": 8192, @@ -33511,8 +33545,8 @@ "novita/baidu/ernie-4.5-vl-28b-a3b": { "litellm_provider": "novita", "mode": "chat", - "input_cost_per_token": 1.12e-03, - "output_cost_per_token": 4.48e-03, + "input_cost_per_token": 1.4e-7, + "output_cost_per_token": 5.6e-7, "max_input_tokens": 30000, "max_output_tokens": 8000, "max_tokens": 8000, @@ -33526,8 +33560,8 @@ "novita/baidu/ernie-4.5-21B-a3b": { "litellm_provider": "novita", "mode": "chat", - "input_cost_per_token": 5.6e-04, - "output_cost_per_token": 2.24e-03, + "input_cost_per_token": 7e-8, + "output_cost_per_token": 2.8e-7, "max_input_tokens": 120000, "max_output_tokens": 8000, "max_tokens": 8000, @@ -33539,8 +33573,8 @@ "novita/qwen/qwen3-8b-fp8": { "litellm_provider": "novita", "mode": "chat", - "input_cost_per_token": 2.8e-04, - "output_cost_per_token": 1.104e-03, + "input_cost_per_token": 3.5e-8, + "output_cost_per_token": 1.38e-7, "max_input_tokens": 128000, "max_output_tokens": 20000, "max_tokens": 20000, @@ -33550,8 +33584,8 @@ "novita/qwen/qwen3-4b-fp8": { "litellm_provider": "novita", "mode": "chat", - "input_cost_per_token": 2.4e-04, - "output_cost_per_token": 2.4e-04, + "input_cost_per_token": 3e-8, + "output_cost_per_token": 3e-8, "max_input_tokens": 128000, "max_output_tokens": 20000, "max_tokens": 20000, @@ -33561,8 +33595,8 @@ "novita/qwen/qwen2.5-7b-instruct": { "litellm_provider": "novita", "mode": "chat", - "input_cost_per_token": 5.6e-04, - "output_cost_per_token": 5.6e-04, + "input_cost_per_token": 7e-8, + "output_cost_per_token": 7e-8, "max_input_tokens": 32000, "max_output_tokens": 32000, "max_tokens": 32000, @@ -33575,8 +33609,8 @@ "novita/meta-llama/llama-3.2-3b-instruct": { "litellm_provider": "novita", "mode": "chat", - "input_cost_per_token": 2.4e-04, - "output_cost_per_token": 4e-04, + "input_cost_per_token": 3e-8, + "output_cost_per_token": 5e-8, "max_input_tokens": 32768, "max_output_tokens": 32000, "max_tokens": 32000, @@ -33588,8 +33622,8 @@ "novita/sao10k/l31-70b-euryale-v2.2": { "litellm_provider": "novita", "mode": "chat", - "input_cost_per_token": 1.48e-02, - "output_cost_per_token": 1.48e-02, + "input_cost_per_token": 1.48e-06, + "output_cost_per_token": 1.48e-06, "max_input_tokens": 8192, "max_output_tokens": 8192, "max_tokens": 8192, @@ -33601,7 +33635,7 @@ "novita/qwen/qwen3-embedding-0.6b": { "litellm_provider": "novita", "mode": "embedding", - "input_cost_per_token": 5.6e-04, + "input_cost_per_token": 7e-8, "output_cost_per_token": 0, "max_input_tokens": 32768, "max_output_tokens": 32768, @@ -33610,7 +33644,7 @@ "novita/qwen/qwen3-embedding-8b": { "litellm_provider": "novita", "mode": "embedding", - "input_cost_per_token": 5.6e-04, + "input_cost_per_token": 7e-8, "output_cost_per_token": 0, "max_input_tokens": 32768, "max_output_tokens": 4096, @@ -33619,8 +33653,8 @@ "novita/baai/bge-m3": { "litellm_provider": "novita", "mode": "embedding", - "input_cost_per_token": 1e-04, - "output_cost_per_token": 1e-04, + "input_cost_per_token": 1e-8, + "output_cost_per_token": 1e-8, "max_input_tokens": 8192, "max_output_tokens": 96000, "max_tokens": 96000 @@ -33628,8 +33662,8 @@ "novita/qwen/qwen3-reranker-8b": { "litellm_provider": "novita", "mode": "rerank", - "input_cost_per_token": 4e-04, - "output_cost_per_token": 4e-04, + "input_cost_per_token": 5e-8, + "output_cost_per_token": 5e-8, "max_input_tokens": 32768, "max_output_tokens": 4096, "max_tokens": 4096 @@ -33637,8 +33671,8 @@ "novita/baai/bge-reranker-v2-m3": { "litellm_provider": "novita", "mode": "rerank", - "input_cost_per_token": 1e-04, - "output_cost_per_token": 1e-04, + "input_cost_per_token": 1e-8, + "output_cost_per_token": 1e-8, "max_input_tokens": 8000, "max_output_tokens": 8000, "max_tokens": 8000 diff --git a/model_prices_and_context_window.sha256 b/model_prices_and_context_window.sha256 index 0f035461..6aae8cc5 100644 --- a/model_prices_and_context_window.sha256 +++ b/model_prices_and_context_window.sha256 @@ -1 +1 @@ -4c03542df14124d9bba491d2a37f235b1d22a005ab17c74168fbdeef53e34d07 +f12fec3516e45adc1566fd305e063b03f3b3c2bcd97cb84be1a1c61f3df9d0ca