diff --git a/internal/providers/configs/aihubmix.json b/internal/providers/configs/aihubmix.json index b61e384e9195af6010295271119549bbfdc2e86c..9912128e1fb78a77be6fae4cbd4d95ee3a04ce62 100644 --- a/internal/providers/configs/aihubmix.json +++ b/internal/providers/configs/aihubmix.json @@ -2195,6 +2195,19 @@ "supports_attachments": false, "options": {} }, + { + "id": "qwen3-coder-next", + "name": "Qwen3 Coder Next", + "cost_per_1m_in": 0.137, + "cost_per_1m_out": 0.548, + "cost_per_1m_in_cached": 0, + "cost_per_1m_out_cached": 0.137, + "context_window": 2000000, + "default_max_tokens": 64000, + "can_reason": false, + "supports_attachments": false, + "options": {} + }, { "id": "qwen3-coder-plus", "name": "Qwen3 Coder Plus", diff --git a/internal/providers/configs/huggingface.json b/internal/providers/configs/huggingface.json index 93d7fb65c6f5cd94dca330bc52342b7985a2e5fb..43540fcd0811278e72a9e507fc2cfce8ba722a27 100644 --- a/internal/providers/configs/huggingface.json +++ b/internal/providers/configs/huggingface.json @@ -150,19 +150,6 @@ "supports_attachments": false, "options": {} }, - { - "id": "moonshotai/Kimi-K2.5:fireworks-ai", - "name": "moonshotai/Kimi-K2.5 (fireworks-ai)", - "cost_per_1m_in": 0, - "cost_per_1m_out": 0, - "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0, - "context_window": 262144, - "default_max_tokens": 8192, - "can_reason": false, - "supports_attachments": false, - "options": {} - }, { "id": "openai/gpt-oss-120b:cerebras", "name": "openai/gpt-oss-120b (cerebras)", diff --git a/internal/providers/configs/ionet.json b/internal/providers/configs/ionet.json index 3f64381e2822cb8f543c647d9961cd20172f6299..2a386cd2bf2863fa5774aa40b1c5f7f8c5353d08 100644 --- a/internal/providers/configs/ionet.json +++ b/internal/providers/configs/ionet.json @@ -29,10 +29,10 @@ { "id": "zai-org/GLM-4.7", "name": "GLM 4.7", - "cost_per_1m_in": 0.33, - "cost_per_1m_out": 1.54, - "cost_per_1m_in_cached": 0.165, - "cost_per_1m_out_cached": 0.66, + "cost_per_1m_in": 0.3, + "cost_per_1m_out": 1.4, + "cost_per_1m_in_cached": 0.15, + "cost_per_1m_out_cached": 0.6, "context_window": 200000, "default_max_tokens": 20000, "can_reason": true, diff --git a/internal/providers/configs/openrouter.json b/internal/providers/configs/openrouter.json index 388f4394329aa505d01a2916fde26c1bc666e812..1eba59014c4012bf0014bfa2dbee563a1f59b51d 100644 --- a/internal/providers/configs/openrouter.json +++ b/internal/providers/configs/openrouter.json @@ -509,25 +509,31 @@ { "id": "deepseek/deepseek-chat-v3-0324", "name": "DeepSeek: DeepSeek V3 0324", - "cost_per_1m_in": 0.27, - "cost_per_1m_out": 1.12, + "cost_per_1m_in": 0.77, + "cost_per_1m_out": 0.77, "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0.135, + "cost_per_1m_out_cached": 0, "context_window": 163840, - "default_max_tokens": 81920, - "can_reason": false, + "default_max_tokens": 65536, + "can_reason": true, + "reasoning_levels": [ + "low", + "medium", + "high" + ], + "default_reasoning_effort": "medium", "supports_attachments": false, "options": {} }, { "id": "deepseek/deepseek-chat-v3.1", "name": "DeepSeek: DeepSeek V3.1", - "cost_per_1m_in": 0.21, - "cost_per_1m_out": 0.7899999999999999, + "cost_per_1m_in": 0.19999999999999998, + "cost_per_1m_out": 0.7999999999999999, "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0.1300000002, + "cost_per_1m_out_cached": 0.09999999999999999, "context_window": 163840, - "default_max_tokens": 16384, + "default_max_tokens": 32768, "can_reason": true, "reasoning_levels": [ "low", @@ -582,9 +588,9 @@ "cost_per_1m_in": 0.26, "cost_per_1m_out": 0.38, "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0.15, + "cost_per_1m_out_cached": 0.13, "context_window": 163840, - "default_max_tokens": 32768, + "default_max_tokens": 16384, "can_reason": true, "reasoning_levels": [ "low", @@ -601,7 +607,7 @@ "cost_per_1m_in": 0.27, "cost_per_1m_out": 0.41, "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0.27, + "cost_per_1m_out_cached": 0, "context_window": 163840, "default_max_tokens": 32768, "can_reason": true, @@ -724,7 +730,7 @@ "cost_per_1m_in_cached": 0.08333333333333334, "cost_per_1m_out_cached": 0.01, "context_window": 1048576, - "default_max_tokens": 32768, + "default_max_tokens": 32767, "can_reason": true, "reasoning_levels": [ "low", @@ -849,19 +855,6 @@ "supports_attachments": true, "options": {} }, - { - "id": "google/gemma-3-27b-it", - "name": "Google: Gemma 3 27B", - "cost_per_1m_in": 0.04, - "cost_per_1m_out": 0.15, - "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0.02, - "context_window": 128000, - "default_max_tokens": 32768, - "can_reason": false, - "supports_attachments": true, - "options": {} - }, { "id": "google/gemma-3-27b-it:free", "name": "Google: Gemma 3 27B (free)", @@ -943,12 +936,12 @@ { "id": "meta-llama/llama-3.3-70b-instruct", "name": "Meta: Llama 3.3 70B Instruct", - "cost_per_1m_in": 0.59, - "cost_per_1m_out": 0.7899999999999999, + "cost_per_1m_in": 0.25, + "cost_per_1m_out": 0.75, "cost_per_1m_in_cached": 0, "cost_per_1m_out_cached": 0, "context_window": 131072, - "default_max_tokens": 16384, + "default_max_tokens": 13107, "can_reason": false, "supports_attachments": false, "options": {} @@ -1017,9 +1010,9 @@ "cost_per_1m_in": 0.3, "cost_per_1m_out": 1.2, "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0.029, + "cost_per_1m_out_cached": 0.03, "context_window": 204800, - "default_max_tokens": 20480, + "default_max_tokens": 65536, "can_reason": true, "reasoning_levels": [ "low", @@ -1231,6 +1224,19 @@ "supports_attachments": false, "options": {} }, + { + "id": "mistralai/mistral-small-24b-instruct-2501", + "name": "Mistral: Mistral Small 3", + "cost_per_1m_in": 0.09999999999999999, + "cost_per_1m_out": 0.3, + "cost_per_1m_in_cached": 0, + "cost_per_1m_out_cached": 0, + "context_window": 32768, + "default_max_tokens": 1024, + "can_reason": false, + "supports_attachments": false, + "options": {} + }, { "id": "mistralai/mistral-small-3.1-24b-instruct:free", "name": "Mistral: Mistral Small 3.1 24B (free)", @@ -1354,9 +1360,9 @@ "cost_per_1m_in": 0.6, "cost_per_1m_out": 2.5, "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0.15, + "cost_per_1m_out_cached": 0, "context_window": 262144, - "default_max_tokens": 26214, + "default_max_tokens": 131072, "can_reason": false, "supports_attachments": false, "options": {} @@ -1377,12 +1383,12 @@ { "id": "moonshotai/kimi-k2-thinking", "name": "MoonshotAI: Kimi K2 Thinking", - "cost_per_1m_in": 0.6, - "cost_per_1m_out": 2.5, + "cost_per_1m_in": 0.47, + "cost_per_1m_out": 2, "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0.15, - "context_window": 262144, - "default_max_tokens": 131072, + "cost_per_1m_out_cached": 0.14100000000000001, + "context_window": 131072, + "default_max_tokens": 13107, "can_reason": true, "reasoning_levels": [ "low", @@ -1396,12 +1402,12 @@ { "id": "moonshotai/kimi-k2.5", "name": "MoonshotAI: Kimi K2.5", - "cost_per_1m_in": 0.6, - "cost_per_1m_out": 3, + "cost_per_1m_in": 0.5700000000000001, + "cost_per_1m_out": 2.8499999999999996, "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0.09999999999999999, + "cost_per_1m_out_cached": 0.095, "context_window": 262144, - "default_max_tokens": 26214, + "default_max_tokens": 131072, "can_reason": true, "reasoning_levels": [ "low", @@ -1599,7 +1605,7 @@ "cost_per_1m_in_cached": 0, "cost_per_1m_out_cached": 0.5, "context_window": 1047576, - "default_max_tokens": 16384, + "default_max_tokens": 104757, "can_reason": false, "supports_attachments": true, "options": {} @@ -1623,9 +1629,9 @@ "cost_per_1m_in": 0.09999999999999999, "cost_per_1m_out": 0.39999999999999997, "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0.024999999999999998, + "cost_per_1m_out_cached": 0.03, "context_window": 1047576, - "default_max_tokens": 16384, + "default_max_tokens": 104757, "can_reason": false, "supports_attachments": true, "options": {} @@ -1816,9 +1822,9 @@ "cost_per_1m_in": 0.25, "cost_per_1m_out": 2, "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0.03, + "cost_per_1m_out_cached": 0.024999999999999998, "context_window": 400000, - "default_max_tokens": 40000, + "default_max_tokens": 64000, "can_reason": true, "reasoning_levels": [ "low", @@ -1835,9 +1841,9 @@ "cost_per_1m_in": 0.049999999999999996, "cost_per_1m_out": 0.39999999999999997, "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0.01, + "cost_per_1m_out_cached": 0.005, "context_window": 400000, - "default_max_tokens": 40000, + "default_max_tokens": 64000, "can_reason": true, "reasoning_levels": [ "low", @@ -1873,7 +1879,7 @@ "cost_per_1m_in": 1.25, "cost_per_1m_out": 10, "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0.13, + "cost_per_1m_out_cached": 0.125, "context_window": 400000, "default_max_tokens": 64000, "can_reason": true, @@ -2029,12 +2035,12 @@ { "id": "openai/gpt-oss-120b", "name": "OpenAI: gpt-oss-120b", - "cost_per_1m_in": 0.039, - "cost_per_1m_out": 0.19, + "cost_per_1m_in": 0.04, + "cost_per_1m_out": 0.18, "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0, + "cost_per_1m_out_cached": 0.02, "context_window": 131072, - "default_max_tokens": 13107, + "default_max_tokens": 32768, "can_reason": true, "reasoning_levels": [ "low", @@ -2086,8 +2092,8 @@ { "id": "openai/gpt-oss-20b", "name": "OpenAI: gpt-oss-20b", - "cost_per_1m_in": 0.049999999999999996, - "cost_per_1m_out": 0.19999999999999998, + "cost_per_1m_in": 0.03, + "cost_per_1m_out": 0.14, "cost_per_1m_in_cached": 0, "cost_per_1m_out_cached": 0, "context_window": 131072, @@ -2428,19 +2434,6 @@ "supports_attachments": false, "options": {} }, - { - "id": "qwen/qwen-2.5-7b-instruct", - "name": "Qwen: Qwen2.5 7B Instruct", - "cost_per_1m_in": 0.04, - "cost_per_1m_out": 0.09999999999999999, - "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0.04, - "context_window": 128000, - "default_max_tokens": 4096, - "can_reason": false, - "supports_attachments": false, - "options": {} - }, { "id": "qwen/qwen3-14b", "name": "Qwen: Qwen3 14B", @@ -2482,12 +2475,12 @@ { "id": "qwen/qwen3-235b-a22b-2507", "name": "Qwen: Qwen3 235B A22B Instruct 2507", - "cost_per_1m_in": 0.08, - "cost_per_1m_out": 0.55, + "cost_per_1m_in": 0.22, + "cost_per_1m_out": 0.88, "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0.04, + "cost_per_1m_out_cached": 0, "context_window": 262144, - "default_max_tokens": 32768, + "default_max_tokens": 8192, "can_reason": false, "supports_attachments": false, "options": {} @@ -2495,12 +2488,12 @@ { "id": "qwen/qwen3-235b-a22b-thinking-2507", "name": "Qwen: Qwen3 235B A22B Thinking 2507", - "cost_per_1m_in": 0, - "cost_per_1m_out": 0, + "cost_per_1m_in": 0.11, + "cost_per_1m_out": 0.6, "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0, - "context_window": 131072, - "default_max_tokens": 13107, + "cost_per_1m_out_cached": 0.055, + "context_window": 262144, + "default_max_tokens": 131072, "can_reason": true, "reasoning_levels": [ "low", @@ -2603,11 +2596,11 @@ { "id": "qwen/qwen3-8b", "name": "Qwen: Qwen3 8B", - "cost_per_1m_in": 0.117, - "cost_per_1m_out": 0.45499999999999996, + "cost_per_1m_in": 0.049999999999999996, + "cost_per_1m_out": 0.39999999999999997, "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0, - "context_window": 131072, + "cost_per_1m_out_cached": 0.049999999999999996, + "context_window": 32000, "default_max_tokens": 4096, "can_reason": true, "reasoning_levels": [ @@ -2622,12 +2615,12 @@ { "id": "qwen/qwen3-coder-30b-a3b-instruct", "name": "Qwen: Qwen3 Coder 30B A3B Instruct", - "cost_per_1m_in": 0.07, - "cost_per_1m_out": 0.28, + "cost_per_1m_in": 0.09999999999999999, + "cost_per_1m_out": 0.3, "cost_per_1m_in_cached": 0, "cost_per_1m_out_cached": 0, "context_window": 262144, - "default_max_tokens": 131072, + "default_max_tokens": 26214, "can_reason": false, "supports_attachments": false, "options": {} @@ -2636,11 +2629,11 @@ "id": "qwen/qwen3-coder", "name": "Qwen: Qwen3 Coder 480B A35B", "cost_per_1m_in": 0.22, - "cost_per_1m_out": 1.7999999999999998, + "cost_per_1m_out": 1, "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0, + "cost_per_1m_out_cached": 0.022, "context_window": 262144, - "default_max_tokens": 32768, + "default_max_tokens": 26214, "can_reason": false, "supports_attachments": false, "options": {} @@ -2687,12 +2680,12 @@ { "id": "qwen/qwen3-coder-next", "name": "Qwen: Qwen3 Coder Next", - "cost_per_1m_in": 0.15, - "cost_per_1m_out": 0.7999999999999999, + "cost_per_1m_in": 0.12, + "cost_per_1m_out": 0.75, "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0, + "cost_per_1m_out_cached": 0.06, "context_window": 262144, - "default_max_tokens": 131072, + "default_max_tokens": 32768, "can_reason": false, "supports_attachments": false, "options": {} @@ -2718,7 +2711,7 @@ "cost_per_1m_in_cached": 0, "cost_per_1m_out_cached": 0.24, "context_window": 262144, - "default_max_tokens": 32768, + "default_max_tokens": 16384, "can_reason": false, "supports_attachments": false, "options": {} @@ -2731,7 +2724,7 @@ "cost_per_1m_in_cached": 0, "cost_per_1m_out_cached": 0, "context_window": 262144, - "default_max_tokens": 32768, + "default_max_tokens": 16384, "can_reason": true, "reasoning_levels": [ "low", @@ -2745,12 +2738,12 @@ { "id": "qwen/qwen3-next-80b-a3b-instruct", "name": "Qwen: Qwen3 Next 80B A3B Instruct", - "cost_per_1m_in": 0.14, - "cost_per_1m_out": 1.4, + "cost_per_1m_in": 0.09, + "cost_per_1m_out": 1.1, "cost_per_1m_in_cached": 0, "cost_per_1m_out_cached": 0, "context_window": 262144, - "default_max_tokens": 131072, + "default_max_tokens": 26214, "can_reason": false, "supports_attachments": false, "options": {} @@ -2904,7 +2897,7 @@ "cost_per_1m_in_cached": 0, "cost_per_1m_out_cached": 0, "context_window": 262144, - "default_max_tokens": 32768, + "default_max_tokens": 32000, "can_reason": true, "reasoning_levels": [ "low", @@ -3071,10 +3064,10 @@ { "id": "xiaomi/mimo-v2-flash", "name": "Xiaomi: MiMo-V2-Flash", - "cost_per_1m_in": 0.09999999999999999, - "cost_per_1m_out": 0.3, + "cost_per_1m_in": 0.09, + "cost_per_1m_out": 0.29, "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0.01, + "cost_per_1m_out_cached": 0.045, "context_window": 262144, "default_max_tokens": 32768, "can_reason": true, @@ -3122,12 +3115,12 @@ { "id": "z-ai/glm-4.5-air", "name": "Z.ai: GLM 4.5 Air", - "cost_per_1m_in": 0.14, - "cost_per_1m_out": 0.86, + "cost_per_1m_in": 0.13, + "cost_per_1m_out": 0.85, "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0, + "cost_per_1m_out_cached": 0.024999999999999998, "context_window": 131072, - "default_max_tokens": 65536, + "default_max_tokens": 49152, "can_reason": true, "reasoning_levels": [ "low", @@ -3179,12 +3172,12 @@ { "id": "z-ai/glm-4.6", "name": "Z.ai: GLM 4.6", - "cost_per_1m_in": 0.39, - "cost_per_1m_out": 1.9, + "cost_per_1m_in": 0.55, + "cost_per_1m_out": 2.2, "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0, + "cost_per_1m_out_cached": 0.11, "context_window": 204800, - "default_max_tokens": 102400, + "default_max_tokens": 65536, "can_reason": true, "reasoning_levels": [ "low", @@ -3274,11 +3267,11 @@ { "id": "z-ai/glm-5", "name": "Z.ai: GLM 5", - "cost_per_1m_in": 1, - "cost_per_1m_out": 3.1999999999999997, + "cost_per_1m_in": 0.3, + "cost_per_1m_out": 2.5500000000000003, "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0.19999999999999998, - "context_window": 202800, + "cost_per_1m_out_cached": 0, + "context_window": 204800, "default_max_tokens": 65536, "can_reason": true, "reasoning_levels": [