diff --git a/internal/providers/configs/aihubmix.json b/internal/providers/configs/aihubmix.json index 16f2fd7d3a848624ce371184ac288f9448ccadb0..be5ebee561f981eb01dcb5bd3bdd927f0cde32b8 100644 --- a/internal/providers/configs/aihubmix.json +++ b/internal/providers/configs/aihubmix.json @@ -229,6 +229,24 @@ "default_reasoning_effort": "medium", "supports_attachments": true }, + { + "id": "baidu-deepseek-v4-flash", + "name": "Baidu DeepSeek V4 Flash", + "cost_per_1m_in": 0.142, + "cost_per_1m_out": 0.284, + "cost_per_1m_in_cached": 0, + "cost_per_1m_out_cached": 0.0142, + "context_window": 1000000, + "default_max_tokens": 384000, + "can_reason": true, + "reasoning_levels": [ + "low", + "medium", + "high" + ], + "default_reasoning_effort": "medium", + "supports_attachments": false + }, { "id": "claude-3-5-haiku", "name": "Claude 3.5 Haiku", @@ -2534,8 +2552,8 @@ "cost_per_1m_out": 3.9995, "cost_per_1m_in_cached": 0, "cost_per_1m_out_cached": 0.16084, - "context_window": 256000, - "default_max_tokens": 25600, + "context_window": 262144, + "default_max_tokens": 32768, "can_reason": true, "reasoning_levels": [ "low", diff --git a/internal/providers/configs/huggingface.json b/internal/providers/configs/huggingface.json index 262f4f8a588d560f3b2e85959872a550a36e2898..623d3280957d340ee1cfcd0cbb16df3a6b2833b8 100644 --- a/internal/providers/configs/huggingface.json +++ b/internal/providers/configs/huggingface.json @@ -7,6 +7,18 @@ "default_large_model_id": "moonshotai/Kimi-K2.5:fireworks-ai", "default_small_model_id": "openai/gpt-oss-20b:groq", "models": [ + { + "id": "MiniMaxAI/MiniMax-M2.5:fireworks-ai", + "name": "MiniMaxAI/MiniMax-M2.5 (fireworks-ai)", + "cost_per_1m_in": 0, + "cost_per_1m_out": 0, + "cost_per_1m_in_cached": 0, + "cost_per_1m_out_cached": 0, + "context_window": 204800, + "default_max_tokens": 8192, + "can_reason": false, + "supports_attachments": false + }, { "id": "MiniMaxAI/MiniMax-M2.7:fireworks-ai", "name": "MiniMaxAI/MiniMax-M2.7 (fireworks-ai)", diff --git a/internal/providers/configs/ionet.json b/internal/providers/configs/ionet.json index 3c3aca670a472da7d2bfd046e225c48ace0c8d8a..fcc84a0563f1c5655a26d1e496f0440dfd85e423 100644 --- a/internal/providers/configs/ionet.json +++ b/internal/providers/configs/ionet.json @@ -94,8 +94,8 @@ { "id": "MiniMaxAI/MiniMax-M2.5", "name": "MiniMaxAI/MiniMax-M2.5", - "cost_per_1m_in": 0.118, - "cost_per_1m_out": 0.99, + "cost_per_1m_in": 0.2, + "cost_per_1m_out": 1.2, "cost_per_1m_in_cached": 0.1, "cost_per_1m_out_cached": 0, "context_window": 196600, @@ -238,9 +238,9 @@ { "id": "zai-org/GLM-4.7", "name": "Z.ai: GLM 4.7", - "cost_per_1m_in": 0.3, - "cost_per_1m_out": 1.4, - "cost_per_1m_in_cached": 0.15, + "cost_per_1m_in": 0.5, + "cost_per_1m_out": 2, + "cost_per_1m_in_cached": 0.35, "cost_per_1m_out_cached": 0.6, "context_window": 202752, "default_max_tokens": 20275, @@ -274,7 +274,7 @@ { "id": "zai-org/GLM-5.1", "name": "Z.ai: GLM 5.1", - "cost_per_1m_in": 1.06, + "cost_per_1m_in": 1.5, "cost_per_1m_out": 4.4, "cost_per_1m_in_cached": 0.26, "cost_per_1m_out_cached": 0, diff --git a/internal/providers/configs/opencode-go.json b/internal/providers/configs/opencode-go.json index 320ce23ef9116aad80574b542825ffdd007acab0..fd796050c148671f40124a87f92ab1278c32ffd1 100644 --- a/internal/providers/configs/opencode-go.json +++ b/internal/providers/configs/opencode-go.json @@ -30,7 +30,7 @@ "name": "DeepSeek V4 Pro", "cost_per_1m_in": 1.74, "cost_per_1m_out": 3.48, - "cost_per_1m_in_cached": 0.14, + "cost_per_1m_in_cached": 0.01, "cost_per_1m_out_cached": 0, "context_window": 1000000, "default_max_tokens": 384000, @@ -158,7 +158,7 @@ "cost_per_1m_out": 2, "cost_per_1m_in_cached": 0.08, "cost_per_1m_out_cached": 0, - "context_window": 262144, + "context_window": 1000000, "default_max_tokens": 128000, "can_reason": true, "reasoning_levels": [ diff --git a/internal/providers/configs/opencode-zen.json b/internal/providers/configs/opencode-zen.json index 51570294a17c2f0cca08626ac701a74d39eddb8f..03dbfda415fdd965582ed599108ce9eff12a00a1 100644 --- a/internal/providers/configs/opencode-zen.json +++ b/internal/providers/configs/opencode-zen.json @@ -25,18 +25,6 @@ "default_reasoning_effort": "medium", "supports_attachments": false }, - { - "id": "claude-3-5-haiku", - "name": "Claude Haiku 3.5", - "cost_per_1m_in": 0.8, - "cost_per_1m_out": 4, - "cost_per_1m_in_cached": 0.08, - "cost_per_1m_out_cached": 1, - "context_window": 200000, - "default_max_tokens": 8192, - "can_reason": false, - "supports_attachments": true - }, { "id": "claude-haiku-4-5", "name": "Claude Haiku 4.5", @@ -495,7 +483,7 @@ "cost_per_1m_in_cached": 0.5, "cost_per_1m_out_cached": 0, "context_window": 1050000, - "default_max_tokens": 130000, + "default_max_tokens": 128000, "can_reason": true, "reasoning_levels": [ "low", @@ -541,24 +529,6 @@ "default_reasoning_effort": "medium", "supports_attachments": true }, - { - "id": "gemini-3-pro", - "name": "Gemini 3 Pro", - "cost_per_1m_in": 2, - "cost_per_1m_out": 12, - "cost_per_1m_in_cached": 0.2, - "cost_per_1m_out_cached": 0, - "context_window": 1048576, - "default_max_tokens": 65536, - "can_reason": true, - "reasoning_levels": [ - "low", - "medium", - "high" - ], - "default_reasoning_effort": "medium", - "supports_attachments": true - }, { "id": "gemini-3.1-pro", "name": "Gemini 3.1 Pro Preview", diff --git a/internal/providers/configs/openrouter.json b/internal/providers/configs/openrouter.json index c3cc947c2542fdd06cf66e2e53acb78bd196a80e..d52e14f96a548fdd9f82dc29d0f2a8e39f252bf4 100644 --- a/internal/providers/configs/openrouter.json +++ b/internal/providers/configs/openrouter.json @@ -129,7 +129,7 @@ "cost_per_1m_in_cached": 3.75, "cost_per_1m_out_cached": 0.3, "context_window": 200000, - "default_max_tokens": 64000, + "default_max_tokens": 32000, "can_reason": true, "reasoning_levels": [ "low", @@ -550,10 +550,10 @@ { "id": "deepseek/deepseek-chat-v3.1", "name": "DeepSeek: DeepSeek V3.1", - "cost_per_1m_in": 0.6, - "cost_per_1m_out": 1.7, + "cost_per_1m_in": 0.21, + "cost_per_1m_out": 0.79, "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0, + "cost_per_1m_out_cached": 0.13, "context_window": 163840, "default_max_tokens": 16384, "can_reason": true, @@ -625,7 +625,7 @@ "cost_per_1m_in": 0.14, "cost_per_1m_out": 0.28, "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0.028, + "cost_per_1m_out_cached": 0.0028, "context_window": 1048576, "default_max_tokens": 192000, "can_reason": true, @@ -643,7 +643,7 @@ "cost_per_1m_in": 0.435, "cost_per_1m_out": 0.87, "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0.03625, + "cost_per_1m_out_cached": 0.00363, "context_window": 1048576, "default_max_tokens": 192000, "can_reason": true, @@ -907,6 +907,18 @@ "default_reasoning_effort": "medium", "supports_attachments": true }, + { + "id": "google/gemma-3-12b-it", + "name": "Google: Gemma 3 12B", + "cost_per_1m_in": 0.04, + "cost_per_1m_out": 0.13, + "cost_per_1m_in_cached": 0, + "cost_per_1m_out_cached": 0, + "context_window": 131072, + "default_max_tokens": 8192, + "can_reason": false, + "supports_attachments": true + }, { "id": "google/gemma-3-27b-it", "name": "Google: Gemma 3 27B", @@ -922,12 +934,12 @@ { "id": "google/gemma-4-26b-a4b-it", "name": "Google: Gemma 4 26B A4B ", - "cost_per_1m_in": 0.13, - "cost_per_1m_out": 0.4, + "cost_per_1m_in": 0.07, + "cost_per_1m_out": 0.35, "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0, + "cost_per_1m_out_cached": 0.04, "context_window": 262144, - "default_max_tokens": 65536, + "default_max_tokens": 131072, "can_reason": true, "reasoning_levels": [ "low", @@ -958,12 +970,12 @@ { "id": "google/gemma-4-31b-it", "name": "Google: Gemma 4 31B", - "cost_per_1m_in": 0.14, - "cost_per_1m_out": 0.4, + "cost_per_1m_in": 0.13, + "cost_per_1m_out": 0.38, "cost_per_1m_in_cached": 0, "cost_per_1m_out_cached": 0, "context_window": 262144, - "default_max_tokens": 65536, + "default_max_tokens": 8192, "can_reason": true, "reasoning_levels": [ "low", @@ -1113,7 +1125,7 @@ "cost_per_1m_in_cached": 0, "cost_per_1m_out_cached": 0.03, "context_window": 204800, - "default_max_tokens": 65550, + "default_max_tokens": 65536, "can_reason": true, "reasoning_levels": [ "low", @@ -1258,12 +1270,12 @@ { "id": "mistralai/ministral-3b-2512", "name": "Mistral: Ministral 3 3B 2512", - "cost_per_1m_in": 0.1, - "cost_per_1m_out": 0.1, + "cost_per_1m_in": 0.15, + "cost_per_1m_out": 0.15, "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0.01, + "cost_per_1m_out_cached": 0, "context_window": 131072, - "default_max_tokens": 13107, + "default_max_tokens": 65536, "can_reason": false, "supports_attachments": true }, @@ -1447,9 +1459,9 @@ "cost_per_1m_in": 0.6, "cost_per_1m_out": 2.5, "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0, + "cost_per_1m_out_cached": 0.6, "context_window": 262144, - "default_max_tokens": 131072, + "default_max_tokens": 4096, "can_reason": false, "supports_attachments": false }, @@ -1474,10 +1486,10 @@ { "id": "moonshotai/kimi-k2.5", "name": "MoonshotAI: Kimi K2.5", - "cost_per_1m_in": 0.55, - "cost_per_1m_out": 3.25, + "cost_per_1m_in": 0.44, + "cost_per_1m_out": 2.2, "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0.15, + "cost_per_1m_out_cached": 0.22, "context_window": 262144, "default_max_tokens": 131072, "can_reason": true, @@ -1492,10 +1504,10 @@ { "id": "moonshotai/kimi-k2.6", "name": "MoonshotAI: Kimi K2.6", - "cost_per_1m_in": 0.95, - "cost_per_1m_out": 4, + "cost_per_1m_in": 1.2, + "cost_per_1m_out": 4.5, "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0.16, + "cost_per_1m_out_cached": 0.2, "context_window": 262144, "default_max_tokens": 26214, "can_reason": true, @@ -1777,7 +1789,7 @@ "cost_per_1m_in": 2.5, "cost_per_1m_out": 10, "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 1.25, + "cost_per_1m_out_cached": 0, "context_window": 128000, "default_max_tokens": 8192, "can_reason": false, @@ -1981,7 +1993,7 @@ "cost_per_1m_in": 1.25, "cost_per_1m_out": 10, "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0.125, + "cost_per_1m_out_cached": 0.13, "context_window": 400000, "default_max_tokens": 64000, "can_reason": true, @@ -2236,12 +2248,12 @@ { "id": "openai/gpt-oss-120b", "name": "OpenAI: gpt-oss-120b", - "cost_per_1m_in": 0.15, - "cost_per_1m_out": 0.6, + "cost_per_1m_in": 0.039, + "cost_per_1m_out": 0.19, "cost_per_1m_in_cached": 0, "cost_per_1m_out_cached": 0, "context_window": 131072, - "default_max_tokens": 13107, + "default_max_tokens": 65536, "can_reason": true, "reasoning_levels": [ "low", @@ -2272,10 +2284,10 @@ { "id": "openai/gpt-oss-20b", "name": "OpenAI: gpt-oss-20b", - "cost_per_1m_in": 0.05, - "cost_per_1m_out": 0.2, + "cost_per_1m_in": 0.03, + "cost_per_1m_out": 0.14, "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0.05, + "cost_per_1m_out_cached": 0, "context_window": 131072, "default_max_tokens": 65536, "can_reason": true, @@ -2506,8 +2518,8 @@ { "id": "qwen/qwen-2.5-72b-instruct", "name": "Qwen2.5 72B Instruct", - "cost_per_1m_in": 0.12, - "cost_per_1m_out": 0.39, + "cost_per_1m_in": 0.36, + "cost_per_1m_out": 0.4, "cost_per_1m_in_cached": 0, "cost_per_1m_out_cached": 0, "context_window": 32768, @@ -2623,6 +2635,24 @@ "can_reason": false, "supports_attachments": false }, + { + "id": "qwen/qwen3-14b", + "name": "Qwen: Qwen3 14B", + "cost_per_1m_in": 0.12, + "cost_per_1m_out": 0.24, + "cost_per_1m_in_cached": 0, + "cost_per_1m_out_cached": 0, + "context_window": 40960, + "default_max_tokens": 8192, + "can_reason": true, + "reasoning_levels": [ + "low", + "medium", + "high" + ], + "default_reasoning_effort": "medium", + "supports_attachments": false + }, { "id": "qwen/qwen3-235b-a22b", "name": "Qwen: Qwen3 235B A22B", @@ -2674,12 +2704,12 @@ { "id": "qwen/qwen3-30b-a3b", "name": "Qwen: Qwen3 30B A3B", - "cost_per_1m_in": 0.09, - "cost_per_1m_out": 0.45, + "cost_per_1m_in": 0.13, + "cost_per_1m_out": 0.52, "cost_per_1m_in_cached": 0, "cost_per_1m_out_cached": 0, - "context_window": 40960, - "default_max_tokens": 10000, + "context_window": 131072, + "default_max_tokens": 4096, "can_reason": true, "reasoning_levels": [ "low", @@ -2758,22 +2788,22 @@ { "id": "qwen/qwen3-coder-30b-a3b-instruct", "name": "Qwen: Qwen3 Coder 30B A3B Instruct", - "cost_per_1m_in": 0.07, - "cost_per_1m_out": 0.28, + "cost_per_1m_in": 0.2925, + "cost_per_1m_out": 1.4625, "cost_per_1m_in_cached": 0, "cost_per_1m_out_cached": 0, "context_window": 262144, - "default_max_tokens": 131072, + "default_max_tokens": 32768, "can_reason": false, "supports_attachments": false }, { "id": "qwen/qwen3-coder", "name": "Qwen: Qwen3 Coder 480B A35B", - "cost_per_1m_in": 0.3, - "cost_per_1m_out": 1, + "cost_per_1m_in": 0.22, + "cost_per_1m_out": 1.8, "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0.1, + "cost_per_1m_out_cached": 0, "context_window": 262144, "default_max_tokens": 32768, "can_reason": false, @@ -2806,10 +2836,10 @@ { "id": "qwen/qwen3-coder-next", "name": "Qwen: Qwen3 Coder Next", - "cost_per_1m_in": 0.14, + "cost_per_1m_in": 0.15, "cost_per_1m_out": 0.8, "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0.09, + "cost_per_1m_out_cached": 0.1, "context_window": 262144, "default_max_tokens": 131072, "can_reason": false, @@ -2902,12 +2932,12 @@ { "id": "qwen/qwen3-vl-235b-a22b-instruct", "name": "Qwen: Qwen3 VL 235B A22B Instruct", - "cost_per_1m_in": 0.2, - "cost_per_1m_out": 0.88, + "cost_per_1m_in": 0.26, + "cost_per_1m_out": 1.04, "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0.11, - "context_window": 262144, - "default_max_tokens": 8192, + "cost_per_1m_out_cached": 0, + "context_window": 131072, + "default_max_tokens": 16384, "can_reason": false, "supports_attachments": true }, @@ -3007,9 +3037,9 @@ "cost_per_1m_in": 0.6, "cost_per_1m_out": 3.6, "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0, + "cost_per_1m_out_cached": 0.3, "context_window": 262144, - "default_max_tokens": 32768, + "default_max_tokens": 131072, "can_reason": true, "reasoning_levels": [ "low", @@ -3040,10 +3070,10 @@ { "id": "qwen/qwen3.5-122b-a10b", "name": "Qwen: Qwen3.5-122B-A10B", - "cost_per_1m_in": 0.3, - "cost_per_1m_out": 2.4, + "cost_per_1m_in": 0.26, + "cost_per_1m_out": 2.08, "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0.3, + "cost_per_1m_out_cached": 0, "context_window": 262144, "default_max_tokens": 32768, "can_reason": true, @@ -3058,10 +3088,10 @@ { "id": "qwen/qwen3.5-27b", "name": "Qwen: Qwen3.5-27B", - "cost_per_1m_in": 0.27, - "cost_per_1m_out": 2.16, + "cost_per_1m_in": 0.3, + "cost_per_1m_out": 2.4, "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0.27, + "cost_per_1m_out_cached": 0, "context_window": 262144, "default_max_tokens": 32768, "can_reason": true, @@ -3163,9 +3193,9 @@ "cost_per_1m_in": 0.1, "cost_per_1m_out": 0.3, "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0.02, - "context_window": 256000, - "default_max_tokens": 128000, + "cost_per_1m_out_cached": 0, + "context_window": 262144, + "default_max_tokens": 32768, "can_reason": true, "reasoning_levels": [ "low", @@ -3381,7 +3411,7 @@ "cost_per_1m_in_cached": 0, "cost_per_1m_out_cached": 0.11, "context_window": 131072, - "default_max_tokens": 48000, + "default_max_tokens": 49152, "can_reason": true, "reasoning_levels": [ "low", @@ -3502,12 +3532,12 @@ { "id": "z-ai/glm-4.7-flash", "name": "Z.ai: GLM 4.7 Flash", - "cost_per_1m_in": 0.1, - "cost_per_1m_out": 0.43, + "cost_per_1m_in": 0.06, + "cost_per_1m_out": 0.4, "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0, + "cost_per_1m_out_cached": 0.01, "context_window": 202752, - "default_max_tokens": 101376, + "default_max_tokens": 8192, "can_reason": true, "reasoning_levels": [ "low", @@ -3616,10 +3646,10 @@ { "id": "x-ai/grok-3", "name": "xAI: Grok 3", - "cost_per_1m_in": 3, - "cost_per_1m_out": 15, + "cost_per_1m_in": 5, + "cost_per_1m_out": 25, "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0.75, + "cost_per_1m_out_cached": 1.25, "context_window": 131072, "default_max_tokens": 13107, "can_reason": false, @@ -3628,10 +3658,10 @@ { "id": "x-ai/grok-3-beta", "name": "xAI: Grok 3 Beta", - "cost_per_1m_in": 3, - "cost_per_1m_out": 15, + "cost_per_1m_in": 5, + "cost_per_1m_out": 25, "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0.75, + "cost_per_1m_out_cached": 1.25, "context_window": 131072, "default_max_tokens": 13107, "can_reason": false,