diff --git a/internal/providers/configs/openrouter.json b/internal/providers/configs/openrouter.json index 9830b1d6de30f2e86a27edc7031fb441a638442f..c1af57f10943e90c715682ae28c65a8350bcffca 100644 --- a/internal/providers/configs/openrouter.json +++ b/internal/providers/configs/openrouter.json @@ -532,19 +532,6 @@ "supports_attachments": false, "options": {} }, - { - "id": "deepseek/deepseek-chat-v3-0324", - "name": "DeepSeek: DeepSeek V3 0324", - "cost_per_1m_in": 0.9, - "cost_per_1m_out": 0.9, - "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0, - "context_window": 163840, - "default_max_tokens": 16384, - "can_reason": false, - "supports_attachments": false, - "options": {} - }, { "id": "deepseek/deepseek-chat-v3.1", "name": "DeepSeek: DeepSeek V3.1", @@ -586,11 +573,11 @@ { "id": "deepseek/deepseek-v3.1-terminus:exacto", "name": "DeepSeek: DeepSeek V3.1 Terminus (exacto)", - "cost_per_1m_in": 0.21, - "cost_per_1m_out": 0.7899999999999999, + "cost_per_1m_in": 0.3, + "cost_per_1m_out": 1.2, "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0.16799999999999998, - "context_window": 163840, + "cost_per_1m_out_cached": 0, + "context_window": 131072, "default_max_tokens": 16384, "can_reason": true, "reasoning_levels": [ @@ -606,11 +593,11 @@ "id": "deepseek/deepseek-v3.2", "name": "DeepSeek: DeepSeek V3.2", "cost_per_1m_in": 0.27, - "cost_per_1m_out": 0.39999999999999997, + "cost_per_1m_out": 0.41, "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0.216, + "cost_per_1m_out_cached": 0, "context_window": 163840, - "default_max_tokens": 16384, + "default_max_tokens": 8192, "can_reason": true, "reasoning_levels": [ "low", @@ -662,12 +649,12 @@ { "id": "deepseek/deepseek-r1-0528", "name": "DeepSeek: R1 0528", - "cost_per_1m_in": 2.5500000000000003, - "cost_per_1m_out": 5.95, + "cost_per_1m_in": 0.39999999999999997, + "cost_per_1m_out": 1.75, "cost_per_1m_in_cached": 0, "cost_per_1m_out_cached": 0, "context_window": 163840, - "default_max_tokens": 65536, + "default_max_tokens": 81920, "can_reason": true, "reasoning_levels": [ "low", @@ -761,7 +748,7 @@ "cost_per_1m_in": 0.09999999999999999, "cost_per_1m_out": 0.39999999999999997, "cost_per_1m_in_cached": 0.18330000000000002, - "cost_per_1m_out_cached": 0.024999999999999998, + "cost_per_1m_out_cached": 0.01, "context_window": 1048576, "default_max_tokens": 32767, "can_reason": true, @@ -922,7 +909,7 @@ "cost_per_1m_in_cached": 0, "cost_per_1m_out_cached": 0, "context_window": 256000, - "default_max_tokens": 16000, + "default_max_tokens": 16384, "can_reason": false, "supports_attachments": false, "options": {} @@ -969,12 +956,12 @@ { "id": "meta-llama/llama-3.1-8b-instruct", "name": "Meta: Llama 3.1 8B Instruct", - "cost_per_1m_in": 0.02, - "cost_per_1m_out": 0.03, + "cost_per_1m_in": 0.03, + "cost_per_1m_out": 0.09, "cost_per_1m_in_cached": 0, "cost_per_1m_out_cached": 0, "context_window": 131072, - "default_max_tokens": 8192, + "default_max_tokens": 13107, "can_reason": false, "supports_attachments": false, "options": {} @@ -996,11 +983,11 @@ "id": "meta-llama/llama-3.3-70b-instruct", "name": "Meta: Llama 3.3 70B Instruct", "cost_per_1m_in": 0.13, - "cost_per_1m_out": 0.39999999999999997, + "cost_per_1m_out": 0.38, "cost_per_1m_in_cached": 0, "cost_per_1m_out_cached": 0, "context_window": 131072, - "default_max_tokens": 13107, + "default_max_tokens": 8192, "can_reason": false, "supports_attachments": false, "options": {} @@ -1086,12 +1073,12 @@ { "id": "minimax/minimax-m2", "name": "MiniMax: MiniMax M2", - "cost_per_1m_in": 0.27, - "cost_per_1m_out": 1.15, + "cost_per_1m_in": 0.3, + "cost_per_1m_out": 1.2, "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0, - "context_window": 262144, - "default_max_tokens": 26214, + "cost_per_1m_out_cached": 0.03, + "context_window": 204800, + "default_max_tokens": 65536, "can_reason": true, "reasoning_levels": [ "low", @@ -1141,19 +1128,6 @@ "supports_attachments": false, "options": {} }, - { - "id": "mistralai/mistral-small", - "name": "Mistral Small", - "cost_per_1m_in": 0.19999999999999998, - "cost_per_1m_out": 0.6, - "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0, - "context_window": 32768, - "default_max_tokens": 3276, - "can_reason": false, - "supports_attachments": false, - "options": {} - }, { "id": "mistralai/mistral-tiny", "name": "Mistral Tiny", @@ -1167,19 +1141,6 @@ "supports_attachments": false, "options": {} }, - { - "id": "mistralai/codestral-2501", - "name": "Mistral: Codestral 2501", - "cost_per_1m_in": 0.3, - "cost_per_1m_out": 0.8999999999999999, - "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0, - "context_window": 256000, - "default_max_tokens": 25600, - "can_reason": false, - "supports_attachments": false, - "options": {} - }, { "id": "mistralai/codestral-2508", "name": "Mistral: Codestral 2508", @@ -1220,8 +1181,8 @@ "options": {} }, { - "id": "mistralai/magistral-medium-2506", - "name": "Mistral: Magistral Medium 2506", + "id": "mistralai/magistral-medium-2506:thinking", + "name": "Mistral: Magistral Medium 2506 (thinking)", "cost_per_1m_in": 2, "cost_per_1m_out": 5, "cost_per_1m_in_cached": 0, @@ -1239,41 +1200,42 @@ "options": {} }, { - "id": "mistralai/magistral-medium-2506:thinking", - "name": "Mistral: Magistral Medium 2506 (thinking)", - "cost_per_1m_in": 2, - "cost_per_1m_out": 5, + "id": "mistralai/ministral-14b-2512", + "name": "Mistral: Ministral 3 14B 2512", + "cost_per_1m_in": 0.19999999999999998, + "cost_per_1m_out": 0.19999999999999998, "cost_per_1m_in_cached": 0, "cost_per_1m_out_cached": 0, - "context_window": 40960, - "default_max_tokens": 20000, - "can_reason": true, - "reasoning_levels": [ - "low", - "medium", - "high" - ], - "default_reasoning_effort": "medium", - "supports_attachments": false, + "context_window": 262144, + "default_max_tokens": 26214, + "can_reason": false, + "supports_attachments": true, "options": {} }, { - "id": "mistralai/magistral-small-2506", - "name": "Mistral: Magistral Small 2506", - "cost_per_1m_in": 0.5, - "cost_per_1m_out": 1.5, + "id": "mistralai/ministral-3b-2512", + "name": "Mistral: Ministral 3 3B 2512", + "cost_per_1m_in": 0.09999999999999999, + "cost_per_1m_out": 0.09999999999999999, "cost_per_1m_in_cached": 0, "cost_per_1m_out_cached": 0, - "context_window": 40000, - "default_max_tokens": 20000, - "can_reason": true, - "reasoning_levels": [ - "low", - "medium", - "high" - ], - "default_reasoning_effort": "medium", - "supports_attachments": false, + "context_window": 131072, + "default_max_tokens": 13107, + "can_reason": false, + "supports_attachments": true, + "options": {} + }, + { + "id": "mistralai/ministral-8b-2512", + "name": "Mistral: Ministral 3 8B 2512", + "cost_per_1m_in": 0.15, + "cost_per_1m_out": 0.15, + "cost_per_1m_in_cached": 0, + "cost_per_1m_out_cached": 0, + "context_window": 262144, + "default_max_tokens": 26214, + "can_reason": false, + "supports_attachments": true, "options": {} }, { @@ -1383,12 +1345,12 @@ { "id": "mistralai/mistral-small-24b-instruct-2501", "name": "Mistral: Mistral Small 3", - "cost_per_1m_in": 0.09999999999999999, - "cost_per_1m_out": 0.3, + "cost_per_1m_in": 0.7999999999999999, + "cost_per_1m_out": 0.7999999999999999, "cost_per_1m_in_cached": 0, "cost_per_1m_out_cached": 0, "context_window": 32768, - "default_max_tokens": 3276, + "default_max_tokens": 1024, "can_reason": false, "supports_attachments": false, "options": {} @@ -1396,12 +1358,12 @@ { "id": "mistralai/mistral-small-3.1-24b-instruct", "name": "Mistral: Mistral Small 3.1 24B", - "cost_per_1m_in": 0.09999999999999999, - "cost_per_1m_out": 0.3, + "cost_per_1m_in": 0.03, + "cost_per_1m_out": 0.11, "cost_per_1m_in_cached": 0, "cost_per_1m_out_cached": 0, "context_window": 131072, - "default_max_tokens": 13107, + "default_max_tokens": 65536, "can_reason": false, "supports_attachments": true, "options": {} @@ -1458,6 +1420,19 @@ "supports_attachments": false, "options": {} }, + { + "id": "mistralai/pixtral-12b", + "name": "Mistral: Pixtral 12B", + "cost_per_1m_in": 0.15, + "cost_per_1m_out": 0.15, + "cost_per_1m_in_cached": 0, + "cost_per_1m_out_cached": 0, + "context_window": 131072, + "default_max_tokens": 13107, + "can_reason": false, + "supports_attachments": true, + "options": {} + }, { "id": "mistralai/pixtral-large-2411", "name": "Mistral: Pixtral Large 2411", @@ -1539,12 +1514,12 @@ { "id": "moonshotai/kimi-k2-thinking", "name": "MoonshotAI: Kimi K2 Thinking", - "cost_per_1m_in": 0.47, - "cost_per_1m_out": 2, + "cost_per_1m_in": 0.6, + "cost_per_1m_out": 2.5, "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0.14100000000000001, + "cost_per_1m_out_cached": 0.15, "context_window": 262144, - "default_max_tokens": 26214, + "default_max_tokens": 131072, "can_reason": true, "reasoning_levels": [ "low", @@ -1609,8 +1584,8 @@ { "id": "nvidia/nemotron-nano-9b-v2", "name": "NVIDIA: Nemotron Nano 9B V2", - "cost_per_1m_in": 0.06, - "cost_per_1m_out": 0.25, + "cost_per_1m_in": 0.04, + "cost_per_1m_out": 0.16, "cost_per_1m_in_cached": 0, "cost_per_1m_out_cached": 0, "context_window": 131072, @@ -2003,9 +1978,9 @@ "cost_per_1m_in": 0.049999999999999996, "cost_per_1m_out": 0.39999999999999997, "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0.01, + "cost_per_1m_out_cached": 0.005, "context_window": 400000, - "default_max_tokens": 40000, + "default_max_tokens": 64000, "can_reason": true, "reasoning_levels": [ "low", @@ -2108,12 +2083,12 @@ { "id": "openai/gpt-oss-120b", "name": "OpenAI: gpt-oss-120b", - "cost_per_1m_in": 0.09, - "cost_per_1m_out": 0.36, + "cost_per_1m_in": 0.09999999999999999, + "cost_per_1m_out": 0.49, "cost_per_1m_in_cached": 0, "cost_per_1m_out_cached": 0, "context_window": 131072, - "default_max_tokens": 65536, + "default_max_tokens": 13107, "can_reason": true, "reasoning_levels": [ "low", @@ -2146,8 +2121,8 @@ { "id": "openai/gpt-oss-20b", "name": "OpenAI: gpt-oss-20b", - "cost_per_1m_in": 0.049999999999999996, - "cost_per_1m_out": 0.19999999999999998, + "cost_per_1m_in": 0.04, + "cost_per_1m_out": 0.15, "cost_per_1m_in_cached": 0, "cost_per_1m_out_cached": 0, "context_window": 131072, @@ -2529,12 +2504,12 @@ { "id": "qwen/qwen3-235b-a22b-2507", "name": "Qwen: Qwen3 235B A22B Instruct 2507", - "cost_per_1m_in": 0.09999999999999999, - "cost_per_1m_out": 0.09999999999999999, + "cost_per_1m_in": 0.25, + "cost_per_1m_out": 1, "cost_per_1m_in_cached": 0, "cost_per_1m_out_cached": 0, "context_window": 262144, - "default_max_tokens": 131072, + "default_max_tokens": 8192, "can_reason": false, "supports_attachments": false, "options": {} @@ -2542,7 +2517,7 @@ { "id": "qwen/qwen3-235b-a22b-thinking-2507", "name": "Qwen: Qwen3 235B A22B Thinking 2507", - "cost_per_1m_in": 0.11, + "cost_per_1m_in": 0.13, "cost_per_1m_out": 0.6, "cost_per_1m_in_cached": 0, "cost_per_1m_out_cached": 0, @@ -2580,8 +2555,8 @@ { "id": "qwen/qwen3-30b-a3b-instruct-2507", "name": "Qwen: Qwen3 30B A3B Instruct 2507", - "cost_per_1m_in": 0.09, - "cost_per_1m_out": 0.3, + "cost_per_1m_in": 0.08, + "cost_per_1m_out": 0.33, "cost_per_1m_in_cached": 0, "cost_per_1m_out_cached": 0, "context_window": 262144, @@ -2631,12 +2606,12 @@ { "id": "qwen/qwen3-coder-30b-a3b-instruct", "name": "Qwen: Qwen3 Coder 30B A3B Instruct", - "cost_per_1m_in": 0.09999999999999999, - "cost_per_1m_out": 0.3, + "cost_per_1m_in": 0.06, + "cost_per_1m_out": 0.25, "cost_per_1m_in_cached": 0, "cost_per_1m_out_cached": 0, "context_window": 262144, - "default_max_tokens": 26214, + "default_max_tokens": 131072, "can_reason": false, "supports_attachments": false, "options": {} @@ -2644,12 +2619,12 @@ { "id": "qwen/qwen3-coder", "name": "Qwen: Qwen3 Coder 480B A35B", - "cost_per_1m_in": 0.29, - "cost_per_1m_out": 1.2, + "cost_per_1m_in": 1, + "cost_per_1m_out": 1.5, "cost_per_1m_in_cached": 0, "cost_per_1m_out_cached": 0, "context_window": 262144, - "default_max_tokens": 32768, + "default_max_tokens": 131072, "can_reason": false, "supports_attachments": false, "options": {} @@ -2728,8 +2703,8 @@ { "id": "qwen/qwen3-next-80b-a3b-instruct", "name": "Qwen: Qwen3 Next 80B A3B Instruct", - "cost_per_1m_in": 0.14, - "cost_per_1m_out": 1.4, + "cost_per_1m_in": 0.15, + "cost_per_1m_out": 1.2, "cost_per_1m_in_cached": 0, "cost_per_1m_out_cached": 0, "context_window": 262144, @@ -2741,8 +2716,8 @@ { "id": "qwen/qwen3-next-80b-a3b-thinking", "name": "Qwen: Qwen3 Next 80B A3B Thinking", - "cost_per_1m_in": 0.3, - "cost_per_1m_out": 0.3, + "cost_per_1m_in": 0.15, + "cost_per_1m_out": 1.2, "cost_per_1m_in_cached": 0, "cost_per_1m_out_cached": 0, "context_window": 262144, @@ -2760,12 +2735,12 @@ { "id": "qwen/qwen3-vl-235b-a22b-instruct", "name": "Qwen: Qwen3 VL 235B A22B Instruct", - "cost_per_1m_in": 0.22, - "cost_per_1m_out": 0.88, + "cost_per_1m_in": 0.21, + "cost_per_1m_out": 1.9, "cost_per_1m_in_cached": 0, "cost_per_1m_out_cached": 0, - "context_window": 262144, - "default_max_tokens": 26214, + "context_window": 131072, + "default_max_tokens": 16384, "can_reason": false, "supports_attachments": true, "options": {} @@ -2959,7 +2934,7 @@ "id": "alibaba/tongyi-deepresearch-30b-a3b", "name": "Tongyi DeepResearch 30B A3B", "cost_per_1m_in": 0.09, - "cost_per_1m_out": 0.44999999999999996, + "cost_per_1m_out": 0.39999999999999997, "cost_per_1m_in_cached": 0, "cost_per_1m_out_cached": 0, "context_window": 131072, @@ -3009,12 +2984,12 @@ { "id": "z-ai/glm-4.5", "name": "Z.AI: GLM 4.5", - "cost_per_1m_in": 0.6, - "cost_per_1m_out": 2.2, + "cost_per_1m_in": 0.48, + "cost_per_1m_out": 1.76, "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0.11, + "cost_per_1m_out_cached": 0.088, "context_window": 131072, - "default_max_tokens": 48000, + "default_max_tokens": 49152, "can_reason": true, "reasoning_levels": [ "low", @@ -3085,12 +3060,12 @@ { "id": "z-ai/glm-4.6", "name": "Z.AI: GLM 4.6", - "cost_per_1m_in": 0.5, - "cost_per_1m_out": 1.9, + "cost_per_1m_in": 0.44, + "cost_per_1m_out": 1.76, "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0, + "cost_per_1m_out_cached": 0.088, "context_window": 204800, - "default_max_tokens": 102400, + "default_max_tokens": 65536, "can_reason": true, "reasoning_levels": [ "low", @@ -3104,12 +3079,12 @@ { "id": "z-ai/glm-4.6:exacto", "name": "Z.AI: GLM 4.6 (exacto)", - "cost_per_1m_in": 0.44, - "cost_per_1m_out": 1.76, + "cost_per_1m_in": 0.6, + "cost_per_1m_out": 2.2, "cost_per_1m_in_cached": 0, "cost_per_1m_out_cached": 0, - "context_window": 204800, - "default_max_tokens": 65536, + "context_window": 200000, + "default_max_tokens": 64000, "can_reason": true, "reasoning_levels": [ "low", @@ -3123,10 +3098,10 @@ { "id": "x-ai/grok-3", "name": "xAI: Grok 3", - "cost_per_1m_in": 5, - "cost_per_1m_out": 25, + "cost_per_1m_in": 3, + "cost_per_1m_out": 15, "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 1.25, + "cost_per_1m_out_cached": 0.75, "context_window": 131072, "default_max_tokens": 13107, "can_reason": false, @@ -3136,10 +3111,10 @@ { "id": "x-ai/grok-3-beta", "name": "xAI: Grok 3 Beta", - "cost_per_1m_in": 5, - "cost_per_1m_out": 25, + "cost_per_1m_in": 3, + "cost_per_1m_out": 15, "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 1.25, + "cost_per_1m_out_cached": 0.75, "context_window": 131072, "default_max_tokens": 13107, "can_reason": false, @@ -3149,10 +3124,10 @@ { "id": "x-ai/grok-3-mini", "name": "xAI: Grok 3 Mini", - "cost_per_1m_in": 0.3, - "cost_per_1m_out": 0.5, + "cost_per_1m_in": 0.6, + "cost_per_1m_out": 4, "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0.075, + "cost_per_1m_out_cached": 0.15, "context_window": 131072, "default_max_tokens": 13107, "can_reason": true, @@ -3168,10 +3143,10 @@ { "id": "x-ai/grok-3-mini-beta", "name": "xAI: Grok 3 Mini Beta", - "cost_per_1m_in": 0.3, - "cost_per_1m_out": 0.5, + "cost_per_1m_in": 0.6, + "cost_per_1m_out": 4, "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0.075, + "cost_per_1m_out_cached": 0.15, "context_window": 131072, "default_max_tokens": 13107, "can_reason": true, diff --git a/internal/providers/configs/synthetic.json b/internal/providers/configs/synthetic.json index 024c706a13bf2bc7747e1ba0f265c6832dcce5fa..5fb81c7b4062b59426fa7194f3aa7702f42dc518 100644 --- a/internal/providers/configs/synthetic.json +++ b/internal/providers/configs/synthetic.json @@ -109,6 +109,19 @@ "supports_attachments": false, "options": {} }, + { + "id": "hf:deepseek-ai/DeepSeek-V3.2", + "name": "DeepSeek V3.2", + "cost_per_1m_in": 0, + "cost_per_1m_out": 0, + "cost_per_1m_in_cached": 0, + "cost_per_1m_out_cached": 0, + "context_window": 162816, + "default_max_tokens": 16281, + "can_reason": false, + "supports_attachments": false, + "options": {} + }, { "id": "hf:zai-org/GLM-4.5", "name": "GLM 4.5",