diff --git a/internal/providers/configs/openrouter.json b/internal/providers/configs/openrouter.json index 0ac688e69ef7ee4d54347040fd024d26ae1e0382..6f03e4884c83e9d1b53956b9747801333363befa 100644 --- a/internal/providers/configs/openrouter.json +++ b/internal/providers/configs/openrouter.json @@ -508,8 +508,8 @@ "cost_per_1m_out": 1, "cost_per_1m_in_cached": 0, "cost_per_1m_out_cached": 0, - "context_window": 163840, - "default_max_tokens": 16384, + "context_window": 131072, + "default_max_tokens": 32768, "can_reason": true, "reasoning_levels": [ "low", @@ -660,7 +660,7 @@ "cost_per_1m_in": 0.09999999999999999, "cost_per_1m_out": 0.39999999999999997, "cost_per_1m_in_cached": 0.18330000000000002, - "cost_per_1m_out_cached": 0.01, + "cost_per_1m_out_cached": 0.024999999999999998, "context_window": 1048576, "default_max_tokens": 32767, "can_reason": true, @@ -681,7 +681,7 @@ "cost_per_1m_in_cached": 0, "cost_per_1m_out_cached": 0, "context_window": 1048576, - "default_max_tokens": 32767, + "default_max_tokens": 32768, "can_reason": true, "reasoning_levels": [ "low", @@ -787,19 +787,6 @@ "supports_attachments": true, "options": {} }, - { - "id": "google/gemma-3-27b-it", - "name": "Google: Gemma 3 27B", - "cost_per_1m_in": 0.13, - "cost_per_1m_out": 0.52, - "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0, - "context_window": 96000, - "default_max_tokens": 48000, - "can_reason": false, - "supports_attachments": true, - "options": {} - }, { "id": "inception/mercury", "name": "Inception: Mercury", @@ -852,6 +839,19 @@ "supports_attachments": false, "options": {} }, + { + "id": "meta-llama/llama-3.1-405b-instruct", + "name": "Meta: Llama 3.1 405B Instruct", + "cost_per_1m_in": 3.5, + "cost_per_1m_out": 3.5, + "cost_per_1m_in_cached": 0, + "cost_per_1m_out_cached": 0, + "context_window": 130815, + "default_max_tokens": 13081, + "can_reason": false, + "supports_attachments": false, + "options": {} + }, { "id": "meta-llama/llama-3.1-70b-instruct", "name": "Meta: Llama 3.1 70B Instruct", @@ -868,12 +868,12 @@ { "id": "meta-llama/llama-3.1-8b-instruct", "name": "Meta: Llama 3.1 8B Instruct", - "cost_per_1m_in": 0.02, - "cost_per_1m_out": 0.03, + "cost_per_1m_in": 0.09999999999999999, + "cost_per_1m_out": 0.09999999999999999, "cost_per_1m_in_cached": 0, "cost_per_1m_out_cached": 0, "context_window": 131072, - "default_max_tokens": 8192, + "default_max_tokens": 4000, "can_reason": false, "supports_attachments": false, "options": {} @@ -1357,6 +1357,19 @@ "supports_attachments": false, "options": {} }, + { + "id": "mistralai/pixtral-12b", + "name": "Mistral: Pixtral 12B", + "cost_per_1m_in": 0.15, + "cost_per_1m_out": 0.15, + "cost_per_1m_in_cached": 0, + "cost_per_1m_out_cached": 0, + "context_window": 131072, + "default_max_tokens": 13107, + "can_reason": false, + "supports_attachments": true, + "options": {} + }, { "id": "mistralai/pixtral-large-2411", "name": "Mistral: Pixtral Large 2411", @@ -1399,12 +1412,12 @@ { "id": "moonshotai/kimi-k2", "name": "MoonshotAI: Kimi K2 0711", - "cost_per_1m_in": 1, - "cost_per_1m_out": 3, + "cost_per_1m_in": 0.5, + "cost_per_1m_out": 2.4, "cost_per_1m_in_cached": 0, "cost_per_1m_out_cached": 0, "context_window": 131072, - "default_max_tokens": 65536, + "default_max_tokens": 13107, "can_reason": false, "supports_attachments": false, "options": {} @@ -1412,12 +1425,12 @@ { "id": "moonshotai/kimi-k2-0905", "name": "MoonshotAI: Kimi K2 0905", - "cost_per_1m_in": 1, - "cost_per_1m_out": 3, + "cost_per_1m_in": 0.5, + "cost_per_1m_out": 2, "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0.5, + "cost_per_1m_out_cached": 0, "context_window": 262144, - "default_max_tokens": 8192, + "default_max_tokens": 26214, "can_reason": false, "supports_attachments": false, "options": {} @@ -1425,12 +1438,12 @@ { "id": "moonshotai/kimi-k2-0905:exacto", "name": "MoonshotAI: Kimi K2 0905 (exacto)", - "cost_per_1m_in": 1, - "cost_per_1m_out": 3, + "cost_per_1m_in": 0.6, + "cost_per_1m_out": 2.5, "cost_per_1m_in_cached": 0, "cost_per_1m_out_cached": 0, "context_window": 262144, - "default_max_tokens": 8192, + "default_max_tokens": 26214, "can_reason": false, "supports_attachments": false, "options": {} @@ -1647,7 +1660,7 @@ "cost_per_1m_in_cached": 0, "cost_per_1m_out_cached": 0.5, "context_window": 1047576, - "default_max_tokens": 16384, + "default_max_tokens": 104757, "can_reason": false, "supports_attachments": true, "options": {} @@ -1883,9 +1896,9 @@ "cost_per_1m_in": 0.049999999999999996, "cost_per_1m_out": 0.39999999999999997, "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0.005, + "cost_per_1m_out_cached": 0.01, "context_window": 400000, - "default_max_tokens": 64000, + "default_max_tokens": 40000, "can_reason": true, "reasoning_levels": [ "low", @@ -2008,11 +2021,11 @@ "id": "openai/gpt-oss-120b:exacto", "name": "OpenAI: gpt-oss-120b (exacto)", "cost_per_1m_in": 0.049999999999999996, - "cost_per_1m_out": 0.24, + "cost_per_1m_out": 0.25, "cost_per_1m_in_cached": 0, "cost_per_1m_out_cached": 0, "context_window": 131072, - "default_max_tokens": 13107, + "default_max_tokens": 16384, "can_reason": true, "reasoning_levels": [ "low", @@ -2330,6 +2343,19 @@ "supports_attachments": false, "options": {} }, + { + "id": "qwen/qwen-2.5-7b-instruct", + "name": "Qwen: Qwen2.5 7B Instruct", + "cost_per_1m_in": 0.07, + "cost_per_1m_out": 0.07, + "cost_per_1m_in_cached": 0, + "cost_per_1m_out_cached": 0, + "context_window": 32000, + "default_max_tokens": 16000, + "can_reason": false, + "supports_attachments": false, + "options": {} + }, { "id": "qwen/qwen3-14b", "name": "Qwen: Qwen3 14B", @@ -2390,12 +2416,12 @@ { "id": "qwen/qwen3-235b-a22b-2507", "name": "Qwen: Qwen3 235B A22B Instruct 2507", - "cost_per_1m_in": 0.09999999999999999, - "cost_per_1m_out": 0.09999999999999999, + "cost_per_1m_in": 0.25, + "cost_per_1m_out": 1, "cost_per_1m_in_cached": 0, "cost_per_1m_out_cached": 0, "context_window": 262144, - "default_max_tokens": 131072, + "default_max_tokens": 8192, "can_reason": false, "supports_attachments": false, "options": {} @@ -2403,12 +2429,12 @@ { "id": "qwen/qwen3-235b-a22b-thinking-2507", "name": "Qwen: Qwen3 235B A22B Thinking 2507", - "cost_per_1m_in": 0.65, - "cost_per_1m_out": 3, + "cost_per_1m_in": 0.11, + "cost_per_1m_out": 0.6, "cost_per_1m_in_cached": 0, "cost_per_1m_out_cached": 0, "context_window": 262144, - "default_max_tokens": 26214, + "default_max_tokens": 131072, "can_reason": true, "reasoning_levels": [ "low", @@ -2441,16 +2467,35 @@ { "id": "qwen/qwen3-30b-a3b-instruct-2507", "name": "Qwen: Qwen3 30B A3B Instruct 2507", - "cost_per_1m_in": 0.08, - "cost_per_1m_out": 0.33, + "cost_per_1m_in": 0.09999999999999999, + "cost_per_1m_out": 0.3, "cost_per_1m_in_cached": 0, "cost_per_1m_out_cached": 0, "context_window": 262144, - "default_max_tokens": 131072, + "default_max_tokens": 26214, "can_reason": false, "supports_attachments": false, "options": {} }, + { + "id": "qwen/qwen3-30b-a3b-thinking-2507", + "name": "Qwen: Qwen3 30B A3B Thinking 2507", + "cost_per_1m_in": 0.19999999999999998, + "cost_per_1m_out": 2.4, + "cost_per_1m_in_cached": 0, + "cost_per_1m_out_cached": 0, + "context_window": 131072, + "default_max_tokens": 16384, + "can_reason": true, + "reasoning_levels": [ + "low", + "medium", + "high" + ], + "default_reasoning_effort": "medium", + "supports_attachments": false, + "options": {} + }, { "id": "qwen/qwen3-32b", "name": "Qwen: Qwen3 32B", @@ -2524,8 +2569,8 @@ { "id": "qwen/qwen3-coder", "name": "Qwen: Qwen3 Coder 480B A35B", - "cost_per_1m_in": 0.29, - "cost_per_1m_out": 1.2, + "cost_per_1m_in": 0.39999999999999997, + "cost_per_1m_out": 1.5999999999999999, "cost_per_1m_in_cached": 0, "cost_per_1m_out_cached": 0, "context_window": 262144, @@ -2608,12 +2653,12 @@ { "id": "qwen/qwen3-next-80b-a3b-instruct", "name": "Qwen: Qwen3 Next 80B A3B Instruct", - "cost_per_1m_in": 0.14, - "cost_per_1m_out": 1.1, + "cost_per_1m_in": 0.09999999999999999, + "cost_per_1m_out": 0.7999999999999999, "cost_per_1m_in_cached": 0, "cost_per_1m_out_cached": 0, "context_window": 262144, - "default_max_tokens": 26214, + "default_max_tokens": 131072, "can_reason": false, "supports_attachments": false, "options": {} @@ -2640,12 +2685,12 @@ { "id": "qwen/qwen3-vl-235b-a22b-instruct", "name": "Qwen: Qwen3 VL 235B A22B Instruct", - "cost_per_1m_in": 0.39999999999999997, - "cost_per_1m_out": 1.5999999999999999, + "cost_per_1m_in": 0.3, + "cost_per_1m_out": 1.2, "cost_per_1m_in_cached": 0, "cost_per_1m_out_cached": 0, - "context_window": 131072, - "default_max_tokens": 16384, + "context_window": 262144, + "default_max_tokens": 131072, "can_reason": false, "supports_attachments": true, "options": {} @@ -2801,7 +2846,7 @@ "id": "alibaba/tongyi-deepresearch-30b-a3b", "name": "Tongyi DeepResearch 30B A3B", "cost_per_1m_in": 0.09, - "cost_per_1m_out": 0.39999999999999997, + "cost_per_1m_out": 0.44999999999999996, "cost_per_1m_in_cached": 0, "cost_per_1m_out_cached": 0, "context_window": 131072, @@ -2851,12 +2896,12 @@ { "id": "z-ai/glm-4.5", "name": "Z.AI: GLM 4.5", - "cost_per_1m_in": 0.35, - "cost_per_1m_out": 1.55, + "cost_per_1m_in": 0.6, + "cost_per_1m_out": 2.2, "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0, + "cost_per_1m_out_cached": 0.11, "context_window": 131072, - "default_max_tokens": 65536, + "default_max_tokens": 49152, "can_reason": true, "reasoning_levels": [ "low", @@ -2870,12 +2915,12 @@ { "id": "z-ai/glm-4.5-air", "name": "Z.AI: GLM 4.5 Air", - "cost_per_1m_in": 0.19999999999999998, - "cost_per_1m_out": 1.1, + "cost_per_1m_in": 0.13, + "cost_per_1m_out": 0.85, "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0.03, + "cost_per_1m_out_cached": 0, "context_window": 131072, - "default_max_tokens": 48000, + "default_max_tokens": 49152, "can_reason": true, "reasoning_levels": [ "low", @@ -2908,12 +2953,12 @@ { "id": "z-ai/glm-4.5v", "name": "Z.AI: GLM 4.5V", - "cost_per_1m_in": 0.6, - "cost_per_1m_out": 1.7999999999999998, + "cost_per_1m_in": 1.1, + "cost_per_1m_out": 2.2, "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0.11, + "cost_per_1m_out_cached": 0, "context_window": 65536, - "default_max_tokens": 8192, + "default_max_tokens": 32768, "can_reason": true, "reasoning_levels": [ "low", @@ -2946,12 +2991,12 @@ { "id": "z-ai/glm-4.6:exacto", "name": "Z.AI: GLM 4.6 (exacto)", - "cost_per_1m_in": 0.6, - "cost_per_1m_out": 2.2, + "cost_per_1m_in": 0.44999999999999996, + "cost_per_1m_out": 1.9, "cost_per_1m_in_cached": 0, "cost_per_1m_out_cached": 0, - "context_window": 204800, - "default_max_tokens": 65536, + "context_window": 202752, + "default_max_tokens": 20275, "can_reason": true, "reasoning_levels": [ "low", @@ -2965,10 +3010,10 @@ { "id": "x-ai/grok-3", "name": "xAI: Grok 3", - "cost_per_1m_in": 5, - "cost_per_1m_out": 25, + "cost_per_1m_in": 3, + "cost_per_1m_out": 15, "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 1.25, + "cost_per_1m_out_cached": 0.75, "context_window": 131072, "default_max_tokens": 13107, "can_reason": false, @@ -2978,10 +3023,10 @@ { "id": "x-ai/grok-3-beta", "name": "xAI: Grok 3 Beta", - "cost_per_1m_in": 5, - "cost_per_1m_out": 25, + "cost_per_1m_in": 3, + "cost_per_1m_out": 15, "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 1.25, + "cost_per_1m_out_cached": 0.75, "context_window": 131072, "default_max_tokens": 13107, "can_reason": false,