From 5e2ed4f0ff59c7b5ae8381e0f619859ce69fef34 Mon Sep 17 00:00:00 2001 From: Charm <124303983+charmcli@users.noreply.github.com> Date: Tue, 3 Mar 2026 03:05:50 +0000 Subject: [PATCH] chore: auto-update generated files --- internal/providers/configs/aihubmix.json | 189 +++++++++++++++- internal/providers/configs/huggingface.json | 39 ++-- internal/providers/configs/openrouter.json | 229 ++++++++++---------- 3 files changed, 330 insertions(+), 127 deletions(-) diff --git a/internal/providers/configs/aihubmix.json b/internal/providers/configs/aihubmix.json index e42e0fbcbf82f926aab60c9228180fe5b8756aba..79d991b457dbbd85e2c6ad685569e83ec1294eeb 100644 --- a/internal/providers/configs/aihubmix.json +++ b/internal/providers/configs/aihubmix.json @@ -582,6 +582,25 @@ "supports_attachments": false, "options": {} }, + { + "id": "coding-minimax-m2.1-free", + "name": "Coding MiniMax M2.1 (free)", + "cost_per_1m_in": 0, + "cost_per_1m_out": 0, + "cost_per_1m_in_cached": 0, + "cost_per_1m_out_cached": 0, + "context_window": 204800, + "default_max_tokens": 13100, + "can_reason": true, + "reasoning_levels": [ + "low", + "medium", + "high" + ], + "default_reasoning_effort": "medium", + "supports_attachments": false, + "options": {} + }, { "id": "coding-minimax-m2.5", "name": "Coding MiniMax M2.5", @@ -601,6 +620,25 @@ "supports_attachments": false, "options": {} }, + { + "id": "coding-minimax-m2.5-free", + "name": "Coding MiniMax M2.5 (free)", + "cost_per_1m_in": 0, + "cost_per_1m_out": 0, + "cost_per_1m_in_cached": 0, + "cost_per_1m_out_cached": 0, + "context_window": 204800, + "default_max_tokens": 13100, + "can_reason": true, + "reasoning_levels": [ + "low", + "medium", + "high" + ], + "default_reasoning_effort": "medium", + "supports_attachments": false, + "options": {} + }, { "id": "coding-minimax-m2.5-highspeed", "name": "Coding MiniMax M2.5 Highspeed", @@ -648,7 +686,13 @@ "cost_per_1m_out_cached": 0.0302, "context_window": 128000, "default_max_tokens": 64000, - "can_reason": false, + "can_reason": true, + "reasoning_levels": [ + "low", + "medium", + "high" + ], + "default_reasoning_effort": "medium", "supports_attachments": false, "options": {} }, @@ -661,7 +705,13 @@ "cost_per_1m_out_cached": 1.096, "context_window": 128000, "default_max_tokens": 12800, - "can_reason": false, + "can_reason": true, + "reasoning_levels": [ + "low", + "medium", + "high" + ], + "default_reasoning_effort": "medium", "supports_attachments": false, "options": {} }, @@ -693,7 +743,13 @@ "cost_per_1m_out_cached": 0.0302, "context_window": 128000, "default_max_tokens": 64000, - "can_reason": false, + "can_reason": true, + "reasoning_levels": [ + "low", + "medium", + "high" + ], + "default_reasoning_effort": "medium", "supports_attachments": false, "options": {} }, @@ -1305,6 +1361,25 @@ "supports_attachments": false, "options": {} }, + { + "id": "glm-5", + "name": "GLM 5", + "cost_per_1m_in": 0.88, + "cost_per_1m_out": 2.816, + "cost_per_1m_in_cached": 0, + "cost_per_1m_out_cached": 0.176, + "context_window": 202752, + "default_max_tokens": 20275, + "can_reason": true, + "reasoning_levels": [ + "low", + "medium", + "high" + ], + "default_reasoning_effort": "medium", + "supports_attachments": false, + "options": {} + }, { "id": "gpt-4.1", "name": "GPT 4.1", @@ -1887,6 +1962,38 @@ "supports_attachments": true, "options": {} }, + { + "id": "grok-4-fast-non-reasoning", + "name": "Grok 4 Fast", + "cost_per_1m_in": 0.2, + "cost_per_1m_out": 0.5, + "cost_per_1m_in_cached": 0, + "cost_per_1m_out_cached": 0.05, + "context_window": 2000000, + "default_max_tokens": 30000, + "can_reason": false, + "supports_attachments": true, + "options": {} + }, + { + "id": "grok-4-fast-reasoning", + "name": "Grok 4 Fast (reasoning)", + "cost_per_1m_in": 0.2, + "cost_per_1m_out": 0.5, + "cost_per_1m_in_cached": 0, + "cost_per_1m_out_cached": 0.05, + "context_window": 2000000, + "default_max_tokens": 30000, + "can_reason": true, + "reasoning_levels": [ + "low", + "medium", + "high" + ], + "default_reasoning_effort": "medium", + "supports_attachments": true, + "options": {} + }, { "id": "grok-code-fast-1", "name": "Grok Code Fast 1", @@ -2060,6 +2167,82 @@ "supports_attachments": false, "options": {} }, + { + "id": "minimax-m2", + "name": "MiniMax M2", + "cost_per_1m_in": 0.288, + "cost_per_1m_out": 1.152, + "cost_per_1m_in_cached": 0, + "cost_per_1m_out_cached": 0, + "context_window": 204800, + "default_max_tokens": 20480, + "can_reason": true, + "reasoning_levels": [ + "low", + "medium", + "high" + ], + "default_reasoning_effort": "medium", + "supports_attachments": false, + "options": {} + }, + { + "id": "minimax-m2.1", + "name": "MiniMax M2.1", + "cost_per_1m_in": 0.288, + "cost_per_1m_out": 1.152, + "cost_per_1m_in_cached": 0, + "cost_per_1m_out_cached": 0, + "context_window": 204800, + "default_max_tokens": 20480, + "can_reason": true, + "reasoning_levels": [ + "low", + "medium", + "high" + ], + "default_reasoning_effort": "medium", + "supports_attachments": false, + "options": {} + }, + { + "id": "minimax-m2.5", + "name": "MiniMax M2.5", + "cost_per_1m_in": 0.288, + "cost_per_1m_out": 1.152, + "cost_per_1m_in_cached": 0, + "cost_per_1m_out_cached": 0, + "context_window": 204800, + "default_max_tokens": 20480, + "can_reason": true, + "reasoning_levels": [ + "low", + "medium", + "high" + ], + "default_reasoning_effort": "medium", + "supports_attachments": false, + "options": {} + }, + { + "id": "minimax-m2.5-highspeed", + "name": "MiniMax M2.5 Highspeed", + "cost_per_1m_in": 0.288, + "cost_per_1m_out": 1.152, + "cost_per_1m_in_cached": 0, + "cost_per_1m_out_cached": 0, + "context_window": 204800, + "default_max_tokens": 20480, + "can_reason": true, + "reasoning_levels": [ + "low", + "medium", + "high" + ], + "default_reasoning_effort": "medium", + "supports_attachments": false, + "options": {} + }, { "id": "mistral-large-3", "name": "Mistral Large 3", diff --git a/internal/providers/configs/huggingface.json b/internal/providers/configs/huggingface.json index 2b6220fbc00f6bbb1ad6d42b419874e2e16904da..6256bab6cbce3d48382a378dd38a945eb10108e9 100644 --- a/internal/providers/configs/huggingface.json +++ b/internal/providers/configs/huggingface.json @@ -46,6 +46,19 @@ "supports_attachments": false, "options": {} }, + { + "id": "deepseek-ai/DeepSeek-V3.2:fireworks-ai", + "name": "deepseek-ai/DeepSeek-V3.2 (fireworks-ai)", + "cost_per_1m_in": 0, + "cost_per_1m_out": 0, + "cost_per_1m_in_cached": 0, + "cost_per_1m_out_cached": 0, + "context_window": 163840, + "default_max_tokens": 8192, + "can_reason": false, + "supports_attachments": false, + "options": {} + }, { "id": "meta-llama/Llama-3.3-70B-Instruct:groq", "name": "meta-llama/Llama-3.3-70B-Instruct (groq)", @@ -59,6 +72,19 @@ "supports_attachments": false, "options": {} }, + { + "id": "meta-llama/Llama-4-Maverick-17B-128E-Instruct:groq", + "name": "meta-llama/Llama-4-Maverick-17B-128E-Instruct (groq)", + "cost_per_1m_in": 0.2, + "cost_per_1m_out": 0.6, + "cost_per_1m_in_cached": 0, + "cost_per_1m_out_cached": 0, + "context_window": 131072, + "default_max_tokens": 8192, + "can_reason": false, + "supports_attachments": false, + "options": {} + }, { "id": "meta-llama/Llama-4-Scout-17B-16E-Instruct:groq", "name": "meta-llama/Llama-4-Scout-17B-16E-Instruct (groq)", @@ -162,19 +188,6 @@ "can_reason": false, "supports_attachments": false, "options": {} - }, - { - "id": "zai-org/GLM-5:fireworks-ai", - "name": "zai-org/GLM-5 (fireworks-ai)", - "cost_per_1m_in": 0, - "cost_per_1m_out": 0, - "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0, - "context_window": 202752, - "default_max_tokens": 8192, - "can_reason": false, - "supports_attachments": false, - "options": {} } ], "default_headers": { diff --git a/internal/providers/configs/openrouter.json b/internal/providers/configs/openrouter.json index 773cbb8f1ad0ac20e8c576ad982bfb16336d4373..5fb15ec47e7114524cb42214bc6b6a8b471c5148 100644 --- a/internal/providers/configs/openrouter.json +++ b/internal/providers/configs/openrouter.json @@ -346,25 +346,6 @@ "supports_attachments": false, "options": {} }, - { - "id": "arcee-ai/trinity-mini", - "name": "Arcee AI: Trinity Mini", - "cost_per_1m_in": 0.045, - "cost_per_1m_out": 0.15, - "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0, - "context_window": 131072, - "default_max_tokens": 65536, - "can_reason": true, - "reasoning_levels": [ - "low", - "medium", - "high" - ], - "default_reasoning_effort": "medium", - "supports_attachments": false, - "options": {} - }, { "id": "arcee-ai/trinity-mini:free", "name": "Arcee AI: Trinity Mini (free)", @@ -603,7 +584,7 @@ "cost_per_1m_in_cached": 0, "cost_per_1m_out_cached": 0.13, "context_window": 163840, - "default_max_tokens": 32768, + "default_max_tokens": 16384, "can_reason": true, "reasoning_levels": [ "low", @@ -622,7 +603,7 @@ "cost_per_1m_in_cached": 0, "cost_per_1m_out_cached": 0.27, "context_window": 163840, - "default_max_tokens": 32768, + "default_max_tokens": 81920, "can_reason": true, "reasoning_levels": [ "low", @@ -655,12 +636,12 @@ { "id": "deepseek/deepseek-r1-0528", "name": "DeepSeek: R1 0528", - "cost_per_1m_in": 0.44999999999999996, - "cost_per_1m_out": 2.1500000000000004, + "cost_per_1m_in": 0.7, + "cost_per_1m_out": 2.5, "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0.22499999999999998, + "cost_per_1m_out_cached": 0.35, "context_window": 163840, - "default_max_tokens": 32768, + "default_max_tokens": 16384, "can_reason": true, "reasoning_levels": [ "low", @@ -671,6 +652,19 @@ "supports_attachments": false, "options": {} }, + { + "id": "essentialai/rnj-1-instruct", + "name": "EssentialAI: Rnj 1 Instruct", + "cost_per_1m_in": 0.15, + "cost_per_1m_out": 0.15, + "cost_per_1m_in_cached": 0, + "cost_per_1m_out_cached": 0, + "context_window": 32768, + "default_max_tokens": 3276, + "can_reason": false, + "supports_attachments": false, + "options": {} + }, { "id": "google/gemini-2.0-flash-001", "name": "Google: Gemini 2.0 Flash", @@ -900,6 +894,19 @@ "supports_attachments": true, "options": {} }, + { + "id": "google/gemma-3-27b-it:free", + "name": "Google: Gemma 3 27B (free)", + "cost_per_1m_in": 0, + "cost_per_1m_out": 0, + "cost_per_1m_in_cached": 0, + "cost_per_1m_out_cached": 0, + "context_window": 128000, + "default_max_tokens": 64000, + "can_reason": false, + "supports_attachments": true, + "options": {} + }, { "id": "inception/mercury", "name": "Inception: Mercury", @@ -947,7 +954,7 @@ "cost_per_1m_in_cached": 0, "cost_per_1m_out_cached": 0.19999999999999998, "context_window": 131072, - "default_max_tokens": 16384, + "default_max_tokens": 65536, "can_reason": false, "supports_attachments": false, "options": {} @@ -981,12 +988,12 @@ { "id": "meta-llama/llama-3.3-70b-instruct", "name": "Meta: Llama 3.3 70B Instruct", - "cost_per_1m_in": 0.59, - "cost_per_1m_out": 0.7899999999999999, + "cost_per_1m_in": 0.135, + "cost_per_1m_out": 0.39999999999999997, "cost_per_1m_in_cached": 0, "cost_per_1m_out_cached": 0, "context_window": 131072, - "default_max_tokens": 16384, + "default_max_tokens": 60000, "can_reason": false, "supports_attachments": false, "options": {} @@ -1007,12 +1014,12 @@ { "id": "meta-llama/llama-4-maverick", "name": "Meta: Llama 4 Maverick", - "cost_per_1m_in": 0.35, - "cost_per_1m_out": 1.15, + "cost_per_1m_in": 0.27, + "cost_per_1m_out": 0.85, "cost_per_1m_in_cached": 0, "cost_per_1m_out_cached": 0, - "context_window": 524288, - "default_max_tokens": 4096, + "context_window": 1048576, + "default_max_tokens": 104857, "can_reason": false, "supports_attachments": true, "options": {} @@ -1033,10 +1040,10 @@ { "id": "minimax/minimax-m2", "name": "MiniMax: MiniMax M2", - "cost_per_1m_in": 0.255, - "cost_per_1m_out": 1.02, + "cost_per_1m_in": 0.3, + "cost_per_1m_out": 1.2, "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0, + "cost_per_1m_out_cached": 0.03, "context_window": 204800, "default_max_tokens": 65536, "can_reason": true, @@ -1055,9 +1062,9 @@ "cost_per_1m_in": 0.3, "cost_per_1m_out": 1.2, "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0.03, + "cost_per_1m_out_cached": 0.029, "context_window": 204800, - "default_max_tokens": 65536, + "default_max_tokens": 20480, "can_reason": true, "reasoning_levels": [ "low", @@ -1392,7 +1399,7 @@ "cost_per_1m_in": 0.6, "cost_per_1m_out": 2.5, "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0.15, + "cost_per_1m_out_cached": 0.3, "context_window": 262144, "default_max_tokens": 26214, "can_reason": false, @@ -1435,11 +1442,11 @@ "id": "moonshotai/kimi-k2.5", "name": "MoonshotAI: Kimi K2.5", "cost_per_1m_in": 0.6, - "cost_per_1m_out": 3, + "cost_per_1m_out": 2.8, "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0.1, + "cost_per_1m_out_cached": 0, "context_window": 262144, - "default_max_tokens": 26214, + "default_max_tokens": 131072, "can_reason": true, "reasoning_levels": [ "low", @@ -1661,9 +1668,9 @@ "cost_per_1m_in": 0.09999999999999999, "cost_per_1m_out": 0.39999999999999997, "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0.03, + "cost_per_1m_out_cached": 0.024999999999999998, "context_window": 1047576, - "default_max_tokens": 104757, + "default_max_tokens": 16384, "can_reason": false, "supports_attachments": true, "options": {} @@ -1930,9 +1937,9 @@ "cost_per_1m_in": 1.25, "cost_per_1m_out": 10, "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0.125, + "cost_per_1m_out_cached": 0.13, "context_window": 128000, - "default_max_tokens": 8192, + "default_max_tokens": 16000, "can_reason": false, "supports_attachments": true, "options": {} @@ -1981,9 +1988,9 @@ "cost_per_1m_in": 0.25, "cost_per_1m_out": 2, "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0.024999999999999998, + "cost_per_1m_out_cached": 0.03, "context_window": 400000, - "default_max_tokens": 50000, + "default_max_tokens": 64000, "can_reason": true, "reasoning_levels": [ "low", @@ -2086,12 +2093,12 @@ { "id": "openai/gpt-oss-120b", "name": "OpenAI: gpt-oss-120b", - "cost_per_1m_in": 0.049999999999999996, - "cost_per_1m_out": 0.44999999999999996, + "cost_per_1m_in": 0.039, + "cost_per_1m_out": 0.19, "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0.024999999999999998, + "cost_per_1m_out_cached": 0, "context_window": 131072, - "default_max_tokens": 32768, + "default_max_tokens": 13107, "can_reason": true, "reasoning_levels": [ "low", @@ -2105,12 +2112,12 @@ { "id": "openai/gpt-oss-120b:exacto", "name": "OpenAI: gpt-oss-120b (exacto)", - "cost_per_1m_in": 0.15, - "cost_per_1m_out": 0.6, + "cost_per_1m_in": 0.039, + "cost_per_1m_out": 0.19, "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0.075, + "cost_per_1m_out_cached": 0, "context_window": 131072, - "default_max_tokens": 32768, + "default_max_tokens": 13107, "can_reason": true, "reasoning_levels": [ "low", @@ -2143,10 +2150,10 @@ { "id": "openai/gpt-oss-20b", "name": "OpenAI: gpt-oss-20b", - "cost_per_1m_in": 0.03, - "cost_per_1m_out": 0.14, + "cost_per_1m_in": 0.07, + "cost_per_1m_out": 0.3, "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0, + "cost_per_1m_out_cached": 0.035, "context_window": 131072, "default_max_tokens": 13107, "can_reason": true, @@ -2533,12 +2540,12 @@ { "id": "qwen/qwen3-235b-a22b-thinking-2507", "name": "Qwen: Qwen3 235B A22B Thinking 2507", - "cost_per_1m_in": 0.11, - "cost_per_1m_out": 0.6, + "cost_per_1m_in": 0, + "cost_per_1m_out": 0, "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0.055, - "context_window": 262144, - "default_max_tokens": 131072, + "cost_per_1m_out_cached": 0, + "context_window": 131072, + "default_max_tokens": 13107, "can_reason": true, "reasoning_levels": [ "low", @@ -2552,12 +2559,12 @@ { "id": "qwen/qwen3-30b-a3b", "name": "Qwen: Qwen3 30B A3B", - "cost_per_1m_in": 0.15, - "cost_per_1m_out": 0.6, + "cost_per_1m_in": 0.13, + "cost_per_1m_out": 0.52, "cost_per_1m_in_cached": 0, "cost_per_1m_out_cached": 0, "context_window": 131072, - "default_max_tokens": 65536, + "default_max_tokens": 4096, "can_reason": true, "reasoning_levels": [ "low", @@ -2661,11 +2668,11 @@ "id": "qwen/qwen3-coder-30b-a3b-instruct", "name": "Qwen: Qwen3 Coder 30B A3B Instruct", "cost_per_1m_in": 0.07, - "cost_per_1m_out": 0.27, + "cost_per_1m_out": 0.28, "cost_per_1m_in_cached": 0, "cost_per_1m_out_cached": 0, - "context_window": 160000, - "default_max_tokens": 16384, + "context_window": 262144, + "default_max_tokens": 131072, "can_reason": false, "supports_attachments": false, "options": {} @@ -2725,12 +2732,12 @@ { "id": "qwen/qwen3-coder-next", "name": "Qwen: Qwen3 Coder Next", - "cost_per_1m_in": 0.18, - "cost_per_1m_out": 1.35, + "cost_per_1m_in": 0.12, + "cost_per_1m_out": 0.75, "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0.18, + "cost_per_1m_out_cached": 0.06, "context_window": 262144, - "default_max_tokens": 131072, + "default_max_tokens": 32768, "can_reason": false, "supports_attachments": false, "options": {} @@ -2783,8 +2790,8 @@ { "id": "qwen/qwen3-next-80b-a3b-instruct", "name": "Qwen: Qwen3 Next 80B A3B Instruct", - "cost_per_1m_in": 0.09999999999999999, - "cost_per_1m_out": 1.1, + "cost_per_1m_in": 0.15, + "cost_per_1m_out": 1.2, "cost_per_1m_in_cached": 0, "cost_per_1m_out_cached": 0, "context_window": 262144, @@ -2809,8 +2816,8 @@ { "id": "qwen/qwen3-next-80b-a3b-thinking", "name": "Qwen: Qwen3 Next 80B A3B Thinking", - "cost_per_1m_in": 0.3, - "cost_per_1m_out": 0.3, + "cost_per_1m_in": 0.15, + "cost_per_1m_out": 1.2, "cost_per_1m_in_cached": 0, "cost_per_1m_out_cached": 0, "context_window": 262144, @@ -2841,12 +2848,12 @@ { "id": "qwen/qwen3-vl-235b-a22b-thinking", "name": "Qwen: Qwen3 VL 235B A22B Thinking", - "cost_per_1m_in": 0, - "cost_per_1m_out": 0, + "cost_per_1m_in": 0.44999999999999996, + "cost_per_1m_out": 3.5, "cost_per_1m_in_cached": 0, "cost_per_1m_out_cached": 0, - "context_window": 131072, - "default_max_tokens": 16384, + "context_window": 262144, + "default_max_tokens": 131072, "can_reason": true, "reasoning_levels": [ "low", @@ -2873,12 +2880,12 @@ { "id": "qwen/qwen3-vl-30b-a3b-thinking", "name": "Qwen: Qwen3 VL 30B A3B Thinking", - "cost_per_1m_in": 0, - "cost_per_1m_out": 0, + "cost_per_1m_in": 0.29, + "cost_per_1m_out": 1, "cost_per_1m_in_cached": 0, "cost_per_1m_out_cached": 0, - "context_window": 131072, - "default_max_tokens": 16384, + "context_window": 262144, + "default_max_tokens": 131072, "can_reason": true, "reasoning_levels": [ "low", @@ -3014,11 +3021,11 @@ "id": "qwen/qwen3.5-35b-a3b", "name": "Qwen: Qwen3.5-35B-A3B", "cost_per_1m_in": 0.25, - "cost_per_1m_out": 2, + "cost_per_1m_out": 1, "cost_per_1m_in_cached": 0, "cost_per_1m_out_cached": 0, "context_window": 262144, - "default_max_tokens": 32768, + "default_max_tokens": 131072, "can_reason": true, "reasoning_levels": [ "low", @@ -3164,12 +3171,12 @@ "options": {} }, { - "id": "upstage/solar-pro-3:free", - "name": "Upstage: Solar Pro 3 (free)", - "cost_per_1m_in": 0, - "cost_per_1m_out": 0, + "id": "upstage/solar-pro-3", + "name": "Upstage: Solar Pro 3", + "cost_per_1m_in": 0.15, + "cost_per_1m_out": 0.6, "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0, + "cost_per_1m_out_cached": 0.015, "context_window": 128000, "default_max_tokens": 12800, "can_reason": true, @@ -3188,7 +3195,7 @@ "cost_per_1m_in": 0.09999999999999999, "cost_per_1m_out": 0.3, "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0.09999999999999999, + "cost_per_1m_out_cached": 0.01, "context_window": 262144, "default_max_tokens": 32768, "can_reason": true, @@ -3293,12 +3300,12 @@ { "id": "z-ai/glm-4.6", "name": "Z.ai: GLM 4.6", - "cost_per_1m_in": 0.55, - "cost_per_1m_out": 2.2, + "cost_per_1m_in": 0.39, + "cost_per_1m_out": 1.9, "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0.11, + "cost_per_1m_out_cached": 0, "context_window": 204800, - "default_max_tokens": 65536, + "default_max_tokens": 102400, "can_reason": true, "reasoning_levels": [ "low", @@ -3312,12 +3319,12 @@ { "id": "z-ai/glm-4.6:exacto", "name": "Z.ai: GLM 4.6 (exacto)", - "cost_per_1m_in": 0.6, - "cost_per_1m_out": 2.2, + "cost_per_1m_in": 0.44, + "cost_per_1m_out": 1.76, "cost_per_1m_in_cached": 0, "cost_per_1m_out_cached": 0.11, - "context_window": 200000, - "default_max_tokens": 64000, + "context_window": 204800, + "default_max_tokens": 65536, "can_reason": true, "reasoning_levels": [ "low", @@ -3369,10 +3376,10 @@ { "id": "z-ai/glm-4.7-flash", "name": "Z.ai: GLM 4.7 Flash", - "cost_per_1m_in": 0.06, - "cost_per_1m_out": 0.39999999999999997, + "cost_per_1m_in": 0.09999999999999999, + "cost_per_1m_out": 0.43, "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0.0100000002, + "cost_per_1m_out_cached": 0, "context_window": 202752, "default_max_tokens": 20275, "can_reason": true, @@ -3407,10 +3414,10 @@ { "id": "x-ai/grok-3", "name": "xAI: Grok 3", - "cost_per_1m_in": 5, - "cost_per_1m_out": 25, + "cost_per_1m_in": 3, + "cost_per_1m_out": 15, "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 1.25, + "cost_per_1m_out_cached": 0.75, "context_window": 131072, "default_max_tokens": 13107, "can_reason": false, @@ -3420,10 +3427,10 @@ { "id": "x-ai/grok-3-beta", "name": "xAI: Grok 3 Beta", - "cost_per_1m_in": 5, - "cost_per_1m_out": 25, + "cost_per_1m_in": 3, + "cost_per_1m_out": 15, "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 1.25, + "cost_per_1m_out_cached": 0.75, "context_window": 131072, "default_max_tokens": 13107, "can_reason": false,