From a963b8c8c2d0885363e4620270941e48895cf50f Mon Sep 17 00:00:00 2001 From: Charm <124303983+charmcli@users.noreply.github.com> Date: Thu, 9 Apr 2026 03:09:48 +0000 Subject: [PATCH] chore: auto-update generated files --- internal/providers/configs/avian.json | 2 +- internal/providers/configs/chutes.json | 18 ++ internal/providers/configs/huggingface.json | 36 ++++ internal/providers/configs/ionet.json | 2 +- internal/providers/configs/openrouter.json | 220 +++++++------------- internal/providers/configs/venice.json | 128 +++++++++++- internal/providers/configs/vercel.json | 12 -- 7 files changed, 257 insertions(+), 161 deletions(-) diff --git a/internal/providers/configs/avian.json b/internal/providers/configs/avian.json index 87f805414d5dc9157ec15225f99044309c2bfaee..558aaa5f2cd21222cdf78e7d1429f66ec83dc0a4 100644 --- a/internal/providers/configs/avian.json +++ b/internal/providers/configs/avian.json @@ -42,7 +42,7 @@ "name": "GLM-5.1", "cost_per_1m_in": 1, "cost_per_1m_out": 3.2, - "cost_per_1m_in_cached": 0, + "cost_per_1m_in_cached": 0.2, "cost_per_1m_out_cached": 0, "context_window": 202752, "default_max_tokens": 202752, diff --git a/internal/providers/configs/chutes.json b/internal/providers/configs/chutes.json index f836e90ade1e248112347e3bab8321452cd2e2b4..14ec43c2ed74ada3afb02fdd0400f40f108b0d63 100644 --- a/internal/providers/configs/chutes.json +++ b/internal/providers/configs/chutes.json @@ -265,6 +265,24 @@ "default_reasoning_effort": "medium", "supports_attachments": false }, + { + "id": "zai-org/GLM-5.1-TEE", + "name": "GLM-5.1-TEE", + "cost_per_1m_in": 0.95, + "cost_per_1m_out": 3.15, + "cost_per_1m_in_cached": 0.475, + "cost_per_1m_out_cached": 0, + "context_window": 202752, + "default_max_tokens": 65535, + "can_reason": true, + "reasoning_levels": [ + "low", + "medium", + "high" + ], + "default_reasoning_effort": "medium", + "supports_attachments": false + }, { "id": "NousResearch/Hermes-4-14B", "name": "Hermes-4-14B", diff --git a/internal/providers/configs/huggingface.json b/internal/providers/configs/huggingface.json index 082fbff22f289394900145503470a98b0281b5bc..8538eeace5cc6217656fea1f526a17b145be877f 100644 --- a/internal/providers/configs/huggingface.json +++ b/internal/providers/configs/huggingface.json @@ -7,6 +7,30 @@ "default_large_model_id": "moonshotai/Kimi-K2.5:fireworks-ai", "default_small_model_id": "openai/gpt-oss-20b:groq", "models": [ + { + "id": "MiniMaxAI/MiniMax-M2.1:fireworks-ai", + "name": "MiniMaxAI/MiniMax-M2.1 (fireworks-ai)", + "cost_per_1m_in": 0, + "cost_per_1m_out": 0, + "cost_per_1m_in_cached": 0, + "cost_per_1m_out_cached": 0, + "context_window": 204800, + "default_max_tokens": 8192, + "can_reason": false, + "supports_attachments": false + }, + { + "id": "MiniMaxAI/MiniMax-M2.5:fireworks-ai", + "name": "MiniMaxAI/MiniMax-M2.5 (fireworks-ai)", + "cost_per_1m_in": 0, + "cost_per_1m_out": 0, + "cost_per_1m_in_cached": 0, + "cost_per_1m_out_cached": 0, + "context_window": 204800, + "default_max_tokens": 8192, + "can_reason": false, + "supports_attachments": false + }, { "id": "Qwen/Qwen3-235B-A22B-Instruct-2507:cerebras", "name": "Qwen/Qwen3-235B-A22B-Instruct-2507 (cerebras)", @@ -258,6 +282,18 @@ "default_max_tokens": 8192, "can_reason": false, "supports_attachments": false + }, + { + "id": "zai-org/GLM-5.1:fireworks-ai", + "name": "zai-org/GLM-5.1 (fireworks-ai)", + "cost_per_1m_in": 0, + "cost_per_1m_out": 0, + "cost_per_1m_in_cached": 0, + "cost_per_1m_out_cached": 0, + "context_window": 202752, + "default_max_tokens": 8192, + "can_reason": false, + "supports_attachments": false } ], "default_headers": { diff --git a/internal/providers/configs/ionet.json b/internal/providers/configs/ionet.json index d9c2d5a55ca54769390a504beec73ca17b452416..9eb44d5ef2a2fe882756b090ac5cfd1d3666b242 100644 --- a/internal/providers/configs/ionet.json +++ b/internal/providers/configs/ionet.json @@ -232,7 +232,7 @@ { "id": "zai-org/GLM-5.1", "name": "Z.ai: GLM 5.1", - "cost_per_1m_in": 1.4, + "cost_per_1m_in": 1.395, "cost_per_1m_out": 4.4, "cost_per_1m_in_cached": 0.26, "cost_per_1m_out_cached": 0, diff --git a/internal/providers/configs/openrouter.json b/internal/providers/configs/openrouter.json index f5ba4e712f8d65a457236f4e7c3db16a5622343a..596bdf07ead4ad95b30596541e7988e9583e8e12 100644 --- a/internal/providers/configs/openrouter.json +++ b/internal/providers/configs/openrouter.json @@ -607,9 +607,9 @@ "cost_per_1m_in": 0.27, "cost_per_1m_out": 0.41, "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0, + "cost_per_1m_out_cached": 0.27, "context_window": 163840, - "default_max_tokens": 32768, + "default_max_tokens": 81920, "can_reason": true, "reasoning_levels": [ "low", @@ -874,12 +874,12 @@ { "id": "google/gemma-4-26b-a4b-it", "name": "Google: Gemma 4 26B A4B ", - "cost_per_1m_in": 0.13, - "cost_per_1m_out": 0.4, + "cost_per_1m_in": 0.1625, + "cost_per_1m_out": 0.5, "cost_per_1m_in_cached": 0, "cost_per_1m_out_cached": 0, - "context_window": 262144, - "default_max_tokens": 65536, + "context_window": 256000, + "default_max_tokens": 4096, "can_reason": true, "reasoning_levels": [ "low", @@ -992,8 +992,8 @@ "cost_per_1m_out": 1.2, "cost_per_1m_in_cached": 0, "cost_per_1m_out_cached": 0.06, - "context_window": 256000, - "default_max_tokens": 40000, + "context_window": 262144, + "default_max_tokens": 72000, "can_reason": false, "supports_attachments": false }, @@ -1024,12 +1024,12 @@ { "id": "meta-llama/llama-3.3-70b-instruct", "name": "Meta: Llama 3.3 70B Instruct", - "cost_per_1m_in": 0.25, - "cost_per_1m_out": 0.75, + "cost_per_1m_in": 0.135, + "cost_per_1m_out": 0.4, "cost_per_1m_in_cached": 0, "cost_per_1m_out_cached": 0, "context_window": 131072, - "default_max_tokens": 13107, + "default_max_tokens": 60000, "can_reason": false, "supports_attachments": false }, @@ -1069,33 +1069,15 @@ "can_reason": false, "supports_attachments": true }, - { - "id": "minimax/minimax-m1", - "name": "MiniMax: MiniMax M1", - "cost_per_1m_in": 0.44, - "cost_per_1m_out": 1.76, - "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0, - "context_window": 1000000, - "default_max_tokens": 20000, - "can_reason": true, - "reasoning_levels": [ - "low", - "medium", - "high" - ], - "default_reasoning_effort": "medium", - "supports_attachments": false - }, { "id": "minimax/minimax-m2", "name": "MiniMax: MiniMax M2", - "cost_per_1m_in": 0.255, - "cost_per_1m_out": 1, + "cost_per_1m_in": 0.3, + "cost_per_1m_out": 1.2, "cost_per_1m_in_cached": 0, "cost_per_1m_out_cached": 0.03, - "context_window": 196608, - "default_max_tokens": 98304, + "context_window": 204800, + "default_max_tokens": 65536, "can_reason": true, "reasoning_levels": [ "low", @@ -1126,12 +1108,12 @@ { "id": "minimax/minimax-m2.5", "name": "MiniMax: MiniMax M2.5", - "cost_per_1m_in": 0.6, - "cost_per_1m_out": 2.4, + "cost_per_1m_in": 0.34, + "cost_per_1m_out": 1.19, "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0.06, - "context_window": 204800, - "default_max_tokens": 65536, + "cost_per_1m_out_cached": 0.04, + "context_window": 198000, + "default_max_tokens": 16384, "can_reason": true, "reasoning_levels": [ "low", @@ -1276,12 +1258,12 @@ { "id": "mistralai/ministral-3b-2512", "name": "Mistral: Ministral 3 3B 2512", - "cost_per_1m_in": 0.1, - "cost_per_1m_out": 0.1, + "cost_per_1m_in": 0.35, + "cost_per_1m_out": 0.35, "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0.01, + "cost_per_1m_out_cached": 0, "context_window": 131072, - "default_max_tokens": 13107, + "default_max_tokens": 65536, "can_reason": false, "supports_attachments": true }, @@ -1462,24 +1444,24 @@ { "id": "moonshotai/kimi-k2-0905", "name": "MoonshotAI: Kimi K2 0905", - "cost_per_1m_in": 0.6, - "cost_per_1m_out": 2.5, + "cost_per_1m_in": 1, + "cost_per_1m_out": 3, "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0, + "cost_per_1m_out_cached": 0.5, "context_window": 262144, - "default_max_tokens": 131072, + "default_max_tokens": 8192, "can_reason": false, "supports_attachments": false }, { "id": "moonshotai/kimi-k2-thinking", "name": "MoonshotAI: Kimi K2 Thinking", - "cost_per_1m_in": 0.47, - "cost_per_1m_out": 2, + "cost_per_1m_in": 0.6, + "cost_per_1m_out": 2.5, "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0.141, - "context_window": 131072, - "default_max_tokens": 13107, + "cost_per_1m_out_cached": 0, + "context_window": 262144, + "default_max_tokens": 131072, "can_reason": true, "reasoning_levels": [ "low", @@ -1492,10 +1474,10 @@ { "id": "moonshotai/kimi-k2.5", "name": "MoonshotAI: Kimi K2.5", - "cost_per_1m_in": 0.45, - "cost_per_1m_out": 2.25, + "cost_per_1m_in": 0.44, + "cost_per_1m_out": 2.2, "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0.07, + "cost_per_1m_out_cached": 0.22, "context_window": 262144, "default_max_tokens": 131072, "can_reason": true, @@ -1765,9 +1747,9 @@ "cost_per_1m_in": 0.1, "cost_per_1m_out": 0.4, "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0.025, + "cost_per_1m_out_cached": 0.03, "context_window": 1047576, - "default_max_tokens": 16384, + "default_max_tokens": 104757, "can_reason": false, "supports_attachments": true }, @@ -1777,7 +1759,7 @@ "cost_per_1m_in": 2.5, "cost_per_1m_out": 10, "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 1.25, + "cost_per_1m_out_cached": 0, "context_window": 128000, "default_max_tokens": 8192, "can_reason": false, @@ -1999,7 +1981,7 @@ "cost_per_1m_in": 1.25, "cost_per_1m_out": 10, "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0.125, + "cost_per_1m_out_cached": 0.13, "context_window": 400000, "default_max_tokens": 64000, "can_reason": true, @@ -2248,12 +2230,12 @@ { "id": "openai/gpt-oss-120b", "name": "OpenAI: gpt-oss-120b", - "cost_per_1m_in": 0.09, - "cost_per_1m_out": 0.36, + "cost_per_1m_in": 0.039, + "cost_per_1m_out": 0.19, "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0.045, + "cost_per_1m_out_cached": 0, "context_window": 131072, - "default_max_tokens": 32768, + "default_max_tokens": 13107, "can_reason": true, "reasoning_levels": [ "low", @@ -2284,12 +2266,12 @@ { "id": "openai/gpt-oss-20b", "name": "OpenAI: gpt-oss-20b", - "cost_per_1m_in": 0.05, - "cost_per_1m_out": 0.2, + "cost_per_1m_in": 0.03, + "cost_per_1m_out": 0.14, "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0.05, + "cost_per_1m_out_cached": 0, "context_window": 131072, - "default_max_tokens": 65536, + "default_max_tokens": 13107, "can_reason": true, "reasoning_levels": [ "low", @@ -2635,24 +2617,6 @@ "can_reason": false, "supports_attachments": false }, - { - "id": "qwen/qwen3-14b", - "name": "Qwen: Qwen3 14B", - "cost_per_1m_in": 0.2275, - "cost_per_1m_out": 0.91, - "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0, - "context_window": 131072, - "default_max_tokens": 4096, - "can_reason": true, - "reasoning_levels": [ - "low", - "medium", - "high" - ], - "default_reasoning_effort": "medium", - "supports_attachments": false - }, { "id": "qwen/qwen3-235b-a22b", "name": "Qwen: Qwen3 235B A22B", @@ -2674,12 +2638,12 @@ { "id": "qwen/qwen3-235b-a22b-2507", "name": "Qwen: Qwen3 235B A22B Instruct 2507", - "cost_per_1m_in": 0.22, - "cost_per_1m_out": 0.88, + "cost_per_1m_in": 0.2, + "cost_per_1m_out": 0.8, "cost_per_1m_in_cached": 0, "cost_per_1m_out_cached": 0, "context_window": 262144, - "default_max_tokens": 8192, + "default_max_tokens": 131072, "can_reason": false, "supports_attachments": false }, @@ -2704,12 +2668,12 @@ { "id": "qwen/qwen3-30b-a3b", "name": "Qwen: Qwen3 30B A3B", - "cost_per_1m_in": 0.15, - "cost_per_1m_out": 0.6, + "cost_per_1m_in": 0.13, + "cost_per_1m_out": 0.52, "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0.15, + "cost_per_1m_out_cached": 0, "context_window": 131072, - "default_max_tokens": 65536, + "default_max_tokens": 4096, "can_reason": true, "reasoning_levels": [ "low", @@ -2725,9 +2689,9 @@ "cost_per_1m_in": 0.1, "cost_per_1m_out": 0.3, "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0, + "cost_per_1m_out_cached": 0.1, "context_window": 262144, - "default_max_tokens": 26214, + "default_max_tokens": 131072, "can_reason": false, "supports_attachments": false }, @@ -2890,12 +2854,12 @@ { "id": "qwen/qwen3-next-80b-a3b-instruct", "name": "Qwen: Qwen3 Next 80B A3B Instruct", - "cost_per_1m_in": 0.15, - "cost_per_1m_out": 1.2, + "cost_per_1m_in": 0.09, + "cost_per_1m_out": 1.1, "cost_per_1m_in_cached": 0, "cost_per_1m_out_cached": 0, "context_window": 262144, - "default_max_tokens": 131072, + "default_max_tokens": 26214, "can_reason": false, "supports_attachments": false }, @@ -2932,12 +2896,12 @@ { "id": "qwen/qwen3-vl-235b-a22b-instruct", "name": "Qwen: Qwen3 VL 235B A22B Instruct", - "cost_per_1m_in": 0.26, - "cost_per_1m_out": 1.04, + "cost_per_1m_in": 0.25, + "cost_per_1m_out": 1.5, "cost_per_1m_in_cached": 0, "cost_per_1m_out_cached": 0, - "context_window": 131072, - "default_max_tokens": 16384, + "context_window": 256000, + "default_max_tokens": 8192, "can_reason": false, "supports_attachments": true }, @@ -2962,12 +2926,12 @@ { "id": "qwen/qwen3-vl-30b-a3b-instruct", "name": "Qwen: Qwen3 VL 30B A3B Instruct", - "cost_per_1m_in": 0.29, - "cost_per_1m_out": 1, + "cost_per_1m_in": 0.13, + "cost_per_1m_out": 0.52, "cost_per_1m_in_cached": 0, "cost_per_1m_out_cached": 0, - "context_window": 262144, - "default_max_tokens": 131072, + "context_window": 131072, + "default_max_tokens": 16384, "can_reason": false, "supports_attachments": true }, @@ -3160,8 +3124,8 @@ { "id": "qwen/qwen3.6-plus", "name": "Qwen: Qwen3.6 Plus", - "cost_per_1m_in": 0.5, - "cost_per_1m_out": 3, + "cost_per_1m_in": 0.325, + "cost_per_1m_out": 1.95, "cost_per_1m_in_cached": 0, "cost_per_1m_out_cached": 0, "context_window": 1000000, @@ -3205,24 +3169,6 @@ "default_reasoning_effort": "medium", "supports_attachments": false }, - { - "id": "stepfun/step-3.5-flash:free", - "name": "StepFun: Step 3.5 Flash (free)", - "cost_per_1m_in": 0, - "cost_per_1m_out": 0, - "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0, - "context_window": 256000, - "default_max_tokens": 128000, - "can_reason": true, - "reasoning_levels": [ - "low", - "medium", - "high" - ], - "default_reasoning_effort": "medium", - "supports_attachments": false - }, { "id": "tngtech/deepseek-r1t2-chimera", "name": "TNG: DeepSeek R1T2 Chimera", @@ -3241,18 +3187,6 @@ "default_reasoning_effort": "medium", "supports_attachments": false }, - { - "id": "thedrummer/rocinante-12b", - "name": "TheDrummer: Rocinante 12B", - "cost_per_1m_in": 0.17, - "cost_per_1m_out": 0.43, - "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0, - "context_window": 32768, - "default_max_tokens": 16384, - "can_reason": false, - "supports_attachments": false - }, { "id": "thedrummer/unslopnemo-12b", "name": "TheDrummer: UnslopNemo 12B", @@ -3375,7 +3309,7 @@ "cost_per_1m_in_cached": 0, "cost_per_1m_out_cached": 0.11, "context_window": 131072, - "default_max_tokens": 48000, + "default_max_tokens": 49152, "can_reason": true, "reasoning_levels": [ "low", @@ -3586,10 +3520,10 @@ { "id": "x-ai/grok-3", "name": "xAI: Grok 3", - "cost_per_1m_in": 5, - "cost_per_1m_out": 25, + "cost_per_1m_in": 3, + "cost_per_1m_out": 15, "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 1.25, + "cost_per_1m_out_cached": 0.75, "context_window": 131072, "default_max_tokens": 13107, "can_reason": false, @@ -3598,10 +3532,10 @@ { "id": "x-ai/grok-3-beta", "name": "xAI: Grok 3 Beta", - "cost_per_1m_in": 5, - "cost_per_1m_out": 25, + "cost_per_1m_in": 3, + "cost_per_1m_out": 15, "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 1.25, + "cost_per_1m_out_cached": 0.75, "context_window": 131072, "default_max_tokens": 13107, "can_reason": false, diff --git a/internal/providers/configs/venice.json b/internal/providers/configs/venice.json index 49682b35db7fd9de6bbcf273162c21d9277d9614..f7dc787c4bc5a066f41c91ffbf509b4d465f8985 100644 --- a/internal/providers/configs/venice.json +++ b/internal/providers/configs/venice.json @@ -4,8 +4,8 @@ "api_key": "$VENICE_API_KEY", "api_endpoint": "https://api.venice.ai/api/v1", "type": "openai-compat", - "default_large_model_id": "claude-opus-4-6", - "default_small_model_id": "arcee-trinity-large-thinking", + "default_large_model_id": "claude-opus-4-6-fast", + "default_small_model_id": "mistral-small-2603", "models": [ { "id": "claude-opus-4-5", @@ -43,6 +43,24 @@ "default_reasoning_effort": "medium", "supports_attachments": true }, + { + "id": "claude-opus-4-6-fast", + "name": "Claude Opus 4.6 Fast", + "cost_per_1m_in": 36, + "cost_per_1m_out": 180, + "cost_per_1m_in_cached": 0, + "cost_per_1m_out_cached": 0, + "context_window": 1000000, + "default_max_tokens": 128000, + "can_reason": true, + "reasoning_levels": [ + "low", + "medium", + "high" + ], + "default_reasoning_effort": "medium", + "supports_attachments": true + }, { "id": "claude-sonnet-4-5", "name": "Claude Sonnet 4.5", @@ -157,6 +175,24 @@ "can_reason": true, "supports_attachments": false }, + { + "id": "z-ai-glm-5-turbo", + "name": "GLM 5 Turbo", + "cost_per_1m_in": 1.2, + "cost_per_1m_out": 4, + "cost_per_1m_in_cached": 0, + "cost_per_1m_out_cached": 0, + "context_window": 200000, + "default_max_tokens": 32768, + "can_reason": true, + "reasoning_levels": [ + "low", + "medium", + "high" + ], + "default_reasoning_effort": "medium", + "supports_attachments": false + }, { "id": "zai-org-glm-5-1", "name": "GLM 5.1", @@ -169,6 +205,24 @@ "can_reason": true, "supports_attachments": false }, + { + "id": "z-ai-glm-5v-turbo", + "name": "GLM 5V Turbo", + "cost_per_1m_in": 1.5, + "cost_per_1m_out": 5, + "cost_per_1m_in_cached": 0, + "cost_per_1m_out_cached": 0, + "context_window": 200000, + "default_max_tokens": 32768, + "can_reason": true, + "reasoning_levels": [ + "low", + "medium", + "high" + ], + "default_reasoning_effort": "medium", + "supports_attachments": true + }, { "id": "openai-gpt-4o-2024-11-20", "name": "GPT-4o", @@ -357,7 +411,7 @@ "cost_per_1m_in_cached": 0, "cost_per_1m_out_cached": 0, "context_window": 256000, - "default_max_tokens": 12288, + "default_max_tokens": 8192, "can_reason": true, "supports_attachments": true }, @@ -369,7 +423,7 @@ "cost_per_1m_in_cached": 0, "cost_per_1m_out_cached": 0, "context_window": 256000, - "default_max_tokens": 12288, + "default_max_tokens": 8192, "can_reason": true, "supports_attachments": true }, @@ -487,6 +541,24 @@ "can_reason": false, "supports_attachments": false }, + { + "id": "mercury-2", + "name": "Mercury 2", + "cost_per_1m_in": 0.3125, + "cost_per_1m_out": 0.9375, + "cost_per_1m_in_cached": 0, + "cost_per_1m_out_cached": 0, + "context_window": 128000, + "default_max_tokens": 50000, + "can_reason": true, + "reasoning_levels": [ + "low", + "medium", + "high" + ], + "default_reasoning_effort": "medium", + "supports_attachments": false + }, { "id": "minimax-m21", "name": "MiniMax M2.1", @@ -553,6 +625,24 @@ "can_reason": false, "supports_attachments": false }, + { + "id": "mistral-small-2603", + "name": "Mistral Small 4", + "cost_per_1m_in": 0.1875, + "cost_per_1m_out": 0.75, + "cost_per_1m_in_cached": 0, + "cost_per_1m_out_cached": 0, + "context_window": 256000, + "default_max_tokens": 65536, + "can_reason": true, + "reasoning_levels": [ + "low", + "medium", + "high" + ], + "default_reasoning_effort": "medium", + "supports_attachments": true + }, { "id": "nvidia-nemotron-3-nano-30b-a3b", "name": "NVIDIA Nemotron 3 Nano 30B", @@ -565,6 +655,18 @@ "can_reason": false, "supports_attachments": false }, + { + "id": "nvidia-nemotron-cascade-2-30b-a3b", + "name": "Nemotron Cascade 2 30B A3B", + "cost_per_1m_in": 0.14, + "cost_per_1m_out": 0.8, + "cost_per_1m_in_cached": 0, + "cost_per_1m_out_cached": 0, + "context_window": 256000, + "default_max_tokens": 32768, + "can_reason": true, + "supports_attachments": false + }, { "id": "openai-gpt-oss-120b", "name": "OpenAI GPT OSS 120B", @@ -653,6 +755,24 @@ "top_p": 0.95 } }, + { + "id": "qwen3-5-397b-a17b", + "name": "Qwen 3.5 397B", + "cost_per_1m_in": 0.75, + "cost_per_1m_out": 4.5, + "cost_per_1m_in_cached": 0, + "cost_per_1m_out_cached": 0, + "context_window": 128000, + "default_max_tokens": 32768, + "can_reason": true, + "reasoning_levels": [ + "low", + "medium", + "high" + ], + "default_reasoning_effort": "medium", + "supports_attachments": true + }, { "id": "qwen3-5-9b", "name": "Qwen 3.5 9B", diff --git a/internal/providers/configs/vercel.json b/internal/providers/configs/vercel.json index a7e6579b3e9d315f702847328f3fa6e059f5bf62..b7bdf6aaafe4580452027f7aa751943e08df0344 100644 --- a/internal/providers/configs/vercel.json +++ b/internal/providers/configs/vercel.json @@ -1216,18 +1216,6 @@ "can_reason": false, "supports_attachments": true }, - { - "id": "xai/grok-2-vision", - "name": "Grok 2 Vision", - "cost_per_1m_in": 2, - "cost_per_1m_out": 10, - "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0, - "context_window": 32768, - "default_max_tokens": 8000, - "can_reason": false, - "supports_attachments": true - }, { "id": "xai/grok-3", "name": "Grok 3 Beta",