diff --git a/internal/providers/configs/huggingface.json b/internal/providers/configs/huggingface.json index 8c9c824797c3b69e0a414ca8671721e65b8b93d9..d3f3a8e4bf701c0d40a4fa07e067c55c173deede 100644 --- a/internal/providers/configs/huggingface.json +++ b/internal/providers/configs/huggingface.json @@ -7,19 +7,6 @@ "default_large_model_id": "moonshotai/Kimi-K2-Instruct-0905:groq", "default_small_model_id": "openai/gpt-oss-20b:groq", "models": [ - { - "id": "MiniMaxAI/MiniMax-M2.1:fireworks-ai", - "name": "MiniMaxAI/MiniMax-M2.1 (fireworks-ai)", - "cost_per_1m_in": 0, - "cost_per_1m_out": 0, - "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0, - "context_window": 204800, - "default_max_tokens": 8192, - "can_reason": false, - "supports_attachments": false, - "options": {} - }, { "id": "MiniMaxAI/MiniMax-M2.5:fireworks-ai", "name": "MiniMaxAI/MiniMax-M2.5 (fireworks-ai)", @@ -46,19 +33,6 @@ "supports_attachments": false, "options": {} }, - { - "id": "Qwen/Qwen3-8B:fireworks-ai", - "name": "Qwen/Qwen3-8B (fireworks-ai)", - "cost_per_1m_in": 0, - "cost_per_1m_out": 0, - "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0, - "context_window": 40960, - "default_max_tokens": 8192, - "can_reason": false, - "supports_attachments": false, - "options": {} - }, { "id": "Qwen/Qwen3-VL-30B-A3B-Instruct:fireworks-ai", "name": "Qwen/Qwen3-VL-30B-A3B-Instruct (fireworks-ai)", @@ -150,19 +124,6 @@ "supports_attachments": false, "options": {} }, - { - "id": "moonshotai/Kimi-K2-Instruct-0905:fireworks-ai", - "name": "moonshotai/Kimi-K2-Instruct-0905 (fireworks-ai)", - "cost_per_1m_in": 0, - "cost_per_1m_out": 0, - "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0, - "context_window": 262144, - "default_max_tokens": 8192, - "can_reason": false, - "supports_attachments": false, - "options": {} - }, { "id": "moonshotai/Kimi-K2-Instruct-0905:groq", "name": "moonshotai/Kimi-K2-Instruct-0905 (groq)", @@ -280,19 +241,6 @@ "supports_attachments": false, "options": {} }, - { - "id": "zai-org/GLM-4.7:fireworks-ai", - "name": "zai-org/GLM-4.7 (fireworks-ai)", - "cost_per_1m_in": 0, - "cost_per_1m_out": 0, - "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0, - "context_window": 202752, - "default_max_tokens": 8192, - "can_reason": false, - "supports_attachments": false, - "options": {} - }, { "id": "zai-org/GLM-5:fireworks-ai", "name": "zai-org/GLM-5 (fireworks-ai)", diff --git a/internal/providers/configs/openrouter.json b/internal/providers/configs/openrouter.json index a0fa260fad21915ea1cc80f0b9c48b7c8e5a3e66..968a25ef7ade70cca5ed8a36105d73107b199c5c 100644 --- a/internal/providers/configs/openrouter.json +++ b/internal/providers/configs/openrouter.json @@ -151,7 +151,7 @@ "cost_per_1m_in_cached": 3.75, "cost_per_1m_out_cached": 0.3, "context_window": 200000, - "default_max_tokens": 64000, + "default_max_tokens": 32000, "can_reason": true, "reasoning_levels": [ "low", @@ -467,6 +467,25 @@ "supports_attachments": true, "options": {} }, + { + "id": "bytedance-seed/seed-2.0-lite", + "name": "ByteDance Seed: Seed-2.0-Lite", + "cost_per_1m_in": 0.25, + "cost_per_1m_out": 2, + "cost_per_1m_in_cached": 0, + "cost_per_1m_out_cached": 0, + "context_window": 262144, + "default_max_tokens": 65536, + "can_reason": true, + "reasoning_levels": [ + "low", + "medium", + "high" + ], + "default_reasoning_effort": "medium", + "supports_attachments": true, + "options": {} + }, { "id": "bytedance-seed/seed-2.0-mini", "name": "ByteDance Seed: Seed-2.0-Mini", @@ -547,12 +566,12 @@ { "id": "deepseek/deepseek-chat-v3.1", "name": "DeepSeek: DeepSeek V3.1", - "cost_per_1m_in": 0.2, - "cost_per_1m_out": 0.8, + "cost_per_1m_in": 0.21, + "cost_per_1m_out": 0.79, "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0.1, + "cost_per_1m_out_cached": 0.13, "context_window": 163840, - "default_max_tokens": 32768, + "default_max_tokens": 16384, "can_reason": true, "reasoning_levels": [ "low", @@ -566,29 +585,10 @@ { "id": "deepseek/deepseek-v3.1-terminus", "name": "DeepSeek: DeepSeek V3.1 Terminus", - "cost_per_1m_in": 0.23, - "cost_per_1m_out": 0.9, - "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0.115, - "context_window": 163840, - "default_max_tokens": 32768, - "can_reason": true, - "reasoning_levels": [ - "low", - "medium", - "high" - ], - "default_reasoning_effort": "medium", - "supports_attachments": false, - "options": {} - }, - { - "id": "deepseek/deepseek-v3.1-terminus:exacto", - "name": "DeepSeek: DeepSeek V3.1 Terminus (exacto)", "cost_per_1m_in": 0.21, "cost_per_1m_out": 0.79, "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0.168, + "cost_per_1m_out_cached": 0.13, "context_window": 163840, "default_max_tokens": 16384, "can_reason": true, @@ -609,7 +609,7 @@ "cost_per_1m_in_cached": 0, "cost_per_1m_out_cached": 0.13, "context_window": 163840, - "default_max_tokens": 16384, + "default_max_tokens": 81920, "can_reason": true, "reasoning_levels": [ "low", @@ -838,7 +838,7 @@ "cost_per_1m_in_cached": 0.08333, "cost_per_1m_out_cached": 0.05, "context_window": 1048576, - "default_max_tokens": 32768, + "default_max_tokens": 32767, "can_reason": true, "reasoning_levels": [ "low", @@ -1043,7 +1043,7 @@ "cost_per_1m_in_cached": 0, "cost_per_1m_out_cached": 0, "context_window": 131072, - "default_max_tokens": 13107, + "default_max_tokens": 8192, "can_reason": false, "supports_attachments": false, "options": {} @@ -1051,12 +1051,12 @@ { "id": "meta-llama/llama-3.3-70b-instruct", "name": "Meta: Llama 3.3 70B Instruct", - "cost_per_1m_in": 0.25, - "cost_per_1m_out": 0.75, + "cost_per_1m_in": 0.59, + "cost_per_1m_out": 0.79, "cost_per_1m_in_cached": 0, "cost_per_1m_out_cached": 0, "context_window": 131072, - "default_max_tokens": 13107, + "default_max_tokens": 16384, "can_reason": false, "supports_attachments": false, "options": {} @@ -1077,12 +1077,12 @@ { "id": "meta-llama/llama-4-maverick", "name": "Meta: Llama 4 Maverick", - "cost_per_1m_in": 0.35, - "cost_per_1m_out": 1.15, + "cost_per_1m_in": 0.27, + "cost_per_1m_out": 0.85, "cost_per_1m_in_cached": 0, "cost_per_1m_out_cached": 0, - "context_window": 524288, - "default_max_tokens": 4096, + "context_window": 1048576, + "default_max_tokens": 104857, "can_reason": false, "supports_attachments": true, "options": {} @@ -1142,7 +1142,7 @@ "id": "minimax/minimax-m2.1", "name": "MiniMax: MiniMax M2.1", "cost_per_1m_in": 0.3, - "cost_per_1m_out": 2.4, + "cost_per_1m_out": 1.2, "cost_per_1m_in_cached": 0, "cost_per_1m_out_cached": 0.03, "context_window": 204800, @@ -1301,7 +1301,7 @@ "cost_per_1m_in_cached": 0, "cost_per_1m_out_cached": 0, "context_window": 262144, - "default_max_tokens": 26214, + "default_max_tokens": 131072, "can_reason": false, "supports_attachments": true, "options": {} @@ -1465,12 +1465,12 @@ { "id": "moonshotai/kimi-k2", "name": "MoonshotAI: Kimi K2 0711", - "cost_per_1m_in": 0.6, - "cost_per_1m_out": 2.5, + "cost_per_1m_in": 0.55, + "cost_per_1m_out": 2.2, "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0.15, - "context_window": 131072, - "default_max_tokens": 13107, + "cost_per_1m_out_cached": 0, + "context_window": 131000, + "default_max_tokens": 13100, "can_reason": false, "supports_attachments": false, "options": {} @@ -1481,22 +1481,9 @@ "cost_per_1m_in": 0.6, "cost_per_1m_out": 2.5, "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0.3, - "context_window": 262144, - "default_max_tokens": 26214, - "can_reason": false, - "supports_attachments": false, - "options": {} - }, - { - "id": "moonshotai/kimi-k2-0905:exacto", - "name": "MoonshotAI: Kimi K2 0905 (exacto)", - "cost_per_1m_in": 1.15, - "cost_per_1m_out": 8, - "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0.15, + "cost_per_1m_out_cached": 0, "context_window": 262144, - "default_max_tokens": 26214, + "default_max_tokens": 131072, "can_reason": false, "supports_attachments": false, "options": {} @@ -1523,10 +1510,10 @@ { "id": "moonshotai/kimi-k2.5", "name": "MoonshotAI: Kimi K2.5", - "cost_per_1m_in": 0.5, - "cost_per_1m_out": 2.5, + "cost_per_1m_in": 0.6, + "cost_per_1m_out": 3, "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0, + "cost_per_1m_out_cached": 0.1, "context_window": 262144, "default_max_tokens": 26214, "can_reason": true, @@ -2000,7 +1987,7 @@ "cost_per_1m_in": 1.25, "cost_per_1m_out": 10, "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0.125, + "cost_per_1m_out_cached": 0.13, "context_window": 400000, "default_max_tokens": 64000, "can_reason": true, @@ -2242,25 +2229,6 @@ "supports_attachments": false, "options": {} }, - { - "id": "openai/gpt-oss-120b:exacto", - "name": "OpenAI: gpt-oss-120b (exacto)", - "cost_per_1m_in": 0.039, - "cost_per_1m_out": 0.19, - "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0, - "context_window": 131072, - "default_max_tokens": 13107, - "can_reason": true, - "reasoning_levels": [ - "low", - "medium", - "high" - ], - "default_reasoning_effort": "medium", - "supports_attachments": false, - "options": {} - }, { "id": "openai/gpt-oss-120b:free", "name": "OpenAI: gpt-oss-120b (free)", @@ -2283,12 +2251,12 @@ { "id": "openai/gpt-oss-20b", "name": "OpenAI: gpt-oss-20b", - "cost_per_1m_in": 0.03, - "cost_per_1m_out": 0.14, + "cost_per_1m_in": 0.045, + "cost_per_1m_out": 0.18, "cost_per_1m_in_cached": 0, "cost_per_1m_out_cached": 0, "context_window": 131072, - "default_max_tokens": 13107, + "default_max_tokens": 16384, "can_reason": true, "reasoning_levels": [ "low", @@ -2522,6 +2490,25 @@ "supports_attachments": false, "options": {} }, + { + "id": "qwen/qwq-32b", + "name": "Qwen: QwQ 32B", + "cost_per_1m_in": 0.15, + "cost_per_1m_out": 0.58, + "cost_per_1m_in_cached": 0, + "cost_per_1m_out_cached": 0, + "context_window": 131072, + "default_max_tokens": 65536, + "can_reason": true, + "reasoning_levels": [ + "low", + "medium", + "high" + ], + "default_reasoning_effort": "medium", + "supports_attachments": false, + "options": {} + }, { "id": "qwen/qwen-plus-2025-07-28", "name": "Qwen: Qwen Plus 0728", @@ -2622,12 +2609,12 @@ { "id": "qwen/qwen3-14b", "name": "Qwen: Qwen3 14B", - "cost_per_1m_in": 0.2275, - "cost_per_1m_out": 0.91, + "cost_per_1m_in": 0.12, + "cost_per_1m_out": 0.24, "cost_per_1m_in_cached": 0, "cost_per_1m_out_cached": 0, - "context_window": 131072, - "default_max_tokens": 4096, + "context_window": 40960, + "default_max_tokens": 20480, "can_reason": true, "reasoning_levels": [ "low", @@ -2660,12 +2647,12 @@ { "id": "qwen/qwen3-235b-a22b-2507", "name": "Qwen: Qwen3 235B A22B Instruct 2507", - "cost_per_1m_in": 0.2, - "cost_per_1m_out": 0.8, + "cost_per_1m_in": 0.22, + "cost_per_1m_out": 0.88, "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0.2, + "cost_per_1m_out_cached": 0, "context_window": 262144, - "default_max_tokens": 131072, + "default_max_tokens": 8192, "can_reason": false, "supports_attachments": false, "options": {} @@ -2724,11 +2711,11 @@ { "id": "qwen/qwen3-32b", "name": "Qwen: Qwen3 32B", - "cost_per_1m_in": 0.104, - "cost_per_1m_out": 0.416, + "cost_per_1m_in": 0.08, + "cost_per_1m_out": 0.28, "cost_per_1m_in_cached": 0, "cost_per_1m_out_cached": 0, - "context_window": 131072, + "context_window": 40960, "default_max_tokens": 4096, "can_reason": true, "reasoning_levels": [ @@ -2795,24 +2782,11 @@ "id": "qwen/qwen3-coder", "name": "Qwen: Qwen3 Coder 480B A35B", "cost_per_1m_in": 0.22, - "cost_per_1m_out": 1.8, - "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0, - "context_window": 262144, - "default_max_tokens": 32768, - "can_reason": false, - "supports_attachments": false, - "options": {} - }, - { - "id": "qwen/qwen3-coder:exacto", - "name": "Qwen: Qwen3 Coder 480B A35B (exacto)", - "cost_per_1m_in": 0.22, - "cost_per_1m_out": 1.8, + "cost_per_1m_out": 1, "cost_per_1m_in_cached": 0, "cost_per_1m_out_cached": 0.022, "context_window": 262144, - "default_max_tokens": 32768, + "default_max_tokens": 26214, "can_reason": false, "supports_attachments": false, "options": {} @@ -2904,8 +2878,8 @@ { "id": "qwen/qwen3-next-80b-a3b-instruct", "name": "Qwen: Qwen3 Next 80B A3B Instruct", - "cost_per_1m_in": 0.15, - "cost_per_1m_out": 1.2, + "cost_per_1m_in": 0.1, + "cost_per_1m_out": 1.1, "cost_per_1m_in_cached": 0, "cost_per_1m_out_cached": 0, "context_window": 262144, @@ -2949,8 +2923,8 @@ { "id": "qwen/qwen3-vl-235b-a22b-instruct", "name": "Qwen: Qwen3 VL 235B A22B Instruct", - "cost_per_1m_in": 0.26, - "cost_per_1m_out": 1.04, + "cost_per_1m_in": 0.21, + "cost_per_1m_out": 1.9, "cost_per_1m_in_cached": 0, "cost_per_1m_out_cached": 0, "context_window": 131072, @@ -2994,12 +2968,12 @@ { "id": "qwen/qwen3-vl-30b-a3b-thinking", "name": "Qwen: Qwen3 VL 30B A3B Thinking", - "cost_per_1m_in": 0, - "cost_per_1m_out": 0, + "cost_per_1m_in": 0.29, + "cost_per_1m_out": 1, "cost_per_1m_in_cached": 0, "cost_per_1m_out_cached": 0, - "context_window": 131072, - "default_max_tokens": 16384, + "context_window": 262144, + "default_max_tokens": 131072, "can_reason": true, "reasoning_levels": [ "low", @@ -3096,10 +3070,10 @@ { "id": "qwen/qwen3.5-122b-a10b", "name": "Qwen: Qwen3.5-122B-A10B", - "cost_per_1m_in": 0.3, - "cost_per_1m_out": 2.4, + "cost_per_1m_in": 0.26, + "cost_per_1m_out": 2.08, "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0.3, + "cost_per_1m_out_cached": 0, "context_window": 262144, "default_max_tokens": 32768, "can_reason": true, @@ -3115,8 +3089,8 @@ { "id": "qwen/qwen3.5-27b", "name": "Qwen: Qwen3.5-27B", - "cost_per_1m_in": 0.3, - "cost_per_1m_out": 2.4, + "cost_per_1m_in": 0.195, + "cost_per_1m_out": 1.56, "cost_per_1m_in_cached": 0, "cost_per_1m_out_cached": 0, "context_window": 262144, @@ -3134,12 +3108,12 @@ { "id": "qwen/qwen3.5-35b-a3b", "name": "Qwen: Qwen3.5-35B-A3B", - "cost_per_1m_in": 0.25, - "cost_per_1m_out": 1, + "cost_per_1m_in": 0.225, + "cost_per_1m_out": 1.8, "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0, + "cost_per_1m_out_cached": 0.225, "context_window": 262144, - "default_max_tokens": 131072, + "default_max_tokens": 32768, "can_reason": true, "reasoning_levels": [ "low", @@ -3433,31 +3407,12 @@ { "id": "z-ai/glm-4.6", "name": "Z.ai: GLM 4.6", - "cost_per_1m_in": 0.55, - "cost_per_1m_out": 2.2, + "cost_per_1m_in": 0.39, + "cost_per_1m_out": 1.9, "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0.11, + "cost_per_1m_out_cached": 0, "context_window": 204800, - "default_max_tokens": 65536, - "can_reason": true, - "reasoning_levels": [ - "low", - "medium", - "high" - ], - "default_reasoning_effort": "medium", - "supports_attachments": false, - "options": {} - }, - { - "id": "z-ai/glm-4.6:exacto", - "name": "Z.ai: GLM 4.6 (exacto)", - "cost_per_1m_in": 0.6, - "cost_per_1m_out": 2.2, - "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0.11, - "context_window": 200000, - "default_max_tokens": 64000, + "default_max_tokens": 102400, "can_reason": true, "reasoning_levels": [ "low", @@ -3476,7 +3431,7 @@ "cost_per_1m_in_cached": 0, "cost_per_1m_out_cached": 0, "context_window": 131072, - "default_max_tokens": 13107, + "default_max_tokens": 65536, "can_reason": true, "reasoning_levels": [ "low", @@ -3509,10 +3464,10 @@ { "id": "z-ai/glm-4.7-flash", "name": "Z.ai: GLM 4.7 Flash", - "cost_per_1m_in": 0.1, - "cost_per_1m_out": 0.43, + "cost_per_1m_in": 0.06, + "cost_per_1m_out": 0.4, "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0, + "cost_per_1m_out_cached": 0.01, "context_window": 202752, "default_max_tokens": 20275, "can_reason": true, @@ -3528,11 +3483,11 @@ { "id": "z-ai/glm-5", "name": "Z.ai: GLM 5", - "cost_per_1m_in": 0.95, - "cost_per_1m_out": 2.55, + "cost_per_1m_in": 1, + "cost_per_1m_out": 3.2, "cost_per_1m_in_cached": 0, "cost_per_1m_out_cached": 0.2, - "context_window": 204800, + "context_window": 202800, "default_max_tokens": 65536, "can_reason": true, "reasoning_levels": [ @@ -3547,10 +3502,10 @@ { "id": "x-ai/grok-3", "name": "xAI: Grok 3", - "cost_per_1m_in": 3, - "cost_per_1m_out": 15, + "cost_per_1m_in": 5, + "cost_per_1m_out": 25, "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0.75, + "cost_per_1m_out_cached": 1.25, "context_window": 131072, "default_max_tokens": 13107, "can_reason": false, @@ -3560,10 +3515,10 @@ { "id": "x-ai/grok-3-beta", "name": "xAI: Grok 3 Beta", - "cost_per_1m_in": 3, - "cost_per_1m_out": 15, + "cost_per_1m_in": 5, + "cost_per_1m_out": 25, "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0.75, + "cost_per_1m_out_cached": 1.25, "context_window": 131072, "default_max_tokens": 13107, "can_reason": false, diff --git a/internal/providers/configs/synthetic.json b/internal/providers/configs/synthetic.json index 4b893ff14aa6b9de45e43be4779697cee1e8f9f3..4533d0eb0bef431ac58a63f8c55298e305b2f477 100644 --- a/internal/providers/configs/synthetic.json +++ b/internal/providers/configs/synthetic.json @@ -253,11 +253,11 @@ "id": "hf:Qwen/Qwen3.5-397B-A17B", "name": "Qwen3.5 397B A17B", "cost_per_1m_in": 0.6, - "cost_per_1m_out": 3, + "cost_per_1m_out": 3.6, "cost_per_1m_in_cached": 0.6, "cost_per_1m_out_cached": 0.6, "context_window": 262144, - "default_max_tokens": 32768, + "default_max_tokens": 26214, "can_reason": false, "supports_attachments": true, "options": {} diff --git a/internal/providers/configs/venice.json b/internal/providers/configs/venice.json index ccd34fe0b621211789e35a328775a1d520e27a7b..eca1fcbe4fc35322c65f748cc9f8f0afbbe399e8 100644 --- a/internal/providers/configs/venice.json +++ b/internal/providers/configs/venice.json @@ -141,8 +141,8 @@ "cost_per_1m_out": 0.8, "cost_per_1m_in_cached": 0, "cost_per_1m_out_cached": 0, - "context_window": 128000, - "default_max_tokens": 32000, + "context_window": 200000, + "default_max_tokens": 32768, "can_reason": true, "reasoning_levels": [ "low",