diff --git a/internal/providers/configs/openrouter.json b/internal/providers/configs/openrouter.json index 544a0a2c0cfa0afa15712c1f9200c72cb83bcf81..f2468e0a83956ec9de1b6e7eab42a7c9b2368fa7 100644 --- a/internal/providers/configs/openrouter.json +++ b/internal/providers/configs/openrouter.json @@ -129,8 +129,8 @@ "name": "Anthropic: Claude 3.5 Sonnet", "cost_per_1m_in": 3, "cost_per_1m_out": 15, - "cost_per_1m_in_cached": 3.75, - "cost_per_1m_out_cached": 0.3, + "cost_per_1m_in_cached": 0, + "cost_per_1m_out_cached": 0, "context_window": 200000, "default_max_tokens": 4096, "can_reason": false, @@ -413,12 +413,12 @@ { "id": "deepseek/deepseek-v3.2-exp", "name": "DeepSeek: DeepSeek V3.2 Exp", - "cost_per_1m_in": 0.28, + "cost_per_1m_in": 0.27, "cost_per_1m_out": 0.39999999999999997, "cost_per_1m_in_cached": 0, "cost_per_1m_out_cached": 0, "context_window": 163840, - "default_max_tokens": 32768, + "default_max_tokens": 16384, "can_reason": true, "has_reasoning_efforts": true, "supports_attachments": false @@ -427,11 +427,11 @@ "id": "deepseek/deepseek-r1", "name": "DeepSeek: R1", "cost_per_1m_in": 0.7, - "cost_per_1m_out": 2.4, + "cost_per_1m_out": 2.5, "cost_per_1m_in_cached": 0, "cost_per_1m_out_cached": 0, - "context_window": 163840, - "default_max_tokens": 81920, + "context_window": 64000, + "default_max_tokens": 8000, "can_reason": true, "has_reasoning_efforts": true, "supports_attachments": false @@ -520,7 +520,7 @@ "cost_per_1m_in": 0.09999999999999999, "cost_per_1m_out": 0.39999999999999997, "cost_per_1m_in_cached": 0.18330000000000002, - "cost_per_1m_out_cached": 0.024999999999999998, + "cost_per_1m_out_cached": 0.01, "context_window": 1048576, "default_max_tokens": 32767, "can_reason": true, @@ -561,7 +561,7 @@ "cost_per_1m_in_cached": 0.3833, "cost_per_1m_out_cached": 0.075, "context_window": 1048576, - "default_max_tokens": 32768, + "default_max_tokens": 32767, "can_reason": true, "has_reasoning_efforts": true, "supports_attachments": true @@ -605,19 +605,6 @@ "has_reasoning_efforts": true, "supports_attachments": true }, - { - "id": "google/gemma-3-27b-it", - "name": "Google: Gemma 3 27B", - "cost_per_1m_in": 0.13, - "cost_per_1m_out": 0.52, - "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0, - "context_window": 96000, - "default_max_tokens": 48000, - "can_reason": false, - "has_reasoning_efforts": false, - "supports_attachments": true - }, { "id": "inception/mercury", "name": "Inception: Mercury", @@ -686,12 +673,12 @@ { "id": "meta-llama/llama-3.1-405b-instruct", "name": "Meta: Llama 3.1 405B Instruct", - "cost_per_1m_in": 0.7999999999999999, - "cost_per_1m_out": 0.7999999999999999, + "cost_per_1m_in": 3.5, + "cost_per_1m_out": 3.5, "cost_per_1m_in_cached": 0, "cost_per_1m_out_cached": 0, - "context_window": 32768, - "default_max_tokens": 8192, + "context_window": 130815, + "default_max_tokens": 13081, "can_reason": false, "has_reasoning_efforts": false, "supports_attachments": false @@ -738,12 +725,12 @@ { "id": "meta-llama/llama-3.3-70b-instruct", "name": "Meta: Llama 3.3 70B Instruct", - "cost_per_1m_in": 0.13, - "cost_per_1m_out": 0.38, + "cost_per_1m_in": 0.85, + "cost_per_1m_out": 1.2, "cost_per_1m_in_cached": 0, "cost_per_1m_out_cached": 0, "context_window": 131072, - "default_max_tokens": 8192, + "default_max_tokens": 16000, "can_reason": false, "has_reasoning_efforts": false, "supports_attachments": false @@ -777,12 +764,12 @@ { "id": "meta-llama/llama-4-maverick", "name": "Meta: Llama 4 Maverick", - "cost_per_1m_in": 0.15, + "cost_per_1m_in": 0.16999999999999998, "cost_per_1m_out": 0.85, "cost_per_1m_in_cached": 0, "cost_per_1m_out_cached": 0, "context_window": 1048576, - "default_max_tokens": 8192, + "default_max_tokens": 524288, "can_reason": false, "has_reasoning_efforts": false, "supports_attachments": true @@ -898,8 +885,8 @@ "cost_per_1m_out": 6, "cost_per_1m_in_cached": 0, "cost_per_1m_out_cached": 0, - "context_window": 32768, - "default_max_tokens": 3276, + "context_window": 131072, + "default_max_tokens": 13107, "can_reason": false, "has_reasoning_efforts": false, "supports_attachments": false @@ -937,8 +924,8 @@ "cost_per_1m_out": 0.8999999999999999, "cost_per_1m_in_cached": 0, "cost_per_1m_out_cached": 0, - "context_window": 32768, - "default_max_tokens": 3276, + "context_window": 262144, + "default_max_tokens": 26214, "can_reason": false, "has_reasoning_efforts": false, "supports_attachments": false @@ -1002,7 +989,7 @@ "cost_per_1m_out": 5, "cost_per_1m_in_cached": 0, "cost_per_1m_out_cached": 0, - "context_window": 32768, + "context_window": 40960, "default_max_tokens": 20000, "can_reason": true, "has_reasoning_efforts": true, @@ -1028,7 +1015,7 @@ "cost_per_1m_out": 1.5, "cost_per_1m_in_cached": 0, "cost_per_1m_out_cached": 0, - "context_window": 32768, + "context_window": 40000, "default_max_tokens": 20000, "can_reason": true, "has_reasoning_efforts": true, @@ -1093,8 +1080,8 @@ "cost_per_1m_out": 2, "cost_per_1m_in_cached": 0, "cost_per_1m_out_cached": 0, - "context_window": 32768, - "default_max_tokens": 3276, + "context_window": 131072, + "default_max_tokens": 13107, "can_reason": false, "has_reasoning_efforts": false, "supports_attachments": true @@ -1223,8 +1210,8 @@ "cost_per_1m_out": 0.15, "cost_per_1m_in_cached": 0, "cost_per_1m_out_cached": 0, - "context_window": 32768, - "default_max_tokens": 3276, + "context_window": 131072, + "default_max_tokens": 13107, "can_reason": false, "has_reasoning_efforts": false, "supports_attachments": true @@ -1236,8 +1223,8 @@ "cost_per_1m_out": 6, "cost_per_1m_in_cached": 0, "cost_per_1m_out_cached": 0, - "context_window": 32768, - "default_max_tokens": 3276, + "context_window": 131072, + "default_max_tokens": 13107, "can_reason": false, "has_reasoning_efforts": false, "supports_attachments": true @@ -1261,9 +1248,9 @@ "cost_per_1m_in": 0.6, "cost_per_1m_out": 2.5, "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0.15, + "cost_per_1m_out_cached": 0, "context_window": 131072, - "default_max_tokens": 13107, + "default_max_tokens": 8192, "can_reason": false, "has_reasoning_efforts": false, "supports_attachments": false @@ -1271,12 +1258,12 @@ { "id": "moonshotai/kimi-k2-0905", "name": "MoonshotAI: Kimi K2 0905", - "cost_per_1m_in": 0.5, - "cost_per_1m_out": 2, + "cost_per_1m_in": 0.39, + "cost_per_1m_out": 1.9, "cost_per_1m_in_cached": 0, "cost_per_1m_out_cached": 0, "context_window": 262144, - "default_max_tokens": 26214, + "default_max_tokens": 131072, "can_reason": false, "has_reasoning_efforts": false, "supports_attachments": false @@ -1372,6 +1359,32 @@ "has_reasoning_efforts": false, "supports_attachments": false }, + { + "id": "nousresearch/hermes-4-405b", + "name": "Nous: Hermes 4 405B", + "cost_per_1m_in": 0.3, + "cost_per_1m_out": 1.2, + "cost_per_1m_in_cached": 0, + "cost_per_1m_out_cached": 0, + "context_window": 131072, + "default_max_tokens": 65536, + "can_reason": true, + "has_reasoning_efforts": true, + "supports_attachments": false + }, + { + "id": "nousresearch/hermes-4-70b", + "name": "Nous: Hermes 4 70B", + "cost_per_1m_in": 0.11, + "cost_per_1m_out": 0.38, + "cost_per_1m_in_cached": 0, + "cost_per_1m_out_cached": 0, + "context_window": 131072, + "default_max_tokens": 65536, + "can_reason": true, + "has_reasoning_efforts": true, + "supports_attachments": false + }, { "id": "openai/codex-mini", "name": "OpenAI: Codex Mini", @@ -1534,7 +1547,7 @@ "cost_per_1m_in": 2.5, "cost_per_1m_out": 10, "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 1.25, + "cost_per_1m_out_cached": 0, "context_window": 128000, "default_max_tokens": 8192, "can_reason": false, @@ -1882,12 +1895,12 @@ { "id": "qwen/qwen-2.5-72b-instruct", "name": "Qwen2.5 72B Instruct", - "cost_per_1m_in": 0.07, - "cost_per_1m_out": 0.26, + "cost_per_1m_in": 0.12, + "cost_per_1m_out": 0.39, "cost_per_1m_in_cached": 0, "cost_per_1m_out_cached": 0, "context_window": 32768, - "default_max_tokens": 16384, + "default_max_tokens": 8192, "can_reason": false, "has_reasoning_efforts": false, "supports_attachments": false @@ -2022,30 +2035,17 @@ "has_reasoning_efforts": true, "supports_attachments": false }, - { - "id": "qwen/qwen3-235b-a22b:free", - "name": "Qwen: Qwen3 235B A22B (free)", - "cost_per_1m_in": 0, - "cost_per_1m_out": 0, - "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0, - "context_window": 131072, - "default_max_tokens": 13107, - "can_reason": false, - "has_reasoning_efforts": false, - "supports_attachments": false - }, { "id": "qwen/qwen3-235b-a22b-2507", "name": "Qwen: Qwen3 235B A22B Instruct 2507", - "cost_per_1m_in": 0.09999999999999999, - "cost_per_1m_out": 0.09999999999999999, + "cost_per_1m_in": 0.22, + "cost_per_1m_out": 0.7999999999999999, "cost_per_1m_in_cached": 0, "cost_per_1m_out_cached": 0, "context_window": 262144, "default_max_tokens": 131072, - "can_reason": false, - "has_reasoning_efforts": false, + "can_reason": true, + "has_reasoning_efforts": true, "supports_attachments": false }, { @@ -2077,12 +2077,12 @@ { "id": "qwen/qwen3-30b-a3b-instruct-2507", "name": "Qwen: Qwen3 30B A3B Instruct 2507", - "cost_per_1m_in": 0.09999999999999999, - "cost_per_1m_out": 0.3, + "cost_per_1m_in": 0.08, + "cost_per_1m_out": 0.33, "cost_per_1m_in_cached": 0, "cost_per_1m_out_cached": 0, "context_window": 262144, - "default_max_tokens": 26214, + "default_max_tokens": 131072, "can_reason": false, "has_reasoning_efforts": false, "supports_attachments": false @@ -2103,12 +2103,12 @@ { "id": "qwen/qwen3-32b", "name": "Qwen: Qwen3 32B", - "cost_per_1m_in": 0.15, - "cost_per_1m_out": 0.5, + "cost_per_1m_in": 0.14, + "cost_per_1m_out": 0.5700000000000001, "cost_per_1m_in_cached": 0, "cost_per_1m_out_cached": 0, "context_window": 131072, - "default_max_tokens": 4000, + "default_max_tokens": 65536, "can_reason": true, "has_reasoning_efforts": true, "supports_attachments": false @@ -2147,7 +2147,7 @@ "cost_per_1m_in_cached": 0, "cost_per_1m_out_cached": 0, "context_window": 262144, - "default_max_tokens": 32768, + "default_max_tokens": 26214, "can_reason": false, "has_reasoning_efforts": false, "supports_attachments": false @@ -2207,12 +2207,12 @@ { "id": "qwen/qwen3-next-80b-a3b-instruct", "name": "Qwen: Qwen3 Next 80B A3B Instruct", - "cost_per_1m_in": 0.14, - "cost_per_1m_out": 1.1, + "cost_per_1m_in": 0.15, + "cost_per_1m_out": 1.2, "cost_per_1m_in_cached": 0, "cost_per_1m_out_cached": 0, "context_window": 262144, - "default_max_tokens": 26214, + "default_max_tokens": 131072, "can_reason": false, "has_reasoning_efforts": false, "supports_attachments": false @@ -2233,12 +2233,12 @@ { "id": "qwen/qwen3-vl-235b-a22b-instruct", "name": "Qwen: Qwen3 VL 235B A22B Instruct", - "cost_per_1m_in": 0.3, - "cost_per_1m_out": 1.2, + "cost_per_1m_in": 0.5, + "cost_per_1m_out": 2.5, "cost_per_1m_in_cached": 0, "cost_per_1m_out_cached": 0, "context_window": 131072, - "default_max_tokens": 13107, + "default_max_tokens": 65536, "can_reason": false, "has_reasoning_efforts": false, "supports_attachments": true @@ -2256,19 +2256,6 @@ "has_reasoning_efforts": true, "supports_attachments": true }, - { - "id": "qwen/qwen3-vl-30b-a3b-instruct", - "name": "Qwen: Qwen3 VL 30B A3B Instruct", - "cost_per_1m_in": 0.3, - "cost_per_1m_out": 1, - "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0, - "context_window": 262144, - "default_max_tokens": 131072, - "can_reason": false, - "has_reasoning_efforts": false, - "supports_attachments": true - }, { "id": "qwen/qwen3-vl-30b-a3b-thinking", "name": "Qwen: Qwen3 VL 30B A3B Thinking", @@ -2455,11 +2442,11 @@ "id": "z-ai/glm-4.6", "name": "Z.AI: GLM 4.6", "cost_per_1m_in": 0.6, - "cost_per_1m_out": 2.2, + "cost_per_1m_out": 2, "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0.11, + "cost_per_1m_out_cached": 0, "context_window": 204800, - "default_max_tokens": 65536, + "default_max_tokens": 20480, "can_reason": true, "has_reasoning_efforts": true, "supports_attachments": false @@ -2519,10 +2506,10 @@ { "id": "x-ai/grok-3-mini", "name": "xAI: Grok 3 Mini", - "cost_per_1m_in": 0.3, - "cost_per_1m_out": 0.5, + "cost_per_1m_in": 0.6, + "cost_per_1m_out": 4, "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0.075, + "cost_per_1m_out_cached": 0.15, "context_window": 131072, "default_max_tokens": 13107, "can_reason": true, @@ -2532,10 +2519,10 @@ { "id": "x-ai/grok-3-mini-beta", "name": "xAI: Grok 3 Mini Beta", - "cost_per_1m_in": 0.3, - "cost_per_1m_out": 0.5, + "cost_per_1m_in": 0.6, + "cost_per_1m_out": 4, "cost_per_1m_in_cached": 0, - "cost_per_1m_out_cached": 0.075, + "cost_per_1m_out_cached": 0.15, "context_window": 131072, "default_max_tokens": 13107, "can_reason": true,