diff --git a/internal/agent/hyper/provider.json b/internal/agent/hyper/provider.json index 0d5e9d9a5e369057c800c993d936612d6cecab2d..eaff83c710da702b0de3982babe87cdf7a5f5cb7 100644 --- a/internal/agent/hyper/provider.json +++ b/internal/agent/hyper/provider.json @@ -14,14 +14,13 @@ "cost_per_1m_in_cached": 0.0028, "cost_per_1m_out_cached": 0, "context_window": 1000000, - "default_max_tokens": 8000, + "default_max_tokens": 384000, "can_reason": true, "reasoning_levels": [ - "low", - "medium", - "high" + "high", + "xhigh" ], - "default_reasoning_effort": "medium", + "default_reasoning_effort": "high", "supports_attachments": true }, { @@ -32,22 +31,21 @@ "cost_per_1m_in_cached": 0.0036, "cost_per_1m_out_cached": 0, "context_window": 1000000, - "default_max_tokens": 8000, + "default_max_tokens": 384000, "can_reason": true, "reasoning_levels": [ - "low", - "medium", - "high" + "high", + "xhigh" ], - "default_reasoning_effort": "medium", - "supports_attachments": true + "default_reasoning_effort": "high", + "supports_attachments": false }, { "id": "gemma-4-26b-a4b-it", "name": "Gemma 4 26B A4B", - "cost_per_1m_in": 0.116, - "cost_per_1m_out": 0.408, - "cost_per_1m_in_cached": 0.058, + "cost_per_1m_in": 0.102, + "cost_per_1m_out": 0.394, + "cost_per_1m_in_cached": 0.051, "cost_per_1m_out_cached": 0, "context_window": 256000, "default_max_tokens": 25600, @@ -57,9 +55,9 @@ { "id": "glm-5", "name": "GLM-5", - "cost_per_1m_in": 0.96, - "cost_per_1m_out": 3.036, - "cost_per_1m_in_cached": 0.48, + "cost_per_1m_in": 0.99, + "cost_per_1m_out": 3.07, + "cost_per_1m_in_cached": 0.495, "cost_per_1m_out_cached": 0, "context_window": 202752, "default_max_tokens": 20275, @@ -74,7 +72,7 @@ "cost_per_1m_in_cached": 0.26, "cost_per_1m_out_cached": 0, "context_window": 202800, - "default_max_tokens": 8000, + "default_max_tokens": 64000, "can_reason": true, "reasoning_levels": [ "low", @@ -87,9 +85,9 @@ { "id": "gpt-oss-120b", "name": "gpt-oss-120b", - "cost_per_1m_in": 0.18, - "cost_per_1m_out": 0.61, - "cost_per_1m_in_cached": 0.09, + "cost_per_1m_in": 0.178, + "cost_per_1m_out": 0.68, + "cost_per_1m_in_cached": 0.089, "cost_per_1m_out_cached": 0, "context_window": 131072, "default_max_tokens": 13107, @@ -105,9 +103,9 @@ { "id": "kimi-k2.5", "name": "Kimi K2.5", - "cost_per_1m_in": 0.522, - "cost_per_1m_out": 2.69, - "cost_per_1m_in_cached": 0.261, + "cost_per_1m_in": 0.518, + "cost_per_1m_out": 2.57, + "cost_per_1m_in_cached": 0.259, "cost_per_1m_out_cached": 0, "context_window": 262144, "default_max_tokens": 26214, @@ -122,7 +120,7 @@ "cost_per_1m_in_cached": 0.16, "cost_per_1m_out_cached": 0, "context_window": 262000, - "default_max_tokens": 8000, + "default_max_tokens": 262000, "can_reason": true, "reasoning_levels": [ "low", @@ -135,9 +133,9 @@ { "id": "llama-3.3-70b-instruct", "name": "Llama 3.3 70B Instruct", - "cost_per_1m_in": 0.523, - "cost_per_1m_out": 0.786, - "cost_per_1m_in_cached": 0.2615, + "cost_per_1m_in": 0.574, + "cost_per_1m_out": 0.668, + "cost_per_1m_in_cached": 0.287, "cost_per_1m_out_cached": 0, "context_window": 128000, "default_max_tokens": 12800, @@ -159,13 +157,19 @@ { "id": "minimax-m2.7", "name": "MiniMax M2.7", - "cost_per_1m_in": 0.44, - "cost_per_1m_out": 1.76, - "cost_per_1m_in_cached": 0.22, - "cost_per_1m_out_cached": 0, + "cost_per_1m_in": 0.3, + "cost_per_1m_out": 1.2, + "cost_per_1m_in_cached": 0.06, + "cost_per_1m_out_cached": 0.375, "context_window": 204800, - "default_max_tokens": 20480, - "can_reason": false, + "default_max_tokens": 131000, + "can_reason": true, + "reasoning_levels": [ + "low", + "medium", + "high" + ], + "default_reasoning_effort": "medium", "supports_attachments": false }, { @@ -219,9 +223,9 @@ { "id": "qwen3-coder-480b-a35b-instruct-int4-mixed-ar", "name": "Qwen3 Coder 480B A35B Instruct INT4 Mixed AR", - "cost_per_1m_in": 0.801, - "cost_per_1m_out": 2.185, - "cost_per_1m_in_cached": 0.4005, + "cost_per_1m_in": 0.531, + "cost_per_1m_out": 2.605, + "cost_per_1m_in_cached": 0.2655, "cost_per_1m_out_cached": 0, "context_window": 106000, "default_max_tokens": 10600, @@ -231,9 +235,9 @@ { "id": "qwen3-next-80b-a3b-instruct", "name": "Qwen3 Next 80B A3B Instruct", - "cost_per_1m_in": 0.1295, - "cost_per_1m_out": 1.216, - "cost_per_1m_in_cached": 0.06475, + "cost_per_1m_in": 0.128, + "cost_per_1m_out": 1.28, + "cost_per_1m_in_cached": 0.064, "cost_per_1m_out_cached": 0, "context_window": 262144, "default_max_tokens": 26214,