diff --git a/internal/agent/hyper/provider.json b/internal/agent/hyper/provider.json index 6d3a324282602b0e19552271ae63bb05d452eefa..b71e1ceec4784d8e75d9b0c3f5995aa0e30525f6 100644 --- a/internal/agent/hyper/provider.json +++ b/internal/agent/hyper/provider.json @@ -9,9 +9,9 @@ { "id": "deepseek-v4-flash", "name": "DeepSeek V4 Flash", - "cost_per_1m_in": 0.1416, - "cost_per_1m_out": 0.2832, - "cost_per_1m_in_cached": 0.0708, + "cost_per_1m_in": 0.1446, + "cost_per_1m_out": 0.2912, + "cost_per_1m_in_cached": 0.0723, "cost_per_1m_out_cached": 0, "context_window": 1048576, "default_max_tokens": 104857, @@ -21,9 +21,9 @@ { "id": "deepseek-v4-pro", "name": "DeepSeek V4 Pro", - "cost_per_1m_in": 1.7422, - "cost_per_1m_out": 3.6396, - "cost_per_1m_in_cached": 0.8711, + "cost_per_1m_in": 1.6082, + "cost_per_1m_out": 3.2164, + "cost_per_1m_in_cached": 0.8041, "cost_per_1m_out_cached": 0, "context_window": 1048576, "default_max_tokens": 60000, @@ -69,9 +69,9 @@ { "id": "gpt-oss-120b", "name": "gpt-oss-120b", - "cost_per_1m_in": 0.178, - "cost_per_1m_out": 0.68, - "cost_per_1m_in_cached": 0.089, + "cost_per_1m_in": 0.19, + "cost_per_1m_out": 0.63, + "cost_per_1m_in_cached": 0.095, "cost_per_1m_out_cached": 0, "context_window": 131072, "default_max_tokens": 13107, @@ -87,9 +87,9 @@ { "id": "kimi-k2.5", "name": "Kimi K2.5", - "cost_per_1m_in": 0.556, - "cost_per_1m_out": 2.88, - "cost_per_1m_in_cached": 0.278, + "cost_per_1m_in": 0.522, + "cost_per_1m_out": 2.69, + "cost_per_1m_in_cached": 0.261, "cost_per_1m_out_cached": 0, "context_window": 262144, "default_max_tokens": 26214, @@ -99,9 +99,9 @@ { "id": "kimi-k2.6", "name": "Kimi K2.6", - "cost_per_1m_in": 0.918, - "cost_per_1m_out": 4.151, - "cost_per_1m_in_cached": 0.459, + "cost_per_1m_in": 0.956, + "cost_per_1m_out": 4, + "cost_per_1m_in_cached": 0.478, "cost_per_1m_out_cached": 0, "context_window": 262142, "default_max_tokens": 26214, @@ -111,9 +111,9 @@ { "id": "llama-3.3-70b-instruct", "name": "Llama 3.3 70B Instruct", - "cost_per_1m_in": 0.638, - "cost_per_1m_out": 0.768, - "cost_per_1m_in_cached": 0.319, + "cost_per_1m_in": 0.45, + "cost_per_1m_out": 0.72, + "cost_per_1m_in_cached": 0.225, "cost_per_1m_out_cached": 0, "context_window": 128000, "default_max_tokens": 12800, @@ -124,7 +124,7 @@ "id": "llama-4-maverick-17b-128e-instruct-fp8", "name": "Llama 4 Maverick 17B 128E Instruct FP8", "cost_per_1m_in": 0.35, - "cost_per_1m_out": 1.0625, + "cost_per_1m_out": 1.08, "cost_per_1m_in_cached": 0.175, "cost_per_1m_out_cached": 0, "context_window": 430000, @@ -135,9 +135,9 @@ { "id": "minimax-m2.7", "name": "MiniMax M2.7", - "cost_per_1m_in": 0.42, - "cost_per_1m_out": 1.68, - "cost_per_1m_in_cached": 0.21, + "cost_per_1m_in": 0.38, + "cost_per_1m_out": 1.52, + "cost_per_1m_in_cached": 0.19, "cost_per_1m_out_cached": 0, "context_window": 204800, "default_max_tokens": 20480, @@ -161,8 +161,8 @@ "name": "Qwen3.6-Flash", "cost_per_1m_in": 1, "cost_per_1m_out": 4, - "cost_per_1m_in_cached": 0.1, - "cost_per_1m_out_cached": 1.25, + "cost_per_1m_in_cached": 1.25, + "cost_per_1m_out_cached": 0.1, "context_window": 1000000, "default_max_tokens": 64000, "can_reason": true, @@ -173,8 +173,8 @@ "name": "Qwen3.6-Max", "cost_per_1m_in": 2, "cost_per_1m_out": 12, - "cost_per_1m_in_cached": 0.2, - "cost_per_1m_out_cached": 2.5, + "cost_per_1m_in_cached": 2.5, + "cost_per_1m_out_cached": 0.2, "context_window": 256000, "default_max_tokens": 64000, "can_reason": true, @@ -185,19 +185,31 @@ "name": "Qwen3.6-Plus", "cost_per_1m_in": 2, "cost_per_1m_out": 6, - "cost_per_1m_in_cached": 0.2, - "cost_per_1m_out_cached": 2.5, + "cost_per_1m_in_cached": 2.5, + "cost_per_1m_out_cached": 0.2, "context_window": 1000000, "default_max_tokens": 64000, "can_reason": true, "supports_attachments": true }, + { + "id": "qwen3.7-max", + "name": "Qwen3.7-Max", + "cost_per_1m_in": 2.5, + "cost_per_1m_out": 7.5, + "cost_per_1m_in_cached": 3.125, + "cost_per_1m_out_cached": 0.25, + "context_window": 1000000, + "default_max_tokens": 64000, + "can_reason": true, + "supports_attachments": false + }, { "id": "qwen3-coder-480b-a35b-instruct-int4-mixed-ar", "name": "Qwen3 Coder 480B A35B Instruct INT4 Mixed AR", - "cost_per_1m_in": 0.871, - "cost_per_1m_out": 2.805, - "cost_per_1m_in_cached": 0.4355, + "cost_per_1m_in": 0.736, + "cost_per_1m_out": 2.03, + "cost_per_1m_in_cached": 0.368, "cost_per_1m_out_cached": 0, "context_window": 106000, "default_max_tokens": 10600, @@ -207,9 +219,9 @@ { "id": "qwen3-next-80b-a3b-instruct", "name": "Qwen3 Next 80B A3B Instruct", - "cost_per_1m_in": 0.128, - "cost_per_1m_out": 1.28, - "cost_per_1m_in_cached": 0.064, + "cost_per_1m_in": 0.1175, + "cost_per_1m_out": 1.136, + "cost_per_1m_in_cached": 0.05875, "cost_per_1m_out_cached": 0, "context_window": 262144, "default_max_tokens": 26214,