neuralwatt.json

  1{
  2  "name": "Neuralwatt",
  3  "id": "neuralwatt",
  4  "api_key": "$NEURALWATT_API_KEY",
  5  "api_endpoint": "https://api.neuralwatt.com/v1",
  6  "type": "openai-compat",
  7  "default_large_model_id": "zai-org/GLM-5.1-FP8",
  8  "default_small_model_id": "mistralai/Devstral-Small-2-24B-Instruct-2512",
  9  "models": [
 10    {
 11      "id": "mistralai/Devstral-Small-2-24B-Instruct-2512",
 12      "name": "Devstral Small 2 24B Instruct 2512",
 13      "cost_per_1m_in": 0.1,
 14      "cost_per_1m_out": 0.3,
 15      "cost_per_1m_in_cached": 0,
 16      "cost_per_1m_out_cached": 0,
 17      "context_window": 262144,
 18      "default_max_tokens": 26214,
 19      "can_reason": false,
 20      "supports_attachments": true
 21    },
 22    {
 23      "id": "zai-org/GLM-5.1-FP8",
 24      "name": "GLM 5.1 FP8",
 25      "cost_per_1m_in": 1.1,
 26      "cost_per_1m_out": 3.6,
 27      "cost_per_1m_in_cached": 0,
 28      "cost_per_1m_out_cached": 0,
 29      "context_window": 202752,
 30      "default_max_tokens": 20275,
 31      "can_reason": true,
 32      "reasoning_levels": [
 33        "low",
 34        "medium",
 35        "high"
 36      ],
 37      "default_reasoning_effort": "medium",
 38      "supports_attachments": false
 39    },
 40    {
 41      "id": "glm-5.1-fast",
 42      "name": "GLM 5.1 Fast",
 43      "cost_per_1m_in": 1.1,
 44      "cost_per_1m_out": 3.6,
 45      "cost_per_1m_in_cached": 0,
 46      "cost_per_1m_out_cached": 0,
 47      "context_window": 202752,
 48      "default_max_tokens": 20275,
 49      "can_reason": false,
 50      "supports_attachments": false
 51    },
 52    {
 53      "id": "moonshotai/Kimi-K2.5",
 54      "name": "Kimi K2.5",
 55      "cost_per_1m_in": 0.5,
 56      "cost_per_1m_out": 2.6,
 57      "cost_per_1m_in_cached": 0,
 58      "cost_per_1m_out_cached": 0,
 59      "context_window": 262144,
 60      "default_max_tokens": 26214,
 61      "can_reason": false,
 62      "supports_attachments": true
 63    },
 64    {
 65      "id": "kimi-k2.5-fast",
 66      "name": "Kimi K2.5 Fast",
 67      "cost_per_1m_in": 0.5,
 68      "cost_per_1m_out": 2.6,
 69      "cost_per_1m_in_cached": 0,
 70      "cost_per_1m_out_cached": 0,
 71      "context_window": 262144,
 72      "default_max_tokens": 26214,
 73      "can_reason": false,
 74      "supports_attachments": true
 75    },
 76    {
 77      "id": "MiniMaxAI/MiniMax-M2.5",
 78      "name": "MiniMax M2.5",
 79      "cost_per_1m_in": 0.3,
 80      "cost_per_1m_out": 1.4,
 81      "cost_per_1m_in_cached": 0,
 82      "cost_per_1m_out_cached": 0,
 83      "context_window": 196608,
 84      "default_max_tokens": 19660,
 85      "can_reason": true,
 86      "reasoning_levels": [
 87        "low",
 88        "medium",
 89        "high"
 90      ],
 91      "default_reasoning_effort": "medium",
 92      "supports_attachments": false
 93    },
 94    {
 95      "id": "Qwen/Qwen3.5-397B-A17B-FP8",
 96      "name": "Qwen3.5 397B A17B FP8",
 97      "cost_per_1m_in": 0.7,
 98      "cost_per_1m_out": 4.1,
 99      "cost_per_1m_in_cached": 0,
100      "cost_per_1m_out_cached": 0,
101      "context_window": 262144,
102      "default_max_tokens": 26214,
103      "can_reason": true,
104      "reasoning_levels": [
105        "low",
106        "medium",
107        "high"
108      ],
109      "default_reasoning_effort": "medium",
110      "supports_attachments": false
111    },
112    {
113      "id": "qwen3.5-397b-fast",
114      "name": "Qwen3.5 397B Fast",
115      "cost_per_1m_in": 0.7,
116      "cost_per_1m_out": 4.1,
117      "cost_per_1m_in_cached": 0,
118      "cost_per_1m_out_cached": 0,
119      "context_window": 262144,
120      "default_max_tokens": 26214,
121      "can_reason": false,
122      "supports_attachments": false
123    }
124  ]
125}