chutes.json

  1{
  2  "name": "Chutes",
  3  "id": "chutes",
  4  "api_key": "$CHUTES_API_KEY",
  5  "api_endpoint": "https://llm.chutes.ai/v1",
  6  "type": "openai-compat",
  7  "default_large_model_id": "zai-org/GLM-5-TEE",
  8  "default_small_model_id": "zai-org/GLM-5-Turbo",
  9  "models": [
 10    {
 11      "id": "deepseek-ai/DeepSeek-R1-0528-TEE",
 12      "name": "DeepSeek-R1-0528-TEE",
 13      "cost_per_1m_in": 0.45,
 14      "cost_per_1m_out": 2.15,
 15      "cost_per_1m_in_cached": 0.225,
 16      "cost_per_1m_out_cached": 0,
 17      "context_window": 163840,
 18      "default_max_tokens": 65536,
 19      "can_reason": true,
 20      "reasoning_levels": [
 21        "low",
 22        "medium",
 23        "high"
 24      ],
 25      "default_reasoning_effort": "medium",
 26      "supports_attachments": false
 27    },
 28    {
 29      "id": "tngtech/DeepSeek-TNG-R1T2-Chimera-TEE",
 30      "name": "DeepSeek-TNG-R1T2-Chimera-TEE",
 31      "cost_per_1m_in": 0.3,
 32      "cost_per_1m_out": 1.1,
 33      "cost_per_1m_in_cached": 0.15,
 34      "cost_per_1m_out_cached": 0,
 35      "context_window": 163840,
 36      "default_max_tokens": 163840,
 37      "can_reason": true,
 38      "reasoning_levels": [
 39        "low",
 40        "medium",
 41        "high"
 42      ],
 43      "default_reasoning_effort": "medium",
 44      "supports_attachments": false
 45    },
 46    {
 47      "id": "deepseek-ai/DeepSeek-V3-0324-TEE",
 48      "name": "DeepSeek-V3-0324-TEE",
 49      "cost_per_1m_in": 0.25,
 50      "cost_per_1m_out": 1,
 51      "cost_per_1m_in_cached": 0.125,
 52      "cost_per_1m_out_cached": 0,
 53      "context_window": 163840,
 54      "default_max_tokens": 65536,
 55      "can_reason": false,
 56      "supports_attachments": false
 57    },
 58    {
 59      "id": "deepseek-ai/DeepSeek-V3.1-TEE",
 60      "name": "DeepSeek-V3.1-TEE",
 61      "cost_per_1m_in": 0.27,
 62      "cost_per_1m_out": 1,
 63      "cost_per_1m_in_cached": 0.135,
 64      "cost_per_1m_out_cached": 0,
 65      "context_window": 163840,
 66      "default_max_tokens": 65536,
 67      "can_reason": true,
 68      "reasoning_levels": [
 69        "low",
 70        "medium",
 71        "high"
 72      ],
 73      "default_reasoning_effort": "medium",
 74      "supports_attachments": false
 75    },
 76    {
 77      "id": "deepseek-ai/DeepSeek-V3.2-TEE",
 78      "name": "DeepSeek-V3.2-TEE",
 79      "cost_per_1m_in": 0.28,
 80      "cost_per_1m_out": 0.42,
 81      "cost_per_1m_in_cached": 0.14,
 82      "cost_per_1m_out_cached": 0,
 83      "context_window": 131072,
 84      "default_max_tokens": 65536,
 85      "can_reason": true,
 86      "reasoning_levels": [
 87        "low",
 88        "medium",
 89        "high"
 90      ],
 91      "default_reasoning_effort": "medium",
 92      "supports_attachments": false
 93    },
 94    {
 95      "id": "zai-org/GLM-4.6V",
 96      "name": "GLM-4.6V",
 97      "cost_per_1m_in": 0.3,
 98      "cost_per_1m_out": 0.9,
 99      "cost_per_1m_in_cached": 0.15,
100      "cost_per_1m_out_cached": 0,
101      "context_window": 131072,
102      "default_max_tokens": 65536,
103      "can_reason": true,
104      "reasoning_levels": [
105        "low",
106        "medium",
107        "high"
108      ],
109      "default_reasoning_effort": "medium",
110      "supports_attachments": true
111    },
112    {
113      "id": "zai-org/GLM-4.7-TEE",
114      "name": "GLM-4.7-TEE",
115      "cost_per_1m_in": 0.39,
116      "cost_per_1m_out": 1.75,
117      "cost_per_1m_in_cached": 0.195,
118      "cost_per_1m_out_cached": 0,
119      "context_window": 202752,
120      "default_max_tokens": 65535,
121      "can_reason": true,
122      "reasoning_levels": [
123        "low",
124        "medium",
125        "high"
126      ],
127      "default_reasoning_effort": "medium",
128      "supports_attachments": false
129    },
130    {
131      "id": "zai-org/GLM-5-TEE",
132      "name": "GLM-5-TEE",
133      "cost_per_1m_in": 0.95,
134      "cost_per_1m_out": 2.55,
135      "cost_per_1m_in_cached": 0.475,
136      "cost_per_1m_out_cached": 0,
137      "context_window": 202752,
138      "default_max_tokens": 65535,
139      "can_reason": true,
140      "reasoning_levels": [
141        "low",
142        "medium",
143        "high"
144      ],
145      "default_reasoning_effort": "medium",
146      "supports_attachments": false
147    },
148    {
149      "id": "zai-org/GLM-5-Turbo",
150      "name": "GLM-5-Turbo",
151      "cost_per_1m_in": 0.4891,
152      "cost_per_1m_out": 1.9565,
153      "cost_per_1m_in_cached": 0.24455,
154      "cost_per_1m_out_cached": 0,
155      "context_window": 202752,
156      "default_max_tokens": 65535,
157      "can_reason": true,
158      "reasoning_levels": [
159        "low",
160        "medium",
161        "high"
162      ],
163      "default_reasoning_effort": "medium",
164      "supports_attachments": false
165    },
166    {
167      "id": "zai-org/GLM-5.1-TEE",
168      "name": "GLM-5.1-TEE",
169      "cost_per_1m_in": 1.05,
170      "cost_per_1m_out": 3.5,
171      "cost_per_1m_in_cached": 0.525,
172      "cost_per_1m_out_cached": 0,
173      "context_window": 202752,
174      "default_max_tokens": 65535,
175      "can_reason": true,
176      "reasoning_levels": [
177        "low",
178        "medium",
179        "high"
180      ],
181      "default_reasoning_effort": "medium",
182      "supports_attachments": false
183    },
184    {
185      "id": "NousResearch/Hermes-4-14B",
186      "name": "Hermes-4-14B",
187      "cost_per_1m_in": 0.0136,
188      "cost_per_1m_out": 0.0543,
189      "cost_per_1m_in_cached": 0.0068,
190      "cost_per_1m_out_cached": 0,
191      "context_window": 40960,
192      "default_max_tokens": 40960,
193      "can_reason": true,
194      "reasoning_levels": [
195        "low",
196        "medium",
197        "high"
198      ],
199      "default_reasoning_effort": "medium",
200      "supports_attachments": false
201    },
202    {
203      "id": "moonshotai/Kimi-K2.5-TEE",
204      "name": "Kimi-K2.5-TEE",
205      "cost_per_1m_in": 0.44,
206      "cost_per_1m_out": 2,
207      "cost_per_1m_in_cached": 0.22,
208      "cost_per_1m_out_cached": 0,
209      "context_window": 262144,
210      "default_max_tokens": 65535,
211      "can_reason": true,
212      "reasoning_levels": [
213        "low",
214        "medium",
215        "high"
216      ],
217      "default_reasoning_effort": "medium",
218      "supports_attachments": true
219    },
220    {
221      "id": "moonshotai/Kimi-K2.6-TEE",
222      "name": "Kimi-K2.6-TEE",
223      "cost_per_1m_in": 0.95,
224      "cost_per_1m_out": 4,
225      "cost_per_1m_in_cached": 0.475,
226      "cost_per_1m_out_cached": 0,
227      "context_window": 262144,
228      "default_max_tokens": 65535,
229      "can_reason": true,
230      "reasoning_levels": [
231        "low",
232        "medium",
233        "high"
234      ],
235      "default_reasoning_effort": "medium",
236      "supports_attachments": true
237    },
238    {
239      "id": "XiaomiMiMo/MiMo-V2-Flash-TEE",
240      "name": "MiMo-V2-Flash-TEE",
241      "cost_per_1m_in": 0.09,
242      "cost_per_1m_out": 0.29,
243      "cost_per_1m_in_cached": 0.045,
244      "cost_per_1m_out_cached": 0,
245      "context_window": 262144,
246      "default_max_tokens": 65536,
247      "can_reason": false,
248      "supports_attachments": false
249    },
250    {
251      "id": "MiniMaxAI/MiniMax-M2.5-TEE",
252      "name": "MiniMax-M2.5-TEE",
253      "cost_per_1m_in": 0.15,
254      "cost_per_1m_out": 1.2,
255      "cost_per_1m_in_cached": 0.075,
256      "cost_per_1m_out_cached": 0,
257      "context_window": 196608,
258      "default_max_tokens": 65536,
259      "can_reason": true,
260      "reasoning_levels": [
261        "low",
262        "medium",
263        "high"
264      ],
265      "default_reasoning_effort": "medium",
266      "supports_attachments": false
267    },
268    {
269      "id": "Qwen/Qwen3-235B-A22B-Thinking-2507",
270      "name": "Qwen3-235B-A22B-Thinking-2507",
271      "cost_per_1m_in": 0.11,
272      "cost_per_1m_out": 0.6,
273      "cost_per_1m_in_cached": 0.055,
274      "cost_per_1m_out_cached": 0,
275      "context_window": 262144,
276      "default_max_tokens": 262144,
277      "can_reason": true,
278      "reasoning_levels": [
279        "low",
280        "medium",
281        "high"
282      ],
283      "default_reasoning_effort": "medium",
284      "supports_attachments": false
285    },
286    {
287      "id": "Qwen/Qwen3-32B-TEE",
288      "name": "Qwen3-32B-TEE",
289      "cost_per_1m_in": 0.08,
290      "cost_per_1m_out": 0.24,
291      "cost_per_1m_in_cached": 0.04,
292      "cost_per_1m_out_cached": 0,
293      "context_window": 40960,
294      "default_max_tokens": 40960,
295      "can_reason": true,
296      "reasoning_levels": [
297        "low",
298        "medium",
299        "high"
300      ],
301      "default_reasoning_effort": "medium",
302      "supports_attachments": false
303    },
304    {
305      "id": "Qwen/Qwen3-Next-80B-A3B-Instruct",
306      "name": "Qwen3-Next-80B-A3B-Instruct",
307      "cost_per_1m_in": 0.1,
308      "cost_per_1m_out": 0.8,
309      "cost_per_1m_in_cached": 0.05,
310      "cost_per_1m_out_cached": 0,
311      "context_window": 262144,
312      "default_max_tokens": 262144,
313      "can_reason": false,
314      "supports_attachments": false
315    },
316    {
317      "id": "Qwen/Qwen3.5-397B-A17B-TEE",
318      "name": "Qwen3.5-397B-A17B-TEE",
319      "cost_per_1m_in": 0.39,
320      "cost_per_1m_out": 2.34,
321      "cost_per_1m_in_cached": 0.195,
322      "cost_per_1m_out_cached": 0,
323      "context_window": 262144,
324      "default_max_tokens": 65536,
325      "can_reason": true,
326      "reasoning_levels": [
327        "low",
328        "medium",
329        "high"
330      ],
331      "default_reasoning_effort": "medium",
332      "supports_attachments": true
333    },
334    {
335      "id": "Qwen/Qwen3.6-27B-TEE",
336      "name": "Qwen3.6-27B-TEE",
337      "cost_per_1m_in": 0.5,
338      "cost_per_1m_out": 2,
339      "cost_per_1m_in_cached": 0.25,
340      "cost_per_1m_out_cached": 0,
341      "context_window": 262144,
342      "default_max_tokens": 65536,
343      "can_reason": true,
344      "reasoning_levels": [
345        "low",
346        "medium",
347        "high"
348      ],
349      "default_reasoning_effort": "medium",
350      "supports_attachments": true
351    },
352    {
353      "id": "google/gemma-4-31B-turbo-TEE",
354      "name": "gemma-4-31B-turbo-TEE",
355      "cost_per_1m_in": 0.13,
356      "cost_per_1m_out": 0.38,
357      "cost_per_1m_in_cached": 0.065,
358      "cost_per_1m_out_cached": 0,
359      "context_window": 131072,
360      "default_max_tokens": 65536,
361      "can_reason": true,
362      "reasoning_levels": [
363        "low",
364        "medium",
365        "high"
366      ],
367      "default_reasoning_effort": "medium",
368      "supports_attachments": true
369    }
370  ]
371}