{
  "name": "Chutes",
  "id": "chutes",
  "type": "openai",
  "api_key": "$CHUTES_API_KEY",
  "api_endpoint": "https://llm.chutes.ai/v1",
  "default_large_model_id": "Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8",
  "default_small_model_id": "Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8",
  "models": [
    {
      "id": "Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8",
      "name": "Qwen3 Coder 480B A35B Instruct (FP8)",
      "cost_per_1m_in": 0.2,
      "cost_per_1m_out": 0.8,
      "context_window": 262000,
      "default_max_tokens": 32768,
      "can_reason": true,
      "has_reasoning_efforts": true,
      "default_reasoning_efforts": "medium",
      "supports_attachments": true
    },
    {
      "id": "zai-org/GLM-4.5-FP8",
      "name": "GLM 4.5 FP8",
      "cost_per_1m_in": 0.0,
      "cost_per_1m_out": 0.0,
      "context_window": 98000,
      "default_max_tokens": 32768,
      "can_reason": true,
      "has_reasoning_efforts": true,
      "default_reasoning_efforts": "medium",
      "supports_attachments": true
    },
    {
      "id": "moonshotai/Kimi-K2-Instruct-75k",
      "name": "Kimi K2 Instruct",
      "cost_per_1m_in": 0.15,
      "cost_per_1m_out": 0.59,
      "context_window": 75000,
      "default_max_tokens": 32768,
      "can_reason": true,
      "has_reasoning_efforts": true,
      "default_reasoning_efforts": "medium",
      "supports_attachments": true
    },
    {
      "id": "deepseek-ai/DeepSeek-R1-0528",
      "name": "DeepSeek R1 0528",
      "cost_per_1m_in": 0.18,
      "cost_per_1m_out": 0.72,
      "context_window": 75000,
      "default_max_tokens": 32768,
      "can_reason": true,
      "has_reasoning_efforts": true,
      "default_reasoning_efforts": "medium",
      "supports_attachments": true
    },
    {
      "id": "deepseek-ai/DeepSeek-R1-0528-Qwen3-8B",
      "name": "DeepSeek R1 0528 Qwen3 8B",
      "cost_per_1m_in": 0.02,
      "cost_per_1m_out": 0.07,
      "context_window": 32768,
      "default_max_tokens": 8192,
      "can_reason": false,
      "has_reasoning_efforts": false,
      "supports_attachments": true
    },
    {
      "id": "deepseek-ai/DeepSeek-R1-Distill-Llama-70B",
      "name": "DeepSeek R1 Distill Llama 70B",
      "cost_per_1m_in": 0.03,
      "cost_per_1m_out": 0.14,
      "context_window": 65536,
      "default_max_tokens": 8192,
      "can_reason": false,
      "has_reasoning_efforts": false,
      "supports_attachments": true
    },
    {
      "id": "tngtech/DeepSeek-R1T-Chimera",
      "name": "DeepSeek R1T Chimera",
      "cost_per_1m_in": 0.18,
      "cost_per_1m_out": 0.72,
      "context_window": 131072,
      "default_max_tokens": 32768,
      "can_reason": true,
      "has_reasoning_efforts": true,
      "default_reasoning_efforts": "medium",
      "supports_attachments": true
    },
    {
      "id": "tngtech/DeepSeek-TNG-R1T2-Chimera",
      "name": "DeepSeek TNG R1T2 Chimera",
      "cost_per_1m_in": 0.20,
      "cost_per_1m_out": 0.80,
      "context_window": 262144,
      "default_max_tokens": 65536,
      "can_reason": true,
      "has_reasoning_efforts": true,
      "default_reasoning_efforts": "high",
      "supports_attachments": true
    },
    {
      "id": "deepseek-ai/DeepSeek-V3-0324",
      "name": "DeepSeek V3 0324",
      "cost_per_1m_in": 0.18,
      "cost_per_1m_out": 0.72,
      "context_window": 75000,
      "default_max_tokens": 32768,
      "can_reason": true,
      "has_reasoning_efforts": true,
      "default_reasoning_efforts": "medium",
      "supports_attachments": true
    },
    {
      "id": "chutesai/Devstral-Small-2505",
      "name": "Devstral Small 2505",
      "cost_per_1m_in": 0.02,
      "cost_per_1m_out": 0.08,
      "context_window": 32768,
      "default_max_tokens": 8192,
      "can_reason": false,
      "has_reasoning_efforts": false,
      "supports_attachments": true
    },
    {
      "id": "zai-org/GLM-4.5-Air",
      "name": "GLM 4.5 Air",
      "cost_per_1m_in": 0.0,
      "cost_per_1m_out": 0.0,
      "context_window": 131072,
      "default_max_tokens": 32768,
      "can_reason": true,
      "has_reasoning_efforts": true,
      "default_reasoning_efforts": "medium",
      "supports_attachments": true
    },
    {
      "id": "openai/gpt-oss-120b",
      "name": "GPT OSS 120B",
      "cost_per_1m_in": 0.10,
      "cost_per_1m_out": 0.41,
      "context_window": 131072,
      "default_max_tokens": 32768,
      "can_reason": true,
      "has_reasoning_efforts": true,
      "default_reasoning_efforts": "medium",
      "supports_attachments": true
    },
    {
      "id": "chutesai/Mistral-Small-3.2-24B-Instruct-2506",
      "name": "Mistral Small 3.2 24B Instruct 2506",
      "cost_per_1m_in": 0.02,
      "cost_per_1m_out": 0.08,
      "context_window": 32768,
      "default_max_tokens": 8192,
      "can_reason": false,
      "has_reasoning_efforts": false,
      "supports_attachments": true
    },
    {
      "id": "Qwen/Qwen3-235B-A22B-Instruct-2507",
      "name": "Qwen3 235B A22B Instruct 2507",
      "cost_per_1m_in": 0.08,
      "cost_per_1m_out": 0.31,
      "context_window": 32768,
      "default_max_tokens": 8192,
      "can_reason": false,
      "has_reasoning_efforts": false,
      "supports_attachments": true
    },
    {
      "id": "Qwen/Qwen3-30B-A3B",
      "name": "Qwen3 30B A3B",
      "cost_per_1m_in": 0.02,
      "cost_per_1m_out": 0.08,
      "context_window": 32768,
      "default_max_tokens": 8192,
      "can_reason": false,
      "has_reasoning_efforts": false,
      "supports_attachments": true
    },
    {
      "id": "Qwen/Qwen3-235B-A22B-Thinking-2507",
      "name": "Qwen3 235B A22B Thinking 2507",
      "cost_per_1m_in": 0.08,
      "cost_per_1m_out": 0.31,
      "context_window": 32768,
      "default_max_tokens": 8192,
      "can_reason": true,
      "has_reasoning_efforts": true,
      "default_reasoning_efforts": "high",
      "supports_attachments": true
    },
    {
      "id": "deepseek-ai/DeepSeek-V3.1",
      "name": "DeepSeek V3.1",
      "cost_per_1m_in": 0.20,
      "cost_per_1m_out": 0.80,
      "context_window": 163840,
      "default_max_tokens": 32768,
      "can_reason": false,
      "has_reasoning_efforts": false,
      "supports_attachments": true
    },
    {
      "id": "deepseek-ai/DeepSeek-V3.1:THINKING",
      "name": "DeepSeek V3.1 Reasoning",
      "cost_per_1m_in": 0.20,
      "cost_per_1m_out": 0.80,
      "context_window": 163840,
      "default_max_tokens": 32768,
      "can_reason": true,
      "has_reasoning_efforts": true,
      "default_reasoning_efforts": "medium",
      "supports_attachments": true
    },
    {
      "id": "Qwen/Qwen3-30B-A3B-Instruct-2507",
      "name": "Qwen3 30B A3B Instruct 2507",
      "cost_per_1m_in": 0.05,
      "cost_per_1m_out": 0.20,
      "context_window": 262144,
      "default_max_tokens": 32768,
      "can_reason": false,
      "has_reasoning_efforts": false,
      "supports_attachments": true
    },
    {
      "id": "Qwen/Qwen3-Coder-30B-A3B-Instruct",
      "name": "Qwen3 Coder 30B A3B Instruct",
      "cost_per_1m_in": 0.00,
      "cost_per_1m_out": 0.00,
      "context_window": 262144,
      "default_max_tokens": 32768,
      "can_reason": false,
      "has_reasoning_efforts": false,
      "supports_attachments": true
    }
  ]
}