1{
2 "name": "Hugging Face",
3 "id": "huggingface",
4 "api_key": "$HF_TOKEN",
5 "api_endpoint": "https://router.huggingface.co/v1",
6 "type": "openai",
7 "default_large_model_id": "moonshotai/Kimi-K2-Instruct-0905:groq",
8 "default_small_model_id": "openai/gpt-oss-20b:groq",
9 "models": [
10 {
11 "id": "Qwen/Qwen3-235B-A22B:fireworks-ai",
12 "name": "Qwen/Qwen3-235B-A22B (fireworks-ai)",
13 "cost_per_1m_in": 0.22,
14 "cost_per_1m_out": 0.88,
15 "cost_per_1m_in_cached": 0,
16 "cost_per_1m_out_cached": 0,
17 "context_window": 131072,
18 "default_max_tokens": 8192,
19 "can_reason": false,
20 "has_reasoning_efforts": false,
21 "supports_attachments": false
22 },
23 {
24 "id": "Qwen/Qwen3-235B-A22B-Instruct-2507:fireworks-ai",
25 "name": "Qwen/Qwen3-235B-A22B-Instruct-2507 (fireworks-ai)",
26 "cost_per_1m_in": 0.22,
27 "cost_per_1m_out": 0.88,
28 "cost_per_1m_in_cached": 0,
29 "cost_per_1m_out_cached": 0,
30 "context_window": 262144,
31 "default_max_tokens": 8192,
32 "can_reason": false,
33 "has_reasoning_efforts": false,
34 "supports_attachments": false
35 },
36 {
37 "id": "Qwen/Qwen3-235B-A22B-Thinking-2507:fireworks-ai",
38 "name": "Qwen/Qwen3-235B-A22B-Thinking-2507 (fireworks-ai)",
39 "cost_per_1m_in": 0.22,
40 "cost_per_1m_out": 0.88,
41 "cost_per_1m_in_cached": 0,
42 "cost_per_1m_out_cached": 0,
43 "context_window": 262144,
44 "default_max_tokens": 8192,
45 "can_reason": false,
46 "has_reasoning_efforts": false,
47 "supports_attachments": false
48 },
49 {
50 "id": "Qwen/Qwen3-30B-A3B:fireworks-ai",
51 "name": "Qwen/Qwen3-30B-A3B (fireworks-ai)",
52 "cost_per_1m_in": 0.15,
53 "cost_per_1m_out": 0.6,
54 "cost_per_1m_in_cached": 0,
55 "cost_per_1m_out_cached": 0,
56 "context_window": 131072,
57 "default_max_tokens": 8192,
58 "can_reason": false,
59 "has_reasoning_efforts": false,
60 "supports_attachments": false
61 },
62 {
63 "id": "Qwen/Qwen3-Coder-480B-A35B-Instruct:cerebras",
64 "name": "Qwen/Qwen3-Coder-480B-A35B-Instruct (cerebras)",
65 "cost_per_1m_in": 2,
66 "cost_per_1m_out": 2,
67 "cost_per_1m_in_cached": 0,
68 "cost_per_1m_out_cached": 0,
69 "context_window": 262144,
70 "default_max_tokens": 8192,
71 "can_reason": false,
72 "has_reasoning_efforts": false,
73 "supports_attachments": false
74 },
75 {
76 "id": "Qwen/Qwen3-Coder-480B-A35B-Instruct:fireworks-ai",
77 "name": "Qwen/Qwen3-Coder-480B-A35B-Instruct (fireworks-ai)",
78 "cost_per_1m_in": 0.45,
79 "cost_per_1m_out": 1.8,
80 "cost_per_1m_in_cached": 0,
81 "cost_per_1m_out_cached": 0,
82 "context_window": 262144,
83 "default_max_tokens": 8192,
84 "can_reason": false,
85 "has_reasoning_efforts": false,
86 "supports_attachments": false
87 },
88 {
89 "id": "deepseek-ai/DeepSeek-V3-0324:fireworks-ai",
90 "name": "deepseek-ai/DeepSeek-V3-0324 (fireworks-ai)",
91 "cost_per_1m_in": 0.9,
92 "cost_per_1m_out": 0.9,
93 "cost_per_1m_in_cached": 0,
94 "cost_per_1m_out_cached": 0,
95 "context_window": 163840,
96 "default_max_tokens": 8192,
97 "can_reason": false,
98 "has_reasoning_efforts": false,
99 "supports_attachments": false
100 },
101 {
102 "id": "deepseek-ai/DeepSeek-V3.1:fireworks-ai",
103 "name": "deepseek-ai/DeepSeek-V3.1 (fireworks-ai)",
104 "cost_per_1m_in": 0,
105 "cost_per_1m_out": 0,
106 "cost_per_1m_in_cached": 0,
107 "cost_per_1m_out_cached": 0,
108 "context_window": 163840,
109 "default_max_tokens": 8192,
110 "can_reason": false,
111 "has_reasoning_efforts": false,
112 "supports_attachments": false
113 },
114 {
115 "id": "meta-llama/Llama-3.1-70B-Instruct:fireworks-ai",
116 "name": "meta-llama/Llama-3.1-70B-Instruct (fireworks-ai)",
117 "cost_per_1m_in": 0.9,
118 "cost_per_1m_out": 0.9,
119 "cost_per_1m_in_cached": 0,
120 "cost_per_1m_out_cached": 0,
121 "context_window": 131072,
122 "default_max_tokens": 8192,
123 "can_reason": false,
124 "has_reasoning_efforts": false,
125 "supports_attachments": false
126 },
127 {
128 "id": "meta-llama/Llama-3.3-70B-Instruct:cerebras",
129 "name": "meta-llama/Llama-3.3-70B-Instruct (cerebras)",
130 "cost_per_1m_in": 0.85,
131 "cost_per_1m_out": 1.2,
132 "cost_per_1m_in_cached": 0,
133 "cost_per_1m_out_cached": 0,
134 "context_window": 131072,
135 "default_max_tokens": 8192,
136 "can_reason": false,
137 "has_reasoning_efforts": false,
138 "supports_attachments": false
139 },
140 {
141 "id": "meta-llama/Llama-3.3-70B-Instruct:groq",
142 "name": "meta-llama/Llama-3.3-70B-Instruct (groq)",
143 "cost_per_1m_in": 0.59,
144 "cost_per_1m_out": 0.79,
145 "cost_per_1m_in_cached": 0,
146 "cost_per_1m_out_cached": 0,
147 "context_window": 131072,
148 "default_max_tokens": 8192,
149 "can_reason": false,
150 "has_reasoning_efforts": false,
151 "supports_attachments": false
152 },
153 {
154 "id": "meta-llama/Llama-4-Maverick-17B-128E-Instruct:fireworks-ai",
155 "name": "meta-llama/Llama-4-Maverick-17B-128E-Instruct (fireworks-ai)",
156 "cost_per_1m_in": 0.22,
157 "cost_per_1m_out": 0.88,
158 "cost_per_1m_in_cached": 0,
159 "cost_per_1m_out_cached": 0,
160 "context_window": 1048576,
161 "default_max_tokens": 8192,
162 "can_reason": false,
163 "has_reasoning_efforts": false,
164 "supports_attachments": false
165 },
166 {
167 "id": "meta-llama/Llama-4-Maverick-17B-128E-Instruct:groq",
168 "name": "meta-llama/Llama-4-Maverick-17B-128E-Instruct (groq)",
169 "cost_per_1m_in": 0.2,
170 "cost_per_1m_out": 0.6,
171 "cost_per_1m_in_cached": 0,
172 "cost_per_1m_out_cached": 0,
173 "context_window": 131072,
174 "default_max_tokens": 8192,
175 "can_reason": false,
176 "has_reasoning_efforts": false,
177 "supports_attachments": false
178 },
179 {
180 "id": "meta-llama/Llama-4-Scout-17B-16E-Instruct:groq",
181 "name": "meta-llama/Llama-4-Scout-17B-16E-Instruct (groq)",
182 "cost_per_1m_in": 0.11,
183 "cost_per_1m_out": 0.34,
184 "cost_per_1m_in_cached": 0,
185 "cost_per_1m_out_cached": 0,
186 "context_window": 131072,
187 "default_max_tokens": 8192,
188 "can_reason": false,
189 "has_reasoning_efforts": false,
190 "supports_attachments": false
191 },
192 {
193 "id": "moonshotai/Kimi-K2-Instruct:fireworks-ai",
194 "name": "moonshotai/Kimi-K2-Instruct (fireworks-ai)",
195 "cost_per_1m_in": 0.6,
196 "cost_per_1m_out": 2.5,
197 "cost_per_1m_in_cached": 0,
198 "cost_per_1m_out_cached": 0,
199 "context_window": 131072,
200 "default_max_tokens": 8192,
201 "can_reason": false,
202 "has_reasoning_efforts": false,
203 "supports_attachments": false
204 },
205 {
206 "id": "moonshotai/Kimi-K2-Instruct-0905:groq",
207 "name": "moonshotai/Kimi-K2-Instruct-0905 (groq)",
208 "cost_per_1m_in": 0,
209 "cost_per_1m_out": 0,
210 "cost_per_1m_in_cached": 0,
211 "cost_per_1m_out_cached": 0,
212 "context_window": 262144,
213 "default_max_tokens": 8192,
214 "can_reason": false,
215 "has_reasoning_efforts": false,
216 "supports_attachments": false
217 },
218 {
219 "id": "openai/gpt-oss-120b:cerebras",
220 "name": "openai/gpt-oss-120b (cerebras)",
221 "cost_per_1m_in": 0.25,
222 "cost_per_1m_out": 0.69,
223 "cost_per_1m_in_cached": 0,
224 "cost_per_1m_out_cached": 0,
225 "context_window": 131072,
226 "default_max_tokens": 8192,
227 "can_reason": false,
228 "has_reasoning_efforts": false,
229 "supports_attachments": false
230 },
231 {
232 "id": "openai/gpt-oss-120b:fireworks-ai",
233 "name": "openai/gpt-oss-120b (fireworks-ai)",
234 "cost_per_1m_in": 0.15,
235 "cost_per_1m_out": 0.6,
236 "cost_per_1m_in_cached": 0,
237 "cost_per_1m_out_cached": 0,
238 "context_window": 131072,
239 "default_max_tokens": 8192,
240 "can_reason": false,
241 "has_reasoning_efforts": false,
242 "supports_attachments": false
243 },
244 {
245 "id": "openai/gpt-oss-120b:groq",
246 "name": "openai/gpt-oss-120b (groq)",
247 "cost_per_1m_in": 0.15,
248 "cost_per_1m_out": 0.75,
249 "cost_per_1m_in_cached": 0,
250 "cost_per_1m_out_cached": 0,
251 "context_window": 131072,
252 "default_max_tokens": 8192,
253 "can_reason": false,
254 "has_reasoning_efforts": false,
255 "supports_attachments": false
256 },
257 {
258 "id": "openai/gpt-oss-20b:fireworks-ai",
259 "name": "openai/gpt-oss-20b (fireworks-ai)",
260 "cost_per_1m_in": 0.05,
261 "cost_per_1m_out": 0.2,
262 "cost_per_1m_in_cached": 0,
263 "cost_per_1m_out_cached": 0,
264 "context_window": 131072,
265 "default_max_tokens": 8192,
266 "can_reason": false,
267 "has_reasoning_efforts": false,
268 "supports_attachments": false
269 },
270 {
271 "id": "openai/gpt-oss-20b:groq",
272 "name": "openai/gpt-oss-20b (groq)",
273 "cost_per_1m_in": 0.1,
274 "cost_per_1m_out": 0.5,
275 "cost_per_1m_in_cached": 0,
276 "cost_per_1m_out_cached": 0,
277 "context_window": 131072,
278 "default_max_tokens": 8192,
279 "can_reason": false,
280 "has_reasoning_efforts": false,
281 "supports_attachments": false
282 },
283 {
284 "id": "zai-org/GLM-4.5:fireworks-ai",
285 "name": "zai-org/GLM-4.5 (fireworks-ai)",
286 "cost_per_1m_in": 0.55,
287 "cost_per_1m_out": 2.19,
288 "cost_per_1m_in_cached": 0,
289 "cost_per_1m_out_cached": 0,
290 "context_window": 131072,
291 "default_max_tokens": 8192,
292 "can_reason": false,
293 "has_reasoning_efforts": false,
294 "supports_attachments": false
295 },
296 {
297 "id": "zai-org/GLM-4.5-Air:fireworks-ai",
298 "name": "zai-org/GLM-4.5-Air (fireworks-ai)",
299 "cost_per_1m_in": 0.22,
300 "cost_per_1m_out": 0.88,
301 "cost_per_1m_in_cached": 0,
302 "cost_per_1m_out_cached": 0,
303 "context_window": 131072,
304 "default_max_tokens": 8192,
305 "can_reason": false,
306 "has_reasoning_efforts": false,
307 "supports_attachments": false
308 }
309 ],
310 "default_headers": {
311 "HTTP-Referer": "https://charm.land",
312 "X-Title": "Crush"
313 }
314}