huggingface.json

  1{
  2  "name": "Hugging Face",
  3  "id": "huggingface",
  4  "api_key": "$HF_TOKEN",
  5  "api_endpoint": "https://router.huggingface.co/v1",
  6  "type": "openai-compat",
  7  "default_large_model_id": "moonshotai/Kimi-K2-Instruct-0905:groq",
  8  "default_small_model_id": "openai/gpt-oss-20b:groq",
  9  "models": [
 10    {
 11      "id": "Qwen/Qwen3-235B-A22B:fireworks-ai",
 12      "name": "Qwen/Qwen3-235B-A22B (fireworks-ai)",
 13      "cost_per_1m_in": 0.22,
 14      "cost_per_1m_out": 0.88,
 15      "cost_per_1m_in_cached": 0,
 16      "cost_per_1m_out_cached": 0,
 17      "context_window": 131072,
 18      "default_max_tokens": 8192,
 19      "can_reason": false,
 20      "has_reasoning_efforts": false,
 21      "supports_attachments": false
 22    },
 23    {
 24      "id": "Qwen/Qwen3-235B-A22B-Instruct-2507:fireworks-ai",
 25      "name": "Qwen/Qwen3-235B-A22B-Instruct-2507 (fireworks-ai)",
 26      "cost_per_1m_in": 0.22,
 27      "cost_per_1m_out": 0.88,
 28      "cost_per_1m_in_cached": 0,
 29      "cost_per_1m_out_cached": 0,
 30      "context_window": 262144,
 31      "default_max_tokens": 8192,
 32      "can_reason": false,
 33      "has_reasoning_efforts": false,
 34      "supports_attachments": false
 35    },
 36    {
 37      "id": "Qwen/Qwen3-235B-A22B-Thinking-2507:fireworks-ai",
 38      "name": "Qwen/Qwen3-235B-A22B-Thinking-2507 (fireworks-ai)",
 39      "cost_per_1m_in": 0.22,
 40      "cost_per_1m_out": 0.88,
 41      "cost_per_1m_in_cached": 0,
 42      "cost_per_1m_out_cached": 0,
 43      "context_window": 262144,
 44      "default_max_tokens": 8192,
 45      "can_reason": false,
 46      "has_reasoning_efforts": false,
 47      "supports_attachments": false
 48    },
 49    {
 50      "id": "Qwen/Qwen3-30B-A3B:fireworks-ai",
 51      "name": "Qwen/Qwen3-30B-A3B (fireworks-ai)",
 52      "cost_per_1m_in": 0.15,
 53      "cost_per_1m_out": 0.6,
 54      "cost_per_1m_in_cached": 0,
 55      "cost_per_1m_out_cached": 0,
 56      "context_window": 131072,
 57      "default_max_tokens": 8192,
 58      "can_reason": false,
 59      "has_reasoning_efforts": false,
 60      "supports_attachments": false
 61    },
 62    {
 63      "id": "Qwen/Qwen3-Coder-480B-A35B-Instruct:cerebras",
 64      "name": "Qwen/Qwen3-Coder-480B-A35B-Instruct (cerebras)",
 65      "cost_per_1m_in": 2,
 66      "cost_per_1m_out": 2,
 67      "cost_per_1m_in_cached": 0,
 68      "cost_per_1m_out_cached": 0,
 69      "context_window": 262144,
 70      "default_max_tokens": 8192,
 71      "can_reason": false,
 72      "has_reasoning_efforts": false,
 73      "supports_attachments": false
 74    },
 75    {
 76      "id": "Qwen/Qwen3-Coder-480B-A35B-Instruct:fireworks-ai",
 77      "name": "Qwen/Qwen3-Coder-480B-A35B-Instruct (fireworks-ai)",
 78      "cost_per_1m_in": 0.45,
 79      "cost_per_1m_out": 1.8,
 80      "cost_per_1m_in_cached": 0,
 81      "cost_per_1m_out_cached": 0,
 82      "context_window": 262144,
 83      "default_max_tokens": 8192,
 84      "can_reason": false,
 85      "has_reasoning_efforts": false,
 86      "supports_attachments": false
 87    },
 88    {
 89      "id": "deepseek-ai/DeepSeek-V3-0324:fireworks-ai",
 90      "name": "deepseek-ai/DeepSeek-V3-0324 (fireworks-ai)",
 91      "cost_per_1m_in": 0.9,
 92      "cost_per_1m_out": 0.9,
 93      "cost_per_1m_in_cached": 0,
 94      "cost_per_1m_out_cached": 0,
 95      "context_window": 163840,
 96      "default_max_tokens": 8192,
 97      "can_reason": false,
 98      "has_reasoning_efforts": false,
 99      "supports_attachments": false
100    },
101    {
102      "id": "deepseek-ai/DeepSeek-V3.1:fireworks-ai",
103      "name": "deepseek-ai/DeepSeek-V3.1 (fireworks-ai)",
104      "cost_per_1m_in": 0,
105      "cost_per_1m_out": 0,
106      "cost_per_1m_in_cached": 0,
107      "cost_per_1m_out_cached": 0,
108      "context_window": 163840,
109      "default_max_tokens": 8192,
110      "can_reason": false,
111      "has_reasoning_efforts": false,
112      "supports_attachments": false
113    },
114    {
115      "id": "meta-llama/Llama-3.1-70B-Instruct:fireworks-ai",
116      "name": "meta-llama/Llama-3.1-70B-Instruct (fireworks-ai)",
117      "cost_per_1m_in": 0.9,
118      "cost_per_1m_out": 0.9,
119      "cost_per_1m_in_cached": 0,
120      "cost_per_1m_out_cached": 0,
121      "context_window": 131072,
122      "default_max_tokens": 8192,
123      "can_reason": false,
124      "has_reasoning_efforts": false,
125      "supports_attachments": false
126    },
127    {
128      "id": "meta-llama/Llama-3.3-70B-Instruct:cerebras",
129      "name": "meta-llama/Llama-3.3-70B-Instruct (cerebras)",
130      "cost_per_1m_in": 0.85,
131      "cost_per_1m_out": 1.2,
132      "cost_per_1m_in_cached": 0,
133      "cost_per_1m_out_cached": 0,
134      "context_window": 131072,
135      "default_max_tokens": 8192,
136      "can_reason": false,
137      "has_reasoning_efforts": false,
138      "supports_attachments": false
139    },
140    {
141      "id": "meta-llama/Llama-3.3-70B-Instruct:groq",
142      "name": "meta-llama/Llama-3.3-70B-Instruct (groq)",
143      "cost_per_1m_in": 0.59,
144      "cost_per_1m_out": 0.79,
145      "cost_per_1m_in_cached": 0,
146      "cost_per_1m_out_cached": 0,
147      "context_window": 131072,
148      "default_max_tokens": 8192,
149      "can_reason": false,
150      "has_reasoning_efforts": false,
151      "supports_attachments": false
152    },
153    {
154      "id": "meta-llama/Llama-4-Maverick-17B-128E-Instruct:fireworks-ai",
155      "name": "meta-llama/Llama-4-Maverick-17B-128E-Instruct (fireworks-ai)",
156      "cost_per_1m_in": 0.22,
157      "cost_per_1m_out": 0.88,
158      "cost_per_1m_in_cached": 0,
159      "cost_per_1m_out_cached": 0,
160      "context_window": 1048576,
161      "default_max_tokens": 8192,
162      "can_reason": false,
163      "has_reasoning_efforts": false,
164      "supports_attachments": false
165    },
166    {
167      "id": "meta-llama/Llama-4-Maverick-17B-128E-Instruct:groq",
168      "name": "meta-llama/Llama-4-Maverick-17B-128E-Instruct (groq)",
169      "cost_per_1m_in": 0.2,
170      "cost_per_1m_out": 0.6,
171      "cost_per_1m_in_cached": 0,
172      "cost_per_1m_out_cached": 0,
173      "context_window": 131072,
174      "default_max_tokens": 8192,
175      "can_reason": false,
176      "has_reasoning_efforts": false,
177      "supports_attachments": false
178    },
179    {
180      "id": "meta-llama/Llama-4-Scout-17B-16E-Instruct:groq",
181      "name": "meta-llama/Llama-4-Scout-17B-16E-Instruct (groq)",
182      "cost_per_1m_in": 0.11,
183      "cost_per_1m_out": 0.34,
184      "cost_per_1m_in_cached": 0,
185      "cost_per_1m_out_cached": 0,
186      "context_window": 131072,
187      "default_max_tokens": 8192,
188      "can_reason": false,
189      "has_reasoning_efforts": false,
190      "supports_attachments": false
191    },
192    {
193      "id": "moonshotai/Kimi-K2-Instruct:fireworks-ai",
194      "name": "moonshotai/Kimi-K2-Instruct (fireworks-ai)",
195      "cost_per_1m_in": 0.6,
196      "cost_per_1m_out": 2.5,
197      "cost_per_1m_in_cached": 0,
198      "cost_per_1m_out_cached": 0,
199      "context_window": 131072,
200      "default_max_tokens": 8192,
201      "can_reason": false,
202      "has_reasoning_efforts": false,
203      "supports_attachments": false
204    },
205    {
206      "id": "moonshotai/Kimi-K2-Instruct-0905:groq",
207      "name": "moonshotai/Kimi-K2-Instruct-0905 (groq)",
208      "cost_per_1m_in": 0,
209      "cost_per_1m_out": 0,
210      "cost_per_1m_in_cached": 0,
211      "cost_per_1m_out_cached": 0,
212      "context_window": 262144,
213      "default_max_tokens": 8192,
214      "can_reason": false,
215      "has_reasoning_efforts": false,
216      "supports_attachments": false
217    },
218    {
219      "id": "openai/gpt-oss-120b:cerebras",
220      "name": "openai/gpt-oss-120b (cerebras)",
221      "cost_per_1m_in": 0.25,
222      "cost_per_1m_out": 0.69,
223      "cost_per_1m_in_cached": 0,
224      "cost_per_1m_out_cached": 0,
225      "context_window": 131072,
226      "default_max_tokens": 8192,
227      "can_reason": false,
228      "has_reasoning_efforts": false,
229      "supports_attachments": false
230    },
231    {
232      "id": "openai/gpt-oss-120b:fireworks-ai",
233      "name": "openai/gpt-oss-120b (fireworks-ai)",
234      "cost_per_1m_in": 0.15,
235      "cost_per_1m_out": 0.6,
236      "cost_per_1m_in_cached": 0,
237      "cost_per_1m_out_cached": 0,
238      "context_window": 131072,
239      "default_max_tokens": 8192,
240      "can_reason": false,
241      "has_reasoning_efforts": false,
242      "supports_attachments": false
243    },
244    {
245      "id": "openai/gpt-oss-120b:groq",
246      "name": "openai/gpt-oss-120b (groq)",
247      "cost_per_1m_in": 0.15,
248      "cost_per_1m_out": 0.75,
249      "cost_per_1m_in_cached": 0,
250      "cost_per_1m_out_cached": 0,
251      "context_window": 131072,
252      "default_max_tokens": 8192,
253      "can_reason": false,
254      "has_reasoning_efforts": false,
255      "supports_attachments": false
256    },
257    {
258      "id": "openai/gpt-oss-20b:fireworks-ai",
259      "name": "openai/gpt-oss-20b (fireworks-ai)",
260      "cost_per_1m_in": 0.05,
261      "cost_per_1m_out": 0.2,
262      "cost_per_1m_in_cached": 0,
263      "cost_per_1m_out_cached": 0,
264      "context_window": 131072,
265      "default_max_tokens": 8192,
266      "can_reason": false,
267      "has_reasoning_efforts": false,
268      "supports_attachments": false
269    },
270    {
271      "id": "openai/gpt-oss-20b:groq",
272      "name": "openai/gpt-oss-20b (groq)",
273      "cost_per_1m_in": 0.1,
274      "cost_per_1m_out": 0.5,
275      "cost_per_1m_in_cached": 0,
276      "cost_per_1m_out_cached": 0,
277      "context_window": 131072,
278      "default_max_tokens": 8192,
279      "can_reason": false,
280      "has_reasoning_efforts": false,
281      "supports_attachments": false
282    },
283    {
284      "id": "zai-org/GLM-4.5:fireworks-ai",
285      "name": "zai-org/GLM-4.5 (fireworks-ai)",
286      "cost_per_1m_in": 0.55,
287      "cost_per_1m_out": 2.19,
288      "cost_per_1m_in_cached": 0,
289      "cost_per_1m_out_cached": 0,
290      "context_window": 131072,
291      "default_max_tokens": 8192,
292      "can_reason": false,
293      "has_reasoning_efforts": false,
294      "supports_attachments": false
295    },
296    {
297      "id": "zai-org/GLM-4.5-Air:fireworks-ai",
298      "name": "zai-org/GLM-4.5-Air (fireworks-ai)",
299      "cost_per_1m_in": 0.22,
300      "cost_per_1m_out": 0.88,
301      "cost_per_1m_in_cached": 0,
302      "cost_per_1m_out_cached": 0,
303      "context_window": 131072,
304      "default_max_tokens": 8192,
305      "can_reason": false,
306      "has_reasoning_efforts": false,
307      "supports_attachments": false
308    }
309  ],
310  "default_headers": {
311    "HTTP-Referer": "https://charm.land",
312    "X-Title": "Crush"
313  }
314}