1package models
2
3const (
4 ProviderGROQ ModelProvider = "groq"
5
6 // GROQ
7 QWENQwq ModelID = "qwen-qwq"
8
9 // GROQ preview models
10 Llama4Scout ModelID = "meta-llama/llama-4-scout-17b-16e-instruct"
11 Llama4Maverick ModelID = "meta-llama/llama-4-maverick-17b-128e-instruct"
12 Llama3_3_70BVersatile ModelID = "llama-3.3-70b-versatile"
13 DeepseekR1DistillLlama70b ModelID = "deepseek-r1-distill-llama-70b"
14)
15
16var GroqModels = map[ModelID]Model{
17 //
18 // GROQ
19 QWENQwq: {
20 ID: QWENQwq,
21 Name: "Qwen Qwq",
22 Provider: ProviderGROQ,
23 APIModel: "qwen-qwq-32b",
24 CostPer1MIn: 0.29,
25 CostPer1MInCached: 0.275,
26 CostPer1MOutCached: 0.0,
27 CostPer1MOut: 0.39,
28 ContextWindow: 128_000,
29 DefaultMaxTokens: 50000,
30 // for some reason, the groq api doesn't like the reasoningEffort parameter
31 CanReason: false,
32 },
33
34 Llama4Scout: {
35 ID: Llama4Scout,
36 Name: "Llama4Scout",
37 Provider: ProviderGROQ,
38 APIModel: "meta-llama/llama-4-scout-17b-16e-instruct",
39 CostPer1MIn: 0.11,
40 CostPer1MInCached: 0,
41 CostPer1MOutCached: 0,
42 CostPer1MOut: 0.34,
43 ContextWindow: 128_000, // 10M when?
44 },
45
46 Llama4Maverick: {
47 ID: Llama4Maverick,
48 Name: "Llama4Maverick",
49 Provider: ProviderGROQ,
50 APIModel: "meta-llama/llama-4-maverick-17b-128e-instruct",
51 CostPer1MIn: 0.20,
52 CostPer1MInCached: 0,
53 CostPer1MOutCached: 0,
54 CostPer1MOut: 0.20,
55 ContextWindow: 128_000,
56 },
57
58 Llama3_3_70BVersatile: {
59 ID: Llama3_3_70BVersatile,
60 Name: "Llama3_3_70BVersatile",
61 Provider: ProviderGROQ,
62 APIModel: "llama-3.3-70b-versatile",
63 CostPer1MIn: 0.59,
64 CostPer1MInCached: 0,
65 CostPer1MOutCached: 0,
66 CostPer1MOut: 0.79,
67 ContextWindow: 128_000,
68 },
69
70 DeepseekR1DistillLlama70b: {
71 ID: DeepseekR1DistillLlama70b,
72 Name: "DeepseekR1DistillLlama70b",
73 Provider: ProviderGROQ,
74 APIModel: "deepseek-r1-distill-llama-70b",
75 CostPer1MIn: 0.75,
76 CostPer1MInCached: 0,
77 CostPer1MOutCached: 0,
78 CostPer1MOut: 0.99,
79 ContextWindow: 128_000,
80 CanReason: true,
81 },
82}