groq.go

 1package models
 2
 3const (
 4	ProviderGROQ ModelProvider = "groq"
 5
 6	// GROQ
 7	QWENQwq ModelID = "qwen-qwq"
 8
 9	// GROQ preview models
10	Llama4Scout               ModelID = "meta-llama/llama-4-scout-17b-16e-instruct"
11	Llama4Maverick            ModelID = "meta-llama/llama-4-maverick-17b-128e-instruct"
12	Llama3_3_70BVersatile     ModelID = "llama-3.3-70b-versatile"
13	DeepseekR1DistillLlama70b ModelID = "deepseek-r1-distill-llama-70b"
14)
15
16var GroqModels = map[ModelID]Model{
17	//
18	// GROQ
19	QWENQwq: {
20		ID:                 QWENQwq,
21		Name:               "Qwen Qwq",
22		Provider:           ProviderGROQ,
23		APIModel:           "qwen-qwq-32b",
24		CostPer1MIn:        0.29,
25		CostPer1MInCached:  0.275,
26		CostPer1MOutCached: 0.0,
27		CostPer1MOut:       0.39,
28		ContextWindow:      128_000,
29		DefaultMaxTokens:   50000,
30		// for some reason, the groq api doesn't like the reasoningEffort parameter
31		CanReason: false,
32	},
33
34	Llama4Scout: {
35		ID:                 Llama4Scout,
36		Name:               "Llama4Scout",
37		Provider:           ProviderGROQ,
38		APIModel:           "meta-llama/llama-4-scout-17b-16e-instruct",
39		CostPer1MIn:        0.11,
40		CostPer1MInCached:  0,
41		CostPer1MOutCached: 0,
42		CostPer1MOut:       0.34,
43		ContextWindow:      128_000, // 10M when?
44	},
45
46	Llama4Maverick: {
47		ID:                 Llama4Maverick,
48		Name:               "Llama4Maverick",
49		Provider:           ProviderGROQ,
50		APIModel:           "meta-llama/llama-4-maverick-17b-128e-instruct",
51		CostPer1MIn:        0.20,
52		CostPer1MInCached:  0,
53		CostPer1MOutCached: 0,
54		CostPer1MOut:       0.20,
55		ContextWindow:      128_000,
56	},
57
58	Llama3_3_70BVersatile: {
59		ID:                 Llama3_3_70BVersatile,
60		Name:               "Llama3_3_70BVersatile",
61		Provider:           ProviderGROQ,
62		APIModel:           "llama-3.3-70b-versatile",
63		CostPer1MIn:        0.59,
64		CostPer1MInCached:  0,
65		CostPer1MOutCached: 0,
66		CostPer1MOut:       0.79,
67		ContextWindow:      128_000,
68	},
69
70	DeepseekR1DistillLlama70b: {
71		ID:                 DeepseekR1DistillLlama70b,
72		Name:               "DeepseekR1DistillLlama70b",
73		Provider:           ProviderGROQ,
74		APIModel:           "deepseek-r1-distill-llama-70b",
75		CostPer1MIn:        0.75,
76		CostPer1MInCached:  0,
77		CostPer1MOutCached: 0,
78		CostPer1MOut:       0.99,
79		ContextWindow:      128_000,
80		CanReason:          true,
81	},
82}