1{
2 "name": "Azure OpenAI",
3 "id": "azure",
4 "type": "azure",
5 "api_key": "$AZURE_OPENAI_API_KEY",
6 "api_endpoint": "$AZURE_OPENAI_API_ENDPOINT",
7 "default_large_model_id": "gpt-5",
8 "default_small_model_id": "gpt-5-mini",
9 "models": [
10 {
11 "id": "gpt-5",
12 "name": "GPT-5",
13 "cost_per_1m_in": 1.25,
14 "cost_per_1m_out": 10,
15 "cost_per_1m_in_cached": 0.25,
16 "cost_per_1m_out_cached": 0.25,
17 "context_window": 400000,
18 "default_max_tokens": 128000,
19 "can_reason": true,
20 "has_reasoning_efforts": false,
21 "default_reasoning_effort": "minimal",
22 "supports_attachments": true
23 },
24 {
25 "id": "gpt-5-mini",
26 "name": "GPT-5 Mini",
27 "cost_per_1m_in": 0.25,
28 "cost_per_1m_out": 2,
29 "cost_per_1m_in_cached": 0.025,
30 "cost_per_1m_out_cached": 0.025,
31 "context_window": 400000,
32 "default_max_tokens": 128000,
33 "can_reason": true,
34 "has_reasoning_efforts": false,
35 "default_reasoning_effort": "low",
36 "supports_attachments": true
37 },
38 {
39 "id": "gpt-5-nano",
40 "name": "GPT-5 Nano",
41 "cost_per_1m_in": 0.05,
42 "cost_per_1m_out": 0.4,
43 "cost_per_1m_in_cached": 0.005,
44 "cost_per_1m_out_cached": 0.005,
45 "context_window": 400000,
46 "default_max_tokens": 128000,
47 "can_reason": true,
48 "has_reasoning_efforts": false,
49 "default_reasoning_effort": "low",
50 "supports_attachments": true
51 },
52 {
53 "id": "codex-mini-latest",
54 "name": "Codex Mini",
55 "cost_per_1m_in": 1.5,
56 "cost_per_1m_out": 6,
57 "cost_per_1m_in_cached": 0,
58 "cost_per_1m_out_cached": 0.375,
59 "context_window": 200000,
60 "default_max_tokens": 50000,
61 "can_reason": true,
62 "has_reasoning_efforts": true,
63 "default_reasoning_effort": "medium",
64 "supports_attachments": true
65 },
66 {
67 "id": "o4-mini",
68 "name": "o4 Mini",
69 "cost_per_1m_in": 1.1,
70 "cost_per_1m_out": 4.4,
71 "cost_per_1m_in_cached": 0,
72 "cost_per_1m_out_cached": 0.275,
73 "context_window": 200000,
74 "default_max_tokens": 50000,
75 "can_reason": true,
76 "has_reasoning_efforts": true,
77 "default_reasoning_effort": "medium",
78 "supports_attachments": true
79 },
80 {
81 "id": "o3",
82 "name": "o3",
83 "cost_per_1m_in": 2,
84 "cost_per_1m_out": 8,
85 "cost_per_1m_in_cached": 0,
86 "cost_per_1m_out_cached": 0.5,
87 "context_window": 200000,
88 "default_max_tokens": 50000,
89 "can_reason": true,
90 "has_reasoning_efforts": true,
91 "default_reasoning_effort": "medium",
92 "supports_attachments": true
93 },
94 {
95 "id": "o3-pro",
96 "name": "o3 Pro",
97 "cost_per_1m_in": 20,
98 "cost_per_1m_out": 80,
99 "cost_per_1m_in_cached": 0,
100 "cost_per_1m_out_cached": 0,
101 "context_window": 200000,
102 "default_max_tokens": 50000,
103 "can_reason": true,
104 "has_reasoning_efforts": true,
105 "default_reasoning_effort": "medium",
106 "supports_attachments": true
107 },
108 {
109 "id": "gpt-4.1",
110 "name": "GPT-4.1",
111 "cost_per_1m_in": 2,
112 "cost_per_1m_out": 8,
113 "cost_per_1m_in_cached": 0,
114 "cost_per_1m_out_cached": 0.5,
115 "context_window": 1047576,
116 "default_max_tokens": 50000,
117 "can_reason": false,
118 "supports_attachments": true
119 },
120 {
121 "id": "gpt-4.1-mini",
122 "name": "GPT-4.1 Mini",
123 "cost_per_1m_in": 0.4,
124 "cost_per_1m_out": 1.6,
125 "cost_per_1m_in_cached": 0,
126 "cost_per_1m_out_cached": 0.1,
127 "context_window": 1047576,
128 "default_max_tokens": 50000,
129 "can_reason": false,
130 "supports_attachments": true
131 },
132 {
133 "id": "gpt-4.1-nano",
134 "name": "GPT-4.1 Nano",
135 "cost_per_1m_in": 0.1,
136 "cost_per_1m_out": 0.4,
137 "cost_per_1m_in_cached": 0,
138 "cost_per_1m_out_cached": 0.025,
139 "context_window": 1047576,
140 "default_max_tokens": 50000,
141 "can_reason": false,
142 "supports_attachments": true
143 },
144 {
145 "id": "gpt-4.5-preview",
146 "name": "GPT-4.5 (Preview)",
147 "cost_per_1m_in": 75,
148 "cost_per_1m_out": 150,
149 "cost_per_1m_in_cached": 0,
150 "cost_per_1m_out_cached": 37.5,
151 "context_window": 128000,
152 "default_max_tokens": 50000,
153 "can_reason": false,
154 "supports_attachments": true
155 },
156 {
157 "id": "o3-mini",
158 "name": "o3 Mini",
159 "cost_per_1m_in": 1.1,
160 "cost_per_1m_out": 4.4,
161 "cost_per_1m_in_cached": 0,
162 "cost_per_1m_out_cached": 0.55,
163 "context_window": 200000,
164 "default_max_tokens": 50000,
165 "can_reason": true,
166 "has_reasoning_efforts": true,
167 "default_reasoning_effort": "medium",
168 "supports_attachments": false
169 },
170 {
171 "id": "gpt-4o",
172 "name": "GPT-4o",
173 "cost_per_1m_in": 2.5,
174 "cost_per_1m_out": 10,
175 "cost_per_1m_in_cached": 0,
176 "cost_per_1m_out_cached": 1.25,
177 "context_window": 128000,
178 "default_max_tokens": 20000,
179 "can_reason": false,
180 "supports_attachments": true
181 },
182 {
183 "id": "gpt-4o-mini",
184 "name": "GPT-4o-mini",
185 "cost_per_1m_in": 0.15,
186 "cost_per_1m_out": 0.6,
187 "cost_per_1m_in_cached": 0,
188 "cost_per_1m_out_cached": 0.075,
189 "context_window": 128000,
190 "default_max_tokens": 20000,
191 "can_reason": false,
193 "supports_attachments": true
194 }
195 ]
196}