1use anyhow::{Result, anyhow};
2use collections::BTreeMap;
3use futures::{FutureExt, StreamExt, future, future::BoxFuture};
4use gpui::{AnyView, App, AsyncApp, Context, Entity, SharedString, Task, Window};
5use http_client::HttpClient;
6use language_model::{
7 AuthenticateError, LanguageModel, LanguageModelCompletionError, LanguageModelCompletionEvent,
8 LanguageModelId, LanguageModelName, LanguageModelProvider, LanguageModelProviderId,
9 LanguageModelProviderName, LanguageModelProviderState, LanguageModelRequest,
10 LanguageModelToolChoice, RateLimiter, Role,
11};
12use open_ai::ResponseStreamEvent;
13pub use settings::VercelAvailableModel as AvailableModel;
14use settings::{Settings, SettingsStore};
15use std::sync::{Arc, LazyLock};
16use strum::IntoEnumIterator;
17use ui::{List, prelude::*};
18use ui_input::InputField;
19use util::ResultExt;
20use vercel::{Model, VERCEL_API_URL};
21use zed_env_vars::{EnvVar, env_var};
22
23use crate::{
24 api_key::ApiKeyState,
25 ui::{ConfiguredApiCard, InstructionListItem},
26};
27
28const PROVIDER_ID: LanguageModelProviderId = LanguageModelProviderId::new("vercel");
29const PROVIDER_NAME: LanguageModelProviderName = LanguageModelProviderName::new("Vercel");
30
31const API_KEY_ENV_VAR_NAME: &str = "VERCEL_API_KEY";
32static API_KEY_ENV_VAR: LazyLock<EnvVar> = env_var!(API_KEY_ENV_VAR_NAME);
33
34#[derive(Clone, Debug, PartialEq)]
35pub struct VercelSettings {
36 pub api_url: String,
37 pub available_models: Vec<AvailableModel>,
38}
39
40pub struct VercelLanguageModelProvider {
41 http_client: Arc<dyn HttpClient>,
42 state: Entity<State>,
43}
44
45pub struct State {
46 api_key_state: ApiKeyState,
47}
48
49impl State {
50 fn is_authenticated(&self) -> bool {
51 self.api_key_state.has_key()
52 }
53
54 fn set_api_key(&mut self, api_key: Option<String>, cx: &mut Context<Self>) -> Task<Result<()>> {
55 let api_url = VercelLanguageModelProvider::api_url(cx);
56 self.api_key_state
57 .store(api_url, api_key, |this| &mut this.api_key_state, cx)
58 }
59
60 fn authenticate(&mut self, cx: &mut Context<Self>) -> Task<Result<(), AuthenticateError>> {
61 let api_url = VercelLanguageModelProvider::api_url(cx);
62 self.api_key_state.load_if_needed(
63 api_url,
64 &API_KEY_ENV_VAR,
65 |this| &mut this.api_key_state,
66 cx,
67 )
68 }
69}
70
71impl VercelLanguageModelProvider {
72 pub fn new(http_client: Arc<dyn HttpClient>, cx: &mut App) -> Self {
73 let state = cx.new(|cx| {
74 cx.observe_global::<SettingsStore>(|this: &mut State, cx| {
75 let api_url = Self::api_url(cx);
76 this.api_key_state.handle_url_change(
77 api_url,
78 &API_KEY_ENV_VAR,
79 |this| &mut this.api_key_state,
80 cx,
81 );
82 cx.notify();
83 })
84 .detach();
85 State {
86 api_key_state: ApiKeyState::new(Self::api_url(cx)),
87 }
88 });
89
90 Self { http_client, state }
91 }
92
93 fn create_language_model(&self, model: vercel::Model) -> Arc<dyn LanguageModel> {
94 Arc::new(VercelLanguageModel {
95 id: LanguageModelId::from(model.id().to_string()),
96 model,
97 state: self.state.clone(),
98 http_client: self.http_client.clone(),
99 request_limiter: RateLimiter::new(4),
100 })
101 }
102
103 fn settings(cx: &App) -> &VercelSettings {
104 &crate::AllLanguageModelSettings::get_global(cx).vercel
105 }
106
107 fn api_url(cx: &App) -> SharedString {
108 let api_url = &Self::settings(cx).api_url;
109 if api_url.is_empty() {
110 VERCEL_API_URL.into()
111 } else {
112 SharedString::new(api_url.as_str())
113 }
114 }
115}
116
117impl LanguageModelProviderState for VercelLanguageModelProvider {
118 type ObservableEntity = State;
119
120 fn observable_entity(&self) -> Option<Entity<Self::ObservableEntity>> {
121 Some(self.state.clone())
122 }
123}
124
125impl LanguageModelProvider for VercelLanguageModelProvider {
126 fn id(&self) -> LanguageModelProviderId {
127 PROVIDER_ID
128 }
129
130 fn name(&self) -> LanguageModelProviderName {
131 PROVIDER_NAME
132 }
133
134 fn icon(&self) -> IconName {
135 IconName::AiVZero
136 }
137
138 fn default_model(&self, _cx: &App) -> Option<Arc<dyn LanguageModel>> {
139 Some(self.create_language_model(vercel::Model::default()))
140 }
141
142 fn default_fast_model(&self, _cx: &App) -> Option<Arc<dyn LanguageModel>> {
143 Some(self.create_language_model(vercel::Model::default_fast()))
144 }
145
146 fn provided_models(&self, cx: &App) -> Vec<Arc<dyn LanguageModel>> {
147 let mut models = BTreeMap::default();
148
149 for model in vercel::Model::iter() {
150 if !matches!(model, vercel::Model::Custom { .. }) {
151 models.insert(model.id().to_string(), model);
152 }
153 }
154
155 for model in &Self::settings(cx).available_models {
156 models.insert(
157 model.name.clone(),
158 vercel::Model::Custom {
159 name: model.name.clone(),
160 display_name: model.display_name.clone(),
161 max_tokens: model.max_tokens,
162 max_output_tokens: model.max_output_tokens,
163 max_completion_tokens: model.max_completion_tokens,
164 },
165 );
166 }
167
168 models
169 .into_values()
170 .map(|model| self.create_language_model(model))
171 .collect()
172 }
173
174 fn is_authenticated(&self, cx: &App) -> bool {
175 self.state.read(cx).is_authenticated()
176 }
177
178 fn authenticate(&self, cx: &mut App) -> Task<Result<(), AuthenticateError>> {
179 self.state.update(cx, |state, cx| state.authenticate(cx))
180 }
181
182 fn configuration_view(
183 &self,
184 _target_agent: language_model::ConfigurationViewTargetAgent,
185 window: &mut Window,
186 cx: &mut App,
187 ) -> AnyView {
188 cx.new(|cx| ConfigurationView::new(self.state.clone(), window, cx))
189 .into()
190 }
191
192 fn reset_credentials(&self, cx: &mut App) -> Task<Result<()>> {
193 self.state
194 .update(cx, |state, cx| state.set_api_key(None, cx))
195 }
196}
197
198pub struct VercelLanguageModel {
199 id: LanguageModelId,
200 model: vercel::Model,
201 state: Entity<State>,
202 http_client: Arc<dyn HttpClient>,
203 request_limiter: RateLimiter,
204}
205
206impl VercelLanguageModel {
207 fn stream_completion(
208 &self,
209 request: open_ai::Request,
210 cx: &AsyncApp,
211 ) -> BoxFuture<'static, Result<futures::stream::BoxStream<'static, Result<ResponseStreamEvent>>>>
212 {
213 let http_client = self.http_client.clone();
214
215 let Ok((api_key, api_url)) = self.state.read_with(cx, |state, cx| {
216 let api_url = VercelLanguageModelProvider::api_url(cx);
217 (state.api_key_state.key(&api_url), api_url)
218 }) else {
219 return future::ready(Err(anyhow!("App state dropped"))).boxed();
220 };
221
222 let future = self.request_limiter.stream(async move {
223 let Some(api_key) = api_key else {
224 return Err(LanguageModelCompletionError::NoApiKey {
225 provider: PROVIDER_NAME,
226 });
227 };
228 let request =
229 open_ai::stream_completion(http_client.as_ref(), &api_url, &api_key, request);
230 let response = request.await?;
231 Ok(response)
232 });
233
234 async move { Ok(future.await?.boxed()) }.boxed()
235 }
236}
237
238impl LanguageModel for VercelLanguageModel {
239 fn id(&self) -> LanguageModelId {
240 self.id.clone()
241 }
242
243 fn name(&self) -> LanguageModelName {
244 LanguageModelName::from(self.model.display_name().to_string())
245 }
246
247 fn provider_id(&self) -> LanguageModelProviderId {
248 PROVIDER_ID
249 }
250
251 fn provider_name(&self) -> LanguageModelProviderName {
252 PROVIDER_NAME
253 }
254
255 fn supports_tools(&self) -> bool {
256 true
257 }
258
259 fn supports_images(&self) -> bool {
260 true
261 }
262
263 fn supports_tool_choice(&self, choice: LanguageModelToolChoice) -> bool {
264 match choice {
265 LanguageModelToolChoice::Auto
266 | LanguageModelToolChoice::Any
267 | LanguageModelToolChoice::None => true,
268 }
269 }
270
271 fn telemetry_id(&self) -> String {
272 format!("vercel/{}", self.model.id())
273 }
274
275 fn max_token_count(&self) -> u64 {
276 self.model.max_token_count()
277 }
278
279 fn max_output_tokens(&self) -> Option<u64> {
280 self.model.max_output_tokens()
281 }
282
283 fn count_tokens(
284 &self,
285 request: LanguageModelRequest,
286 cx: &App,
287 ) -> BoxFuture<'static, Result<u64>> {
288 count_vercel_tokens(request, self.model.clone(), cx)
289 }
290
291 fn stream_completion(
292 &self,
293 request: LanguageModelRequest,
294 cx: &AsyncApp,
295 ) -> BoxFuture<
296 'static,
297 Result<
298 futures::stream::BoxStream<
299 'static,
300 Result<LanguageModelCompletionEvent, LanguageModelCompletionError>,
301 >,
302 LanguageModelCompletionError,
303 >,
304 > {
305 let request = crate::provider::open_ai::into_open_ai(
306 request,
307 self.model.id(),
308 self.model.supports_parallel_tool_calls(),
309 self.model.supports_prompt_cache_key(),
310 self.max_output_tokens(),
311 None,
312 );
313 let completions = self.stream_completion(request, cx);
314 async move {
315 let mapper = crate::provider::open_ai::OpenAiEventMapper::new();
316 Ok(mapper.map_stream(completions.await?).boxed())
317 }
318 .boxed()
319 }
320}
321
322pub fn count_vercel_tokens(
323 request: LanguageModelRequest,
324 model: Model,
325 cx: &App,
326) -> BoxFuture<'static, Result<u64>> {
327 cx.background_spawn(async move {
328 let messages = request
329 .messages
330 .into_iter()
331 .map(|message| tiktoken_rs::ChatCompletionRequestMessage {
332 role: match message.role {
333 Role::User => "user".into(),
334 Role::Assistant => "assistant".into(),
335 Role::System => "system".into(),
336 },
337 content: Some(message.string_contents()),
338 name: None,
339 function_call: None,
340 })
341 .collect::<Vec<_>>();
342
343 match model {
344 Model::Custom { max_tokens, .. } => {
345 let model = if max_tokens >= 100_000 {
346 // If the max tokens is 100k or more, it is likely the o200k_base tokenizer from gpt4o
347 "gpt-4o"
348 } else {
349 // Otherwise fallback to gpt-4, since only cl100k_base and o200k_base are
350 // supported with this tiktoken method
351 "gpt-4"
352 };
353 tiktoken_rs::num_tokens_from_messages(model, &messages)
354 }
355 // Map Vercel models to appropriate OpenAI models for token counting
356 // since Vercel uses OpenAI-compatible API
357 Model::VZeroOnePointFiveMedium => {
358 // Vercel v0 is similar to GPT-4o, so use gpt-4o for token counting
359 tiktoken_rs::num_tokens_from_messages("gpt-4o", &messages)
360 }
361 }
362 .map(|tokens| tokens as u64)
363 })
364 .boxed()
365}
366
367struct ConfigurationView {
368 api_key_editor: Entity<InputField>,
369 state: Entity<State>,
370 load_credentials_task: Option<Task<()>>,
371}
372
373impl ConfigurationView {
374 fn new(state: Entity<State>, window: &mut Window, cx: &mut Context<Self>) -> Self {
375 let api_key_editor = cx.new(|cx| {
376 InputField::new(
377 window,
378 cx,
379 "v1:0000000000000000000000000000000000000000000000000",
380 )
381 .label("API key")
382 });
383
384 cx.observe(&state, |_, _, cx| {
385 cx.notify();
386 })
387 .detach();
388
389 let load_credentials_task = Some(cx.spawn_in(window, {
390 let state = state.clone();
391 async move |this, cx| {
392 if let Some(task) = state
393 .update(cx, |state, cx| state.authenticate(cx))
394 .log_err()
395 {
396 // We don't log an error, because "not signed in" is also an error.
397 let _ = task.await;
398 }
399 this.update(cx, |this, cx| {
400 this.load_credentials_task = None;
401 cx.notify();
402 })
403 .log_err();
404 }
405 }));
406
407 Self {
408 api_key_editor,
409 state,
410 load_credentials_task,
411 }
412 }
413
414 fn save_api_key(&mut self, _: &menu::Confirm, window: &mut Window, cx: &mut Context<Self>) {
415 let api_key = self.api_key_editor.read(cx).text(cx).trim().to_string();
416 if api_key.is_empty() {
417 return;
418 }
419
420 // url changes can cause the editor to be displayed again
421 self.api_key_editor
422 .update(cx, |editor, cx| editor.set_text("", window, cx));
423
424 let state = self.state.clone();
425 cx.spawn_in(window, async move |_, cx| {
426 state
427 .update(cx, |state, cx| state.set_api_key(Some(api_key), cx))?
428 .await
429 })
430 .detach_and_log_err(cx);
431 }
432
433 fn reset_api_key(&mut self, window: &mut Window, cx: &mut Context<Self>) {
434 self.api_key_editor
435 .update(cx, |input, cx| input.set_text("", window, cx));
436
437 let state = self.state.clone();
438 cx.spawn_in(window, async move |_, cx| {
439 state
440 .update(cx, |state, cx| state.set_api_key(None, cx))?
441 .await
442 })
443 .detach_and_log_err(cx);
444 }
445
446 fn should_render_editor(&self, cx: &mut Context<Self>) -> bool {
447 !self.state.read(cx).is_authenticated()
448 }
449}
450
451impl Render for ConfigurationView {
452 fn render(&mut self, _: &mut Window, cx: &mut Context<Self>) -> impl IntoElement {
453 let env_var_set = self.state.read(cx).api_key_state.is_from_env_var();
454 let configured_card_label = if env_var_set {
455 format!("API key set in {API_KEY_ENV_VAR_NAME} environment variable")
456 } else {
457 let api_url = VercelLanguageModelProvider::api_url(cx);
458 if api_url == VERCEL_API_URL {
459 "API key configured".to_string()
460 } else {
461 format!("API key configured for {}", api_url)
462 }
463 };
464
465 let api_key_section = if self.should_render_editor(cx) {
466 v_flex()
467 .on_action(cx.listener(Self::save_api_key))
468 .child(Label::new("To use Zed's agent with Vercel v0, you need to add an API key. Follow these steps:"))
469 .child(
470 List::new()
471 .child(InstructionListItem::new(
472 "Create one by visiting",
473 Some("Vercel v0's console"),
474 Some("https://v0.dev/chat/settings/keys"),
475 ))
476 .child(InstructionListItem::text_only(
477 "Paste your API key below and hit enter to start using the agent",
478 )),
479 )
480 .child(self.api_key_editor.clone())
481 .child(
482 Label::new(format!(
483 "You can also assign the {API_KEY_ENV_VAR_NAME} environment variable and restart Zed."
484 ))
485 .size(LabelSize::Small)
486 .color(Color::Muted),
487 )
488 .child(
489 Label::new("Note that Vercel v0 is a custom OpenAI-compatible provider.")
490 .size(LabelSize::Small)
491 .color(Color::Muted),
492 )
493 .into_any_element()
494 } else {
495 ConfiguredApiCard::new(configured_card_label)
496 .disabled(env_var_set)
497 .when(env_var_set, |this| {
498 this.tooltip_label(format!("To reset your API key, unset the {API_KEY_ENV_VAR_NAME} environment variable."))
499 })
500 .on_click(cx.listener(|this, _, window, cx| this.reset_api_key(window, cx)))
501 .into_any_element()
502 };
503
504 if self.load_credentials_task.is_some() {
505 div().child(Label::new("Loading credentials…")).into_any()
506 } else {
507 v_flex().size_full().child(api_key_section).into_any()
508 }
509 }
510}