1use crate::{
2 DebugEvent, EditPredictionFinishedDebugEvent, EditPredictionId, EditPredictionModelInput,
3 EditPredictionStartedDebugEvent, EditPredictionStore, open_ai_response::text_from_response,
4 prediction::EditPredictionResult, zeta::compute_edits,
5};
6use anyhow::{Context as _, Result};
7use cloud_llm_client::EditPredictionRejectReason;
8use futures::AsyncReadExt as _;
9use gpui::{
10 App, AppContext as _, Context, Entity, Global, SharedString, Task,
11 http_client::{self, AsyncBody, HttpClient, Method, StatusCode},
12};
13use language::{ToOffset, ToPoint as _};
14use language_model::{ApiKeyState, EnvVar, env_var};
15use release_channel::AppVersion;
16use serde::{Deserialize, Serialize};
17use std::{mem, ops::Range, path::Path, sync::Arc, time::Instant};
18use zeta_prompt::ZetaPromptInput;
19
/// Endpoint that edit prediction requests are POSTed to.
const MERCURY_API_URL: &str = "https://api.inceptionlabs.ai/v1/edit/completions";
21
/// State for the Mercury edit prediction provider.
pub struct Mercury {
    /// Entity holding the API key state used to authenticate Mercury requests.
    pub api_token: Entity<ApiKeyState>,
    /// Whether the most recently completed prediction request failed with a
    /// payment-required error. Starts out `false`.
    payment_required_error: bool,
}
26
27impl Mercury {
28 pub fn new(cx: &mut App) -> Self {
29 Mercury {
30 api_token: mercury_api_token(cx),
31 payment_required_error: false,
32 }
33 }
34
35 pub fn has_payment_required_error(&self) -> bool {
36 self.payment_required_error
37 }
38
39 pub fn set_payment_required_error(&mut self, payment_required_error: bool) {
40 self.payment_required_error = payment_required_error;
41 }
42
43 pub(crate) fn request_prediction(
44 &mut self,
45 EditPredictionModelInput {
46 buffer,
47 snapshot,
48 position,
49 events,
50 related_files,
51 debug_tx,
52 ..
53 }: EditPredictionModelInput,
54 cx: &mut Context<EditPredictionStore>,
55 ) -> Task<Result<Option<EditPredictionResult>>> {
56 self.api_token.update(cx, |key_state, cx| {
57 _ = key_state.load_if_needed(MERCURY_CREDENTIALS_URL, |s| s, cx);
58 });
59 let Some(api_token) = self.api_token.read(cx).key(&MERCURY_CREDENTIALS_URL) else {
60 return Task::ready(Ok(None));
61 };
62 let full_path: Arc<Path> = snapshot
63 .file()
64 .map(|file| file.full_path(cx))
65 .unwrap_or_else(|| "untitled".into())
66 .into();
67
68 let http_client = cx.http_client();
69 let cursor_point = position.to_point(&snapshot);
70 let buffer_snapshotted_at = Instant::now();
71 let active_buffer = buffer.clone();
72
73 let result = cx.background_spawn(async move {
74 let cursor_offset = cursor_point.to_offset(&snapshot);
75 let (excerpt_point_range, excerpt_offset_range, cursor_offset_in_excerpt) =
76 crate::cursor_excerpt::compute_cursor_excerpt(&snapshot, cursor_offset);
77
78 let related_files = zeta_prompt::filter_redundant_excerpts(
79 related_files,
80 full_path.as_ref(),
81 excerpt_point_range.start.row..excerpt_point_range.end.row,
82 );
83
84 let cursor_excerpt: Arc<str> = snapshot
85 .text_for_range(excerpt_point_range.clone())
86 .collect::<String>()
87 .into();
88 let syntax_ranges = crate::cursor_excerpt::compute_syntax_ranges(
89 &snapshot,
90 cursor_offset,
91 &excerpt_offset_range,
92 );
93 let excerpt_ranges = zeta_prompt::compute_legacy_excerpt_ranges(
94 &cursor_excerpt,
95 cursor_offset_in_excerpt,
96 &syntax_ranges,
97 );
98
99 let editable_offset_range = (excerpt_offset_range.start
100 + excerpt_ranges.editable_350.start)
101 ..(excerpt_offset_range.start + excerpt_ranges.editable_350.end);
102
103 let inputs = zeta_prompt::ZetaPromptInput {
104 events,
105 related_files: Some(related_files),
106 cursor_offset_in_excerpt: cursor_point.to_offset(&snapshot)
107 - excerpt_offset_range.start,
108 cursor_path: full_path.clone(),
109 cursor_excerpt,
110 experiment: None,
111 excerpt_start_row: Some(excerpt_point_range.start.row),
112 excerpt_ranges,
113 syntax_ranges: Some(syntax_ranges),
114 active_buffer_diagnostics: vec![],
115 in_open_source_repo: false,
116 can_collect_data: false,
117 repo_url: None,
118 };
119
120 let prompt = build_prompt(&inputs);
121
122 if let Some(debug_tx) = &debug_tx {
123 debug_tx
124 .unbounded_send(DebugEvent::EditPredictionStarted(
125 EditPredictionStartedDebugEvent {
126 buffer: active_buffer.downgrade(),
127 prompt: Some(prompt.clone()),
128 position,
129 },
130 ))
131 .ok();
132 }
133
134 let request_body = open_ai::Request {
135 model: "mercury-coder".into(),
136 messages: vec![open_ai::RequestMessage::User {
137 content: open_ai::MessageContent::Plain(prompt),
138 }],
139 stream: false,
140 max_completion_tokens: None,
141 stop: vec![],
142 temperature: None,
143 tool_choice: None,
144 parallel_tool_calls: None,
145 tools: vec![],
146 prompt_cache_key: None,
147 reasoning_effort: None,
148 };
149
150 let buf = serde_json::to_vec(&request_body)?;
151 let body: AsyncBody = buf.into();
152
153 let request = http_client::Request::builder()
154 .uri(MERCURY_API_URL)
155 .header("Content-Type", "application/json")
156 .header("Authorization", format!("Bearer {}", api_token))
157 .header("Connection", "keep-alive")
158 .method(Method::POST)
159 .body(body)
160 .context("Failed to create request")?;
161
162 let mut response = http_client
163 .send(request)
164 .await
165 .context("Failed to send request")?;
166
167 let mut body: Vec<u8> = Vec::new();
168 response
169 .body_mut()
170 .read_to_end(&mut body)
171 .await
172 .context("Failed to read response body")?;
173
174 let response_received_at = Instant::now();
175 if !response.status().is_success() {
176 if response.status() == StatusCode::PAYMENT_REQUIRED {
177 anyhow::bail!(MercuryPaymentRequiredError(
178 mercury_payment_required_message(&body),
179 ));
180 }
181
182 anyhow::bail!(
183 "Request failed with status: {:?}\nBody: {}",
184 response.status(),
185 String::from_utf8_lossy(&body),
186 );
187 };
188
189 let mut response: open_ai::Response =
190 serde_json::from_slice(&body).context("Failed to parse response")?;
191
192 let id = mem::take(&mut response.id);
193 let response_str = text_from_response(response).unwrap_or_default();
194
195 if let Some(debug_tx) = &debug_tx {
196 debug_tx
197 .unbounded_send(DebugEvent::EditPredictionFinished(
198 EditPredictionFinishedDebugEvent {
199 buffer: active_buffer.downgrade(),
200 model_output: Some(response_str.clone()),
201 position,
202 },
203 ))
204 .ok();
205 }
206
207 let response_str = response_str.strip_prefix("```\n").unwrap_or(&response_str);
208 let response_str = response_str.strip_suffix("\n```").unwrap_or(&response_str);
209
210 let mut edits = Vec::new();
211 const NO_PREDICTION_OUTPUT: &str = "None";
212
213 if response_str != NO_PREDICTION_OUTPUT {
214 let old_text = snapshot
215 .text_for_range(editable_offset_range.clone())
216 .collect::<String>();
217 edits = compute_edits(
218 old_text,
219 &response_str,
220 editable_offset_range.start,
221 &snapshot,
222 );
223 }
224
225 anyhow::Ok((id, edits, snapshot, response_received_at, inputs))
226 });
227
228 cx.spawn(async move |ep_store, cx| {
229 let result = result.await.context("Mercury edit prediction failed");
230
231 let has_payment_required_error = result
232 .as_ref()
233 .err()
234 .is_some_and(is_mercury_payment_required_error);
235
236 ep_store.update(cx, |store, cx| {
237 store
238 .mercury
239 .set_payment_required_error(has_payment_required_error);
240 cx.notify();
241 })?;
242
243 let (id, edits, old_snapshot, response_received_at, inputs) = result?;
244 anyhow::Ok(Some(
245 EditPredictionResult::new(
246 EditPredictionId(id.into()),
247 &buffer,
248 &old_snapshot,
249 edits.into(),
250 None,
251 buffer_snapshotted_at,
252 response_received_at,
253 inputs,
254 None,
255 cx,
256 )
257 .await,
258 ))
259 })
260 }
261}
262
263fn build_prompt(inputs: &ZetaPromptInput) -> String {
264 const RECENTLY_VIEWED_SNIPPETS_START: &str = "<|recently_viewed_code_snippets|>\n";
265 const RECENTLY_VIEWED_SNIPPETS_END: &str = "<|/recently_viewed_code_snippets|>\n";
266 const RECENTLY_VIEWED_SNIPPET_START: &str = "<|recently_viewed_code_snippet|>\n";
267 const RECENTLY_VIEWED_SNIPPET_END: &str = "<|/recently_viewed_code_snippet|>\n";
268 const CURRENT_FILE_CONTENT_START: &str = "<|current_file_content|>\n";
269 const CURRENT_FILE_CONTENT_END: &str = "<|/current_file_content|>\n";
270 const CODE_TO_EDIT_START: &str = "<|code_to_edit|>\n";
271 const CODE_TO_EDIT_END: &str = "<|/code_to_edit|>\n";
272 const EDIT_DIFF_HISTORY_START: &str = "<|edit_diff_history|>\n";
273 const EDIT_DIFF_HISTORY_END: &str = "<|/edit_diff_history|>\n";
274 const CURSOR_TAG: &str = "<|cursor|>";
275 const CODE_SNIPPET_FILE_PATH_PREFIX: &str = "code_snippet_file_path: ";
276 const CURRENT_FILE_PATH_PREFIX: &str = "current_file_path: ";
277
278 let mut prompt = String::new();
279
280 push_delimited(
281 &mut prompt,
282 RECENTLY_VIEWED_SNIPPETS_START..RECENTLY_VIEWED_SNIPPETS_END,
283 |prompt| {
284 for related_file in inputs.related_files.as_deref().unwrap_or_default().iter() {
285 for related_excerpt in &related_file.excerpts {
286 push_delimited(
287 prompt,
288 RECENTLY_VIEWED_SNIPPET_START..RECENTLY_VIEWED_SNIPPET_END,
289 |prompt| {
290 prompt.push_str(CODE_SNIPPET_FILE_PATH_PREFIX);
291 prompt.push_str(related_file.path.to_string_lossy().as_ref());
292 prompt.push('\n');
293 prompt.push_str(related_excerpt.text.as_ref());
294 },
295 );
296 }
297 }
298 },
299 );
300
301 push_delimited(
302 &mut prompt,
303 CURRENT_FILE_CONTENT_START..CURRENT_FILE_CONTENT_END,
304 |prompt| {
305 prompt.push_str(CURRENT_FILE_PATH_PREFIX);
306 prompt.push_str(inputs.cursor_path.as_os_str().to_string_lossy().as_ref());
307 prompt.push('\n');
308
309 let editable_range = &inputs.excerpt_ranges.editable_350;
310 prompt.push_str(&inputs.cursor_excerpt[0..editable_range.start]);
311 push_delimited(prompt, CODE_TO_EDIT_START..CODE_TO_EDIT_END, |prompt| {
312 prompt.push_str(
313 &inputs.cursor_excerpt[editable_range.start..inputs.cursor_offset_in_excerpt],
314 );
315 prompt.push_str(CURSOR_TAG);
316 prompt.push_str(
317 &inputs.cursor_excerpt[inputs.cursor_offset_in_excerpt..editable_range.end],
318 );
319 });
320 prompt.push_str(&inputs.cursor_excerpt[editable_range.end..]);
321 },
322 );
323
324 push_delimited(
325 &mut prompt,
326 EDIT_DIFF_HISTORY_START..EDIT_DIFF_HISTORY_END,
327 |prompt| {
328 for event in inputs.events.iter() {
329 zeta_prompt::write_event(prompt, &event);
330 }
331 },
332 );
333
334 prompt
335}
336
/// Appends a delimited section to `prompt`.
///
/// Writes `delimiters.start`, lets `cb` append the section body, then writes a
/// newline followed by `delimiters.end`. The newline is written even when `cb`
/// appends nothing.
fn push_delimited(prompt: &mut String, delimiters: Range<&str>, cb: impl FnOnce(&mut String)) {
    let Range {
        start: opening,
        end: closing,
    } = delimiters;

    prompt.push_str(opening);
    cb(prompt);
    prompt.extend(["\n", closing]);
}
343
/// Key under which the Mercury API token is loaded and looked up in
/// [`ApiKeyState`]. The value is the same string as `MERCURY_API_URL`, kept as
/// a separate constant.
pub const MERCURY_CREDENTIALS_URL: SharedString =
    SharedString::new_static("https://api.inceptionlabs.ai/v1/edit/completions");
// NOTE(review): not referenced elsewhere in this file; presumably the username
// paired with the stored credential — confirm against callers.
pub const MERCURY_CREDENTIALS_USERNAME: &str = "mercury-api-token";
347
/// Error raised when the Mercury API responds with HTTP 402 (payment required).
/// Its display text is the wrapped message.
#[derive(Debug, thiserror::Error)]
#[error("{0}")]
struct MercuryPaymentRequiredError(SharedString);
351
/// JSON error body of the form `{"error": {"message": ...}}`, as parsed by
/// `mercury_payment_required_message`.
#[derive(Deserialize)]
struct MercuryErrorResponse {
    error: MercuryErrorMessage,
}
356
/// Inner `error` object of a [`MercuryErrorResponse`].
#[derive(Deserialize)]
struct MercuryErrorMessage {
    /// Error text extracted for payment-required responses.
    message: String,
}
361
362fn is_mercury_payment_required_error(error: &anyhow::Error) -> bool {
363 error
364 .downcast_ref::<MercuryPaymentRequiredError>()
365 .is_some()
366}
367
368fn mercury_payment_required_message(body: &[u8]) -> SharedString {
369 serde_json::from_slice::<MercuryErrorResponse>(body)
370 .map(|response| response.error.message.into())
371 .unwrap_or_else(|_| String::from_utf8_lossy(body).trim().to_string().into())
372}
373
/// The `MERCURY_AI_TOKEN` environment variable, handed to [`ApiKeyState::new`]
/// when the shared API-key entity is created.
pub static MERCURY_TOKEN_ENV_VAR: std::sync::LazyLock<EnvVar> = env_var!("MERCURY_AI_TOKEN");
375
/// App-global wrapper that caches the Mercury API-key entity so every caller of
/// `mercury_api_token` gets the same one.
struct GlobalMercuryApiKey(Entity<ApiKeyState>);

impl Global for GlobalMercuryApiKey {}
379
380pub fn mercury_api_token(cx: &mut App) -> Entity<ApiKeyState> {
381 if let Some(global) = cx.try_global::<GlobalMercuryApiKey>() {
382 return global.0.clone();
383 }
384 let entity =
385 cx.new(|_| ApiKeyState::new(MERCURY_CREDENTIALS_URL, MERCURY_TOKEN_ENV_VAR.clone()));
386 cx.set_global(GlobalMercuryApiKey(entity.clone()));
387 entity
388}
389
390pub fn load_mercury_api_token(cx: &mut App) -> Task<Result<(), language_model::AuthenticateError>> {
391 mercury_api_token(cx).update(cx, |key_state, cx| {
392 key_state.load_if_needed(MERCURY_CREDENTIALS_URL, |s| s, cx)
393 })
394}
395
/// Endpoint that accept/reject/ignore feedback is POSTed to.
const FEEDBACK_API_URL: &str = "https://api-feedback.inceptionlabs.ai/feedback";
397
/// User reaction to a prediction, as reported to the feedback endpoint.
/// Serialized in snake case (`accept`, `reject`, `ignore`).
#[derive(Debug, Clone, Copy, PartialEq, Eq, Serialize)]
#[serde(rename_all = "snake_case")]
enum MercuryUserAction {
    /// Sent when a prediction is accepted.
    Accept,
    /// Sent for a shown prediction rejected with `EditPredictionRejectReason::Rejected`.
    Reject,
    /// Sent for a shown prediction rejected with `EditPredictionRejectReason::Discarded`.
    Ignore,
}
405
/// JSON payload sent to the feedback endpoint.
#[derive(Serialize)]
struct FeedbackRequest {
    /// Id of the prediction the feedback refers to.
    request_id: SharedString,
    /// Always `"zed"` in this file.
    provider_name: &'static str,
    /// What the user did with the prediction.
    user_action: MercuryUserAction,
    /// The app version, rendered as a string.
    provider_version: String,
}
413
414pub(crate) fn edit_prediction_accepted(
415 prediction_id: EditPredictionId,
416 http_client: Arc<dyn HttpClient>,
417 cx: &App,
418) {
419 send_feedback(prediction_id, MercuryUserAction::Accept, http_client, cx);
420}
421
422pub(crate) fn edit_prediction_rejected(
423 prediction_id: EditPredictionId,
424 was_shown: bool,
425 reason: EditPredictionRejectReason,
426 http_client: Arc<dyn HttpClient>,
427 cx: &App,
428) {
429 if !was_shown {
430 return;
431 }
432 let action = match reason {
433 EditPredictionRejectReason::Rejected => MercuryUserAction::Reject,
434 EditPredictionRejectReason::Discarded => MercuryUserAction::Ignore,
435 _ => return,
436 };
437 send_feedback(prediction_id, action, http_client, cx);
438}
439
440fn send_feedback(
441 prediction_id: EditPredictionId,
442 action: MercuryUserAction,
443 http_client: Arc<dyn HttpClient>,
444 cx: &App,
445) {
446 let request_id = prediction_id.0;
447 let app_version = AppVersion::global(cx);
448 cx.background_spawn(async move {
449 let body = FeedbackRequest {
450 request_id,
451 provider_name: "zed",
452 user_action: action,
453 provider_version: app_version.to_string(),
454 };
455
456 let request = http_client::Request::builder()
457 .uri(FEEDBACK_API_URL)
458 .method(Method::POST)
459 .header("Content-Type", "application/json")
460 .body(AsyncBody::from(serde_json::to_vec(&body)?))?;
461
462 let response = http_client.send(request).await?;
463 if !response.status().is_success() {
464 anyhow::bail!("Feedback API returned status: {}", response.status());
465 }
466
467 log::debug!(
468 "Mercury feedback sent: request_id={}, action={:?}",
469 body.request_id,
470 body.user_action
471 );
472
473 anyhow::Ok(())
474 })
475 .detach_and_log_err(cx);
476}