1use anyhow::{Result, anyhow};
2use collections::{BTreeMap, HashMap};
3use credentials_provider::CredentialsProvider;
4use deepseek::DEEPSEEK_API_URL;
5
6use futures::Stream;
7use futures::{FutureExt, StreamExt, future::BoxFuture, stream::BoxStream};
8use gpui::{AnyView, App, AsyncApp, Context, Entity, SharedString, Task, Window};
9use http_client::HttpClient;
10use language_model::{
11 ApiKeyState, AuthenticateError, EnvVar, IconOrSvg, LanguageModel, LanguageModelCompletionError,
12 LanguageModelCompletionEvent, LanguageModelId, LanguageModelName, LanguageModelProvider,
13 LanguageModelProviderId, LanguageModelProviderName, LanguageModelProviderState,
14 LanguageModelRequest, LanguageModelToolChoice, LanguageModelToolResultContent,
15 LanguageModelToolUse, MessageContent, RateLimiter, Role, StopReason, TokenUsage, env_var,
16};
17pub use settings::DeepseekAvailableModel as AvailableModel;
18use settings::{Settings, SettingsStore};
19use std::pin::Pin;
20use std::sync::{Arc, LazyLock};
21
22use ui::{ButtonLink, ConfiguredApiCard, List, ListBulletItem, prelude::*};
23use ui_input::InputField;
24use util::ResultExt;
25
26use language_model::util::{fix_streamed_json, parse_tool_arguments};
27
/// Identifier reported by the provider and by every model it creates.
const PROVIDER_ID: LanguageModelProviderId = LanguageModelProviderId::new("deepseek");
/// Display name of the provider; also attached to the "no API key" error.
const PROVIDER_NAME: LanguageModelProviderName = LanguageModelProviderName::new("DeepSeek");

/// Name of the environment variable that can supply the API key.
const API_KEY_ENV_VAR_NAME: &str = "DEEPSEEK_API_KEY";
/// Lazily initialized `EnvVar` for `API_KEY_ENV_VAR_NAME`, built by `env_var!`.
static API_KEY_ENV_VAR: LazyLock<EnvVar> = env_var!(API_KEY_ENV_VAR_NAME);
33
/// Accumulator for one tool call whose pieces arrive across several streamed
/// deltas. `DeepSeekEventMapper` keeps one of these per tool-call index.
#[derive(Default)]
struct RawToolCall {
    /// Tool-call identifier; stays empty until a delta supplies one.
    id: String,
    /// Function name; stays empty until a delta supplies one.
    name: String,
    /// Concatenation of every argument fragment received so far.
    arguments: String,
}
40
/// Settings for the DeepSeek provider.
#[derive(Default, Clone, Debug, PartialEq)]
pub struct DeepSeekSettings {
    /// Base URL of the API. An empty string makes the provider fall back to
    /// `DEEPSEEK_API_URL`.
    pub api_url: String,
    /// Extra models; the provider exposes each one as a
    /// `deepseek::Model::Custom` entry.
    pub available_models: Vec<AvailableModel>,
}
/// Language-model provider for DeepSeek.
pub struct DeepSeekLanguageModelProvider {
    /// HTTP client handed to every model this provider creates.
    http_client: Arc<dyn HttpClient>,
    /// Authentication state, shared with the created models and with the
    /// configuration view.
    state: Entity<State>,
}
50
/// Authentication state of the DeepSeek provider.
pub struct State {
    /// API-key bookkeeping (storing, loading, reacting to URL changes).
    api_key_state: ApiKeyState,
    /// Credentials backend passed to every `api_key_state` operation.
    credentials_provider: Arc<dyn CredentialsProvider>,
}
55
56impl State {
57 fn is_authenticated(&self) -> bool {
58 self.api_key_state.has_key()
59 }
60
61 fn set_api_key(&mut self, api_key: Option<String>, cx: &mut Context<Self>) -> Task<Result<()>> {
62 let credentials_provider = self.credentials_provider.clone();
63 let api_url = DeepSeekLanguageModelProvider::api_url(cx);
64 self.api_key_state.store(
65 api_url,
66 api_key,
67 |this| &mut this.api_key_state,
68 credentials_provider,
69 cx,
70 )
71 }
72
73 fn authenticate(&mut self, cx: &mut Context<Self>) -> Task<Result<(), AuthenticateError>> {
74 let credentials_provider = self.credentials_provider.clone();
75 let api_url = DeepSeekLanguageModelProvider::api_url(cx);
76 self.api_key_state.load_if_needed(
77 api_url,
78 |this| &mut this.api_key_state,
79 credentials_provider,
80 cx,
81 )
82 }
83}
84
85impl DeepSeekLanguageModelProvider {
86 pub fn new(
87 http_client: Arc<dyn HttpClient>,
88 credentials_provider: Arc<dyn CredentialsProvider>,
89 cx: &mut App,
90 ) -> Self {
91 let state = cx.new(|cx| {
92 cx.observe_global::<SettingsStore>(|this: &mut State, cx| {
93 let credentials_provider = this.credentials_provider.clone();
94 let api_url = Self::api_url(cx);
95 this.api_key_state.handle_url_change(
96 api_url,
97 |this| &mut this.api_key_state,
98 credentials_provider,
99 cx,
100 );
101 cx.notify();
102 })
103 .detach();
104 State {
105 api_key_state: ApiKeyState::new(Self::api_url(cx), (*API_KEY_ENV_VAR).clone()),
106 credentials_provider,
107 }
108 });
109
110 Self { http_client, state }
111 }
112
113 fn create_language_model(&self, model: deepseek::Model) -> Arc<dyn LanguageModel> {
114 Arc::new(DeepSeekLanguageModel {
115 id: LanguageModelId::from(model.id().to_string()),
116 model,
117 state: self.state.clone(),
118 http_client: self.http_client.clone(),
119 request_limiter: RateLimiter::new(4),
120 })
121 }
122
123 fn settings(cx: &App) -> &DeepSeekSettings {
124 &crate::AllLanguageModelSettings::get_global(cx).deepseek
125 }
126
127 fn api_url(cx: &App) -> SharedString {
128 let api_url = &Self::settings(cx).api_url;
129 if api_url.is_empty() {
130 DEEPSEEK_API_URL.into()
131 } else {
132 SharedString::new(api_url.as_str())
133 }
134 }
135}
136
137impl LanguageModelProviderState for DeepSeekLanguageModelProvider {
138 type ObservableEntity = State;
139
140 fn observable_entity(&self) -> Option<Entity<Self::ObservableEntity>> {
141 Some(self.state.clone())
142 }
143}
144
145impl LanguageModelProvider for DeepSeekLanguageModelProvider {
146 fn id(&self) -> LanguageModelProviderId {
147 PROVIDER_ID
148 }
149
150 fn name(&self) -> LanguageModelProviderName {
151 PROVIDER_NAME
152 }
153
154 fn icon(&self) -> IconOrSvg {
155 IconOrSvg::Icon(IconName::AiDeepSeek)
156 }
157
158 fn default_model(&self, _cx: &App) -> Option<Arc<dyn LanguageModel>> {
159 Some(self.create_language_model(deepseek::Model::default()))
160 }
161
162 fn default_fast_model(&self, _cx: &App) -> Option<Arc<dyn LanguageModel>> {
163 Some(self.create_language_model(deepseek::Model::default_fast()))
164 }
165
166 fn provided_models(&self, cx: &App) -> Vec<Arc<dyn LanguageModel>> {
167 let mut models = BTreeMap::default();
168
169 models.insert("deepseek-chat", deepseek::Model::Chat);
170 models.insert("deepseek-reasoner", deepseek::Model::Reasoner);
171
172 for available_model in &Self::settings(cx).available_models {
173 models.insert(
174 &available_model.name,
175 deepseek::Model::Custom {
176 name: available_model.name.clone(),
177 display_name: available_model.display_name.clone(),
178 max_tokens: available_model.max_tokens,
179 max_output_tokens: available_model.max_output_tokens,
180 },
181 );
182 }
183
184 models
185 .into_values()
186 .map(|model| self.create_language_model(model))
187 .collect()
188 }
189
190 fn is_authenticated(&self, cx: &App) -> bool {
191 self.state.read(cx).is_authenticated()
192 }
193
194 fn authenticate(&self, cx: &mut App) -> Task<Result<(), AuthenticateError>> {
195 self.state.update(cx, |state, cx| state.authenticate(cx))
196 }
197
198 fn configuration_view(
199 &self,
200 _target_agent: language_model::ConfigurationViewTargetAgent,
201 window: &mut Window,
202 cx: &mut App,
203 ) -> AnyView {
204 cx.new(|cx| ConfigurationView::new(self.state.clone(), window, cx))
205 .into()
206 }
207
208 fn reset_credentials(&self, cx: &mut App) -> Task<Result<()>> {
209 self.state
210 .update(cx, |state, cx| state.set_api_key(None, cx))
211 }
212}
213
/// A single DeepSeek model exposed through the `LanguageModel` trait.
pub struct DeepSeekLanguageModel {
    /// Identifier derived from `model.id()` when the model is created.
    id: LanguageModelId,
    /// The underlying DeepSeek model description.
    model: deepseek::Model,
    /// Provider state; read for the API key and URL on each request.
    state: Entity<State>,
    /// HTTP client used to send completion requests.
    http_client: Arc<dyn HttpClient>,
    /// Limiter through which every completion request is issued.
    request_limiter: RateLimiter,
}
221
222impl DeepSeekLanguageModel {
223 fn stream_completion(
224 &self,
225 request: deepseek::Request,
226 cx: &AsyncApp,
227 ) -> BoxFuture<'static, Result<BoxStream<'static, Result<deepseek::StreamResponse>>>> {
228 let http_client = self.http_client.clone();
229
230 let (api_key, api_url) = self.state.read_with(cx, |state, cx| {
231 let api_url = DeepSeekLanguageModelProvider::api_url(cx);
232 (state.api_key_state.key(&api_url), api_url)
233 });
234
235 let future = self.request_limiter.stream(async move {
236 let Some(api_key) = api_key else {
237 return Err(LanguageModelCompletionError::NoApiKey {
238 provider: PROVIDER_NAME,
239 });
240 };
241 let request =
242 deepseek::stream_completion(http_client.as_ref(), &api_url, &api_key, request);
243 let response = request.await?;
244 Ok(response)
245 });
246
247 async move { Ok(future.await?.boxed()) }.boxed()
248 }
249}
250
251impl LanguageModel for DeepSeekLanguageModel {
252 fn id(&self) -> LanguageModelId {
253 self.id.clone()
254 }
255
256 fn name(&self) -> LanguageModelName {
257 LanguageModelName::from(self.model.display_name().to_string())
258 }
259
260 fn provider_id(&self) -> LanguageModelProviderId {
261 PROVIDER_ID
262 }
263
264 fn provider_name(&self) -> LanguageModelProviderName {
265 PROVIDER_NAME
266 }
267
268 fn supports_tools(&self) -> bool {
269 true
270 }
271
272 fn supports_streaming_tools(&self) -> bool {
273 true
274 }
275
276 fn supports_tool_choice(&self, _choice: LanguageModelToolChoice) -> bool {
277 true
278 }
279
280 fn supports_images(&self) -> bool {
281 false
282 }
283
284 fn telemetry_id(&self) -> String {
285 format!("deepseek/{}", self.model.id())
286 }
287
288 fn max_token_count(&self) -> u64 {
289 self.model.max_token_count()
290 }
291
292 fn max_output_tokens(&self) -> Option<u64> {
293 self.model.max_output_tokens()
294 }
295
296 fn count_tokens(
297 &self,
298 request: LanguageModelRequest,
299 cx: &App,
300 ) -> BoxFuture<'static, Result<u64>> {
301 cx.background_spawn(async move {
302 let messages = request
303 .messages
304 .into_iter()
305 .map(|message| tiktoken_rs::ChatCompletionRequestMessage {
306 role: match message.role {
307 Role::User => "user".into(),
308 Role::Assistant => "assistant".into(),
309 Role::System => "system".into(),
310 },
311 content: Some(message.string_contents()),
312 name: None,
313 function_call: None,
314 })
315 .collect::<Vec<_>>();
316
317 tiktoken_rs::num_tokens_from_messages("gpt-4", &messages).map(|tokens| tokens as u64)
318 })
319 .boxed()
320 }
321
322 fn stream_completion(
323 &self,
324 request: LanguageModelRequest,
325 cx: &AsyncApp,
326 ) -> BoxFuture<
327 'static,
328 Result<
329 BoxStream<'static, Result<LanguageModelCompletionEvent, LanguageModelCompletionError>>,
330 LanguageModelCompletionError,
331 >,
332 > {
333 let request = into_deepseek(request, &self.model, self.max_output_tokens());
334 let stream = self.stream_completion(request, cx);
335
336 async move {
337 let mapper = DeepSeekEventMapper::new();
338 Ok(mapper.map_stream(stream.await?).boxed())
339 }
340 .boxed()
341 }
342}
343
344pub fn into_deepseek(
345 request: LanguageModelRequest,
346 model: &deepseek::Model,
347 max_output_tokens: Option<u64>,
348) -> deepseek::Request {
349 let is_reasoner = model == &deepseek::Model::Reasoner;
350
351 let mut messages = Vec::new();
352 let mut current_reasoning: Option<String> = None;
353
354 for message in request.messages {
355 for content in message.content {
356 match content {
357 MessageContent::Text(text) => {
358 let should_add = if message.role == Role::User {
359 !text.trim().is_empty()
360 } else {
361 !text.is_empty()
362 };
363
364 if should_add {
365 messages.push(match message.role {
366 Role::User => deepseek::RequestMessage::User { content: text },
367 Role::Assistant => deepseek::RequestMessage::Assistant {
368 content: Some(text),
369 tool_calls: Vec::new(),
370 reasoning_content: current_reasoning.take(),
371 },
372 Role::System => deepseek::RequestMessage::System { content: text },
373 });
374 }
375 }
376 MessageContent::Thinking { text, .. } => {
377 // Accumulate reasoning content for next assistant message
378 current_reasoning.get_or_insert_default().push_str(&text);
379 }
380 MessageContent::RedactedThinking(_) => {}
381 MessageContent::Image(_) => {}
382 MessageContent::ToolUse(tool_use) => {
383 let tool_call = deepseek::ToolCall {
384 id: tool_use.id.to_string(),
385 content: deepseek::ToolCallContent::Function {
386 function: deepseek::FunctionContent {
387 name: tool_use.name.to_string(),
388 arguments: serde_json::to_string(&tool_use.input)
389 .unwrap_or_default(),
390 },
391 },
392 };
393
394 if let Some(deepseek::RequestMessage::Assistant { tool_calls, .. }) =
395 messages.last_mut()
396 {
397 tool_calls.push(tool_call);
398 } else {
399 messages.push(deepseek::RequestMessage::Assistant {
400 content: None,
401 tool_calls: vec![tool_call],
402 reasoning_content: current_reasoning.take(),
403 });
404 }
405 }
406 MessageContent::ToolResult(tool_result) => {
407 match &tool_result.content {
408 LanguageModelToolResultContent::Text(text) => {
409 messages.push(deepseek::RequestMessage::Tool {
410 content: text.to_string(),
411 tool_call_id: tool_result.tool_use_id.to_string(),
412 });
413 }
414 LanguageModelToolResultContent::Image(_) => {}
415 };
416 }
417 }
418 }
419 }
420
421 deepseek::Request {
422 model: model.id().to_string(),
423 messages,
424 stream: true,
425 max_tokens: max_output_tokens,
426 temperature: if is_reasoner {
427 None
428 } else {
429 request.temperature
430 },
431 response_format: None,
432 tools: request
433 .tools
434 .into_iter()
435 .map(|tool| deepseek::ToolDefinition::Function {
436 function: deepseek::FunctionDefinition {
437 name: tool.name,
438 description: Some(tool.description),
439 parameters: Some(tool.input_schema),
440 },
441 })
442 .collect(),
443 }
444}
445
/// Stateful converter from raw DeepSeek stream responses to
/// `LanguageModelCompletionEvent`s.
pub struct DeepSeekEventMapper {
    /// Tool calls still being assembled, keyed by the `index` carried on each
    /// streamed tool-call delta.
    tool_calls_by_index: HashMap<usize, RawToolCall>,
}
449
450impl DeepSeekEventMapper {
451 pub fn new() -> Self {
452 Self {
453 tool_calls_by_index: HashMap::default(),
454 }
455 }
456
457 pub fn map_stream(
458 mut self,
459 events: Pin<Box<dyn Send + Stream<Item = Result<deepseek::StreamResponse>>>>,
460 ) -> impl Stream<Item = Result<LanguageModelCompletionEvent, LanguageModelCompletionError>>
461 {
462 events.flat_map(move |event| {
463 futures::stream::iter(match event {
464 Ok(event) => self.map_event(event),
465 Err(error) => vec![Err(LanguageModelCompletionError::from(error))],
466 })
467 })
468 }
469
470 pub fn map_event(
471 &mut self,
472 event: deepseek::StreamResponse,
473 ) -> Vec<Result<LanguageModelCompletionEvent, LanguageModelCompletionError>> {
474 let Some(choice) = event.choices.first() else {
475 return vec![Err(LanguageModelCompletionError::from(anyhow!(
476 "Response contained no choices"
477 )))];
478 };
479
480 let mut events = Vec::new();
481 if let Some(content) = choice.delta.content.clone()
482 && !content.is_empty()
483 {
484 events.push(Ok(LanguageModelCompletionEvent::Text(content)));
485 }
486
487 if let Some(reasoning_content) = choice.delta.reasoning_content.clone() {
488 events.push(Ok(LanguageModelCompletionEvent::Thinking {
489 text: reasoning_content,
490 signature: None,
491 }));
492 }
493
494 if let Some(tool_calls) = choice.delta.tool_calls.as_ref() {
495 for tool_call in tool_calls {
496 let entry = self.tool_calls_by_index.entry(tool_call.index).or_default();
497
498 if let Some(tool_id) = tool_call.id.clone() {
499 entry.id = tool_id;
500 }
501
502 if let Some(function) = tool_call.function.as_ref() {
503 if let Some(name) = function.name.clone() {
504 entry.name = name;
505 }
506
507 if let Some(arguments) = function.arguments.clone() {
508 entry.arguments.push_str(&arguments);
509 }
510 }
511
512 if !entry.id.is_empty() && !entry.name.is_empty() {
513 if let Ok(input) = serde_json::from_str::<serde_json::Value>(
514 &fix_streamed_json(&entry.arguments),
515 ) {
516 events.push(Ok(LanguageModelCompletionEvent::ToolUse(
517 LanguageModelToolUse {
518 id: entry.id.clone().into(),
519 name: entry.name.as_str().into(),
520 is_input_complete: false,
521 input,
522 raw_input: entry.arguments.clone(),
523 thought_signature: None,
524 },
525 )));
526 }
527 }
528 }
529 }
530
531 if let Some(usage) = event.usage {
532 events.push(Ok(LanguageModelCompletionEvent::UsageUpdate(TokenUsage {
533 input_tokens: usage.prompt_tokens,
534 output_tokens: usage.completion_tokens,
535 cache_creation_input_tokens: 0,
536 cache_read_input_tokens: 0,
537 })));
538 }
539
540 match choice.finish_reason.as_deref() {
541 Some("stop") => {
542 events.push(Ok(LanguageModelCompletionEvent::Stop(StopReason::EndTurn)));
543 }
544 Some("tool_calls") => {
545 events.extend(self.tool_calls_by_index.drain().map(|(_, tool_call)| {
546 match parse_tool_arguments(&tool_call.arguments) {
547 Ok(input) => Ok(LanguageModelCompletionEvent::ToolUse(
548 LanguageModelToolUse {
549 id: tool_call.id.clone().into(),
550 name: tool_call.name.as_str().into(),
551 is_input_complete: true,
552 input,
553 raw_input: tool_call.arguments.clone(),
554 thought_signature: None,
555 },
556 )),
557 Err(error) => Ok(LanguageModelCompletionEvent::ToolUseJsonParseError {
558 id: tool_call.id.clone().into(),
559 tool_name: tool_call.name.as_str().into(),
560 raw_input: tool_call.arguments.into(),
561 json_parse_error: error.to_string(),
562 }),
563 }
564 }));
565
566 events.push(Ok(LanguageModelCompletionEvent::Stop(StopReason::ToolUse)));
567 }
568 Some(stop_reason) => {
569 log::error!("Unexpected DeepSeek stop_reason: {stop_reason:?}",);
570 events.push(Ok(LanguageModelCompletionEvent::Stop(StopReason::EndTurn)));
571 }
572 None => {}
573 }
574
575 events
576 }
577}
578
/// Settings UI for entering or resetting the DeepSeek API key.
struct ConfigurationView {
    /// Input field the user types the API key into.
    api_key_editor: Entity<InputField>,
    /// Provider state; observed so the view re-renders when it changes.
    state: Entity<State>,
    /// `Some` while the initial credential load is running; the task clears
    /// it when done. Rendering shows a loading label while it is set.
    load_credentials_task: Option<Task<()>>,
}
584
585impl ConfigurationView {
586 fn new(state: Entity<State>, window: &mut Window, cx: &mut Context<Self>) -> Self {
587 let api_key_editor =
588 cx.new(|cx| InputField::new(window, cx, "sk-00000000000000000000000000000000"));
589
590 cx.observe(&state, |_, _, cx| {
591 cx.notify();
592 })
593 .detach();
594
595 let load_credentials_task = Some(cx.spawn({
596 let state = state.clone();
597 async move |this, cx| {
598 if let Some(task) = Some(state.update(cx, |state, cx| state.authenticate(cx))) {
599 let _ = task.await;
600 }
601
602 this.update(cx, |this, cx| {
603 this.load_credentials_task = None;
604 cx.notify();
605 })
606 .log_err();
607 }
608 }));
609
610 Self {
611 api_key_editor,
612 state,
613 load_credentials_task,
614 }
615 }
616
617 fn save_api_key(&mut self, _: &menu::Confirm, _window: &mut Window, cx: &mut Context<Self>) {
618 let api_key = self.api_key_editor.read(cx).text(cx).trim().to_string();
619 if api_key.is_empty() {
620 return;
621 }
622
623 let state = self.state.clone();
624 cx.spawn(async move |_, cx| {
625 state
626 .update(cx, |state, cx| state.set_api_key(Some(api_key), cx))
627 .await
628 })
629 .detach_and_log_err(cx);
630 }
631
632 fn reset_api_key(&mut self, window: &mut Window, cx: &mut Context<Self>) {
633 self.api_key_editor
634 .update(cx, |editor, cx| editor.set_text("", window, cx));
635
636 let state = self.state.clone();
637 cx.spawn(async move |_, cx| {
638 state
639 .update(cx, |state, cx| state.set_api_key(None, cx))
640 .await
641 })
642 .detach_and_log_err(cx);
643 }
644
645 fn should_render_editor(&self, cx: &mut Context<Self>) -> bool {
646 !self.state.read(cx).is_authenticated()
647 }
648}
649
650impl Render for ConfigurationView {
651 fn render(&mut self, _window: &mut Window, cx: &mut Context<Self>) -> impl IntoElement {
652 let env_var_set = self.state.read(cx).api_key_state.is_from_env_var();
653 let configured_card_label = if env_var_set {
654 format!("API key set in {API_KEY_ENV_VAR_NAME} environment variable")
655 } else {
656 let api_url = DeepSeekLanguageModelProvider::api_url(cx);
657 if api_url == DEEPSEEK_API_URL {
658 "API key configured".to_string()
659 } else {
660 format!("API key configured for {}", api_url)
661 }
662 };
663
664 if self.load_credentials_task.is_some() {
665 div()
666 .child(Label::new("Loading credentials..."))
667 .into_any_element()
668 } else if self.should_render_editor(cx) {
669 v_flex()
670 .size_full()
671 .on_action(cx.listener(Self::save_api_key))
672 .child(Label::new("To use DeepSeek in Zed, you need an API key:"))
673 .child(
674 List::new()
675 .child(
676 ListBulletItem::new("")
677 .child(Label::new("Get your API key from the"))
678 .child(ButtonLink::new(
679 "DeepSeek console",
680 "https://platform.deepseek.com/api_keys",
681 )),
682 )
683 .child(ListBulletItem::new(
684 "Paste your API key below and hit enter to start using the assistant",
685 )),
686 )
687 .child(self.api_key_editor.clone())
688 .child(
689 Label::new(format!(
690 "You can also set the {API_KEY_ENV_VAR_NAME} environment variable and restart Zed."
691 ))
692 .size(LabelSize::Small)
693 .color(Color::Muted),
694 )
695 .into_any_element()
696 } else {
697 ConfiguredApiCard::new(configured_card_label)
698 .disabled(env_var_set)
699 .on_click(cx.listener(|this, _, window, cx| this.reset_api_key(window, cx)))
700 .into_any_element()
701 }
702 }
703}