deepseek.rs

  1use anyhow::{Result, anyhow};
  2use collections::{BTreeMap, HashMap};
  3use deepseek::DEEPSEEK_API_URL;
  4
  5use futures::Stream;
  6use futures::{FutureExt, StreamExt, future::BoxFuture, stream::BoxStream};
  7use gpui::{AnyView, App, AsyncApp, Context, Entity, SharedString, Task, Window};
  8use http_client::HttpClient;
  9use language_model::{
 10    ApiKeyState, AuthenticateError, EnvVar, IconOrSvg, LanguageModel, LanguageModelCompletionError,
 11    LanguageModelCompletionEvent, LanguageModelId, LanguageModelName, LanguageModelProvider,
 12    LanguageModelProviderId, LanguageModelProviderName, LanguageModelProviderState,
 13    LanguageModelRequest, LanguageModelToolChoice, LanguageModelToolResultContent,
 14    LanguageModelToolUse, MessageContent, RateLimiter, Role, StopReason, TokenUsage, env_var,
 15};
 16pub use settings::DeepseekAvailableModel as AvailableModel;
 17use settings::{Settings, SettingsStore};
 18use std::pin::Pin;
 19use std::sync::{Arc, LazyLock};
 20
 21use ui::{ButtonLink, ConfiguredApiCard, List, ListBulletItem, prelude::*};
 22use ui_input::InputField;
 23use util::ResultExt;
 24
 25use crate::provider::util::{fix_streamed_json, parse_tool_arguments};
 26
/// Identifier this provider reports from `LanguageModelProvider::id`.
const PROVIDER_ID: LanguageModelProviderId = LanguageModelProviderId::new("deepseek");
/// Display name this provider reports, also attached to `NoApiKey` errors.
const PROVIDER_NAME: LanguageModelProviderName = LanguageModelProviderName::new("DeepSeek");

/// Name of the environment variable that may hold the API key.
const API_KEY_ENV_VAR_NAME: &str = "DEEPSEEK_API_KEY";
/// Lazily-initialized `EnvVar` for `API_KEY_ENV_VAR_NAME`, built by the `env_var!` macro.
static API_KEY_ENV_VAR: LazyLock<EnvVar> = env_var!(API_KEY_ENV_VAR_NAME);
 32
/// Accumulator for one tool call whose pieces arrive spread over several stream chunks.
#[derive(Default)]
struct RawToolCall {
    /// Tool call id; stays empty until a chunk supplies one.
    id: String,
    /// Function name; stays empty until a chunk supplies one.
    name: String,
    /// Concatenation of every argument fragment received so far (possibly partial JSON).
    arguments: String,
}
 39
/// Settings for the DeepSeek provider.
#[derive(Default, Clone, Debug, PartialEq)]
pub struct DeepSeekSettings {
    /// API base URL override; when empty, `DEEPSEEK_API_URL` is used instead.
    pub api_url: String,
    /// Extra models that are offered in addition to the built-in ones.
    pub available_models: Vec<AvailableModel>,
}
/// Language model provider for DeepSeek.
pub struct DeepSeekLanguageModelProvider {
    /// HTTP client cloned into every model this provider creates.
    http_client: Arc<dyn HttpClient>,
    /// Credential state shared with the created models and the configuration view.
    state: Entity<State>,
}
 49
/// Observable state of the provider; currently just the API key bookkeeping.
pub struct State {
    /// Tracks the API key associated with the configured API URL.
    api_key_state: ApiKeyState,
}
 53
 54impl State {
 55    fn is_authenticated(&self) -> bool {
 56        self.api_key_state.has_key()
 57    }
 58
 59    fn set_api_key(&mut self, api_key: Option<String>, cx: &mut Context<Self>) -> Task<Result<()>> {
 60        let api_url = DeepSeekLanguageModelProvider::api_url(cx);
 61        self.api_key_state
 62            .store(api_url, api_key, |this| &mut this.api_key_state, cx)
 63    }
 64
 65    fn authenticate(&mut self, cx: &mut Context<Self>) -> Task<Result<(), AuthenticateError>> {
 66        let api_url = DeepSeekLanguageModelProvider::api_url(cx);
 67        self.api_key_state
 68            .load_if_needed(api_url, |this| &mut this.api_key_state, cx)
 69    }
 70}
 71
 72impl DeepSeekLanguageModelProvider {
 73    pub fn new(http_client: Arc<dyn HttpClient>, cx: &mut App) -> Self {
 74        let state = cx.new(|cx| {
 75            cx.observe_global::<SettingsStore>(|this: &mut State, cx| {
 76                let api_url = Self::api_url(cx);
 77                this.api_key_state
 78                    .handle_url_change(api_url, |this| &mut this.api_key_state, cx);
 79                cx.notify();
 80            })
 81            .detach();
 82            State {
 83                api_key_state: ApiKeyState::new(Self::api_url(cx), (*API_KEY_ENV_VAR).clone()),
 84            }
 85        });
 86
 87        Self { http_client, state }
 88    }
 89
 90    fn create_language_model(&self, model: deepseek::Model) -> Arc<dyn LanguageModel> {
 91        Arc::new(DeepSeekLanguageModel {
 92            id: LanguageModelId::from(model.id().to_string()),
 93            model,
 94            state: self.state.clone(),
 95            http_client: self.http_client.clone(),
 96            request_limiter: RateLimiter::new(4),
 97        })
 98    }
 99
100    fn settings(cx: &App) -> &DeepSeekSettings {
101        &crate::AllLanguageModelSettings::get_global(cx).deepseek
102    }
103
104    fn api_url(cx: &App) -> SharedString {
105        let api_url = &Self::settings(cx).api_url;
106        if api_url.is_empty() {
107            DEEPSEEK_API_URL.into()
108        } else {
109            SharedString::new(api_url.as_str())
110        }
111    }
112}
113
/// Exposes the provider's credential [`State`] as its observable entity.
impl LanguageModelProviderState for DeepSeekLanguageModelProvider {
    type ObservableEntity = State;

    /// Always returns a handle to the shared state entity.
    fn observable_entity(&self) -> Option<Entity<Self::ObservableEntity>> {
        Some(self.state.clone())
    }
}
121
122impl LanguageModelProvider for DeepSeekLanguageModelProvider {
123    fn id(&self) -> LanguageModelProviderId {
124        PROVIDER_ID
125    }
126
127    fn name(&self) -> LanguageModelProviderName {
128        PROVIDER_NAME
129    }
130
131    fn icon(&self) -> IconOrSvg {
132        IconOrSvg::Icon(IconName::AiDeepSeek)
133    }
134
135    fn default_model(&self, _cx: &App) -> Option<Arc<dyn LanguageModel>> {
136        Some(self.create_language_model(deepseek::Model::default()))
137    }
138
139    fn default_fast_model(&self, _cx: &App) -> Option<Arc<dyn LanguageModel>> {
140        Some(self.create_language_model(deepseek::Model::default_fast()))
141    }
142
143    fn provided_models(&self, cx: &App) -> Vec<Arc<dyn LanguageModel>> {
144        let mut models = BTreeMap::default();
145
146        models.insert("deepseek-chat", deepseek::Model::Chat);
147        models.insert("deepseek-reasoner", deepseek::Model::Reasoner);
148
149        for available_model in &Self::settings(cx).available_models {
150            models.insert(
151                &available_model.name,
152                deepseek::Model::Custom {
153                    name: available_model.name.clone(),
154                    display_name: available_model.display_name.clone(),
155                    max_tokens: available_model.max_tokens,
156                    max_output_tokens: available_model.max_output_tokens,
157                },
158            );
159        }
160
161        models
162            .into_values()
163            .map(|model| self.create_language_model(model))
164            .collect()
165    }
166
167    fn is_authenticated(&self, cx: &App) -> bool {
168        self.state.read(cx).is_authenticated()
169    }
170
171    fn authenticate(&self, cx: &mut App) -> Task<Result<(), AuthenticateError>> {
172        self.state.update(cx, |state, cx| state.authenticate(cx))
173    }
174
175    fn configuration_view(
176        &self,
177        _target_agent: language_model::ConfigurationViewTargetAgent,
178        window: &mut Window,
179        cx: &mut App,
180    ) -> AnyView {
181        cx.new(|cx| ConfigurationView::new(self.state.clone(), window, cx))
182            .into()
183    }
184
185    fn reset_credentials(&self, cx: &mut App) -> Task<Result<()>> {
186        self.state
187            .update(cx, |state, cx| state.set_api_key(None, cx))
188    }
189}
190
/// A single DeepSeek model exposed through the `LanguageModel` trait.
pub struct DeepSeekLanguageModel {
    /// Identifier derived from the model's id string.
    id: LanguageModelId,
    /// The underlying DeepSeek model description.
    model: deepseek::Model,
    /// Credential state shared with the provider.
    state: Entity<State>,
    /// HTTP client used for completion requests.
    http_client: Arc<dyn HttpClient>,
    /// Limiter that every streaming request is routed through.
    request_limiter: RateLimiter,
}
198
199impl DeepSeekLanguageModel {
200    fn stream_completion(
201        &self,
202        request: deepseek::Request,
203        cx: &AsyncApp,
204    ) -> BoxFuture<'static, Result<BoxStream<'static, Result<deepseek::StreamResponse>>>> {
205        let http_client = self.http_client.clone();
206
207        let (api_key, api_url) = self.state.read_with(cx, |state, cx| {
208            let api_url = DeepSeekLanguageModelProvider::api_url(cx);
209            (state.api_key_state.key(&api_url), api_url)
210        });
211
212        let future = self.request_limiter.stream(async move {
213            let Some(api_key) = api_key else {
214                return Err(LanguageModelCompletionError::NoApiKey {
215                    provider: PROVIDER_NAME,
216                });
217            };
218            let request =
219                deepseek::stream_completion(http_client.as_ref(), &api_url, &api_key, request);
220            let response = request.await?;
221            Ok(response)
222        });
223
224        async move { Ok(future.await?.boxed()) }.boxed()
225    }
226}
227
228impl LanguageModel for DeepSeekLanguageModel {
229    fn id(&self) -> LanguageModelId {
230        self.id.clone()
231    }
232
233    fn name(&self) -> LanguageModelName {
234        LanguageModelName::from(self.model.display_name().to_string())
235    }
236
237    fn provider_id(&self) -> LanguageModelProviderId {
238        PROVIDER_ID
239    }
240
241    fn provider_name(&self) -> LanguageModelProviderName {
242        PROVIDER_NAME
243    }
244
245    fn supports_tools(&self) -> bool {
246        true
247    }
248
249    fn supports_streaming_tools(&self) -> bool {
250        true
251    }
252
253    fn supports_tool_choice(&self, _choice: LanguageModelToolChoice) -> bool {
254        true
255    }
256
257    fn supports_images(&self) -> bool {
258        false
259    }
260
261    fn telemetry_id(&self) -> String {
262        format!("deepseek/{}", self.model.id())
263    }
264
265    fn max_token_count(&self) -> u64 {
266        self.model.max_token_count()
267    }
268
269    fn max_output_tokens(&self) -> Option<u64> {
270        self.model.max_output_tokens()
271    }
272
273    fn count_tokens(
274        &self,
275        request: LanguageModelRequest,
276        cx: &App,
277    ) -> BoxFuture<'static, Result<u64>> {
278        cx.background_spawn(async move {
279            let messages = request
280                .messages
281                .into_iter()
282                .map(|message| tiktoken_rs::ChatCompletionRequestMessage {
283                    role: match message.role {
284                        Role::User => "user".into(),
285                        Role::Assistant => "assistant".into(),
286                        Role::System => "system".into(),
287                    },
288                    content: Some(message.string_contents()),
289                    name: None,
290                    function_call: None,
291                })
292                .collect::<Vec<_>>();
293
294            tiktoken_rs::num_tokens_from_messages("gpt-4", &messages).map(|tokens| tokens as u64)
295        })
296        .boxed()
297    }
298
299    fn stream_completion(
300        &self,
301        request: LanguageModelRequest,
302        cx: &AsyncApp,
303    ) -> BoxFuture<
304        'static,
305        Result<
306            BoxStream<'static, Result<LanguageModelCompletionEvent, LanguageModelCompletionError>>,
307            LanguageModelCompletionError,
308        >,
309    > {
310        let request = into_deepseek(request, &self.model, self.max_output_tokens());
311        let stream = self.stream_completion(request, cx);
312
313        async move {
314            let mapper = DeepSeekEventMapper::new();
315            Ok(mapper.map_stream(stream.await?).boxed())
316        }
317        .boxed()
318    }
319}
320
321pub fn into_deepseek(
322    request: LanguageModelRequest,
323    model: &deepseek::Model,
324    max_output_tokens: Option<u64>,
325) -> deepseek::Request {
326    let is_reasoner = model == &deepseek::Model::Reasoner;
327
328    let mut messages = Vec::new();
329    let mut current_reasoning: Option<String> = None;
330
331    for message in request.messages {
332        for content in message.content {
333            match content {
334                MessageContent::Text(text) => {
335                    let should_add = if message.role == Role::User {
336                        !text.trim().is_empty()
337                    } else {
338                        !text.is_empty()
339                    };
340
341                    if should_add {
342                        messages.push(match message.role {
343                            Role::User => deepseek::RequestMessage::User { content: text },
344                            Role::Assistant => deepseek::RequestMessage::Assistant {
345                                content: Some(text),
346                                tool_calls: Vec::new(),
347                                reasoning_content: current_reasoning.take(),
348                            },
349                            Role::System => deepseek::RequestMessage::System { content: text },
350                        });
351                    }
352                }
353                MessageContent::Thinking { text, .. } => {
354                    // Accumulate reasoning content for next assistant message
355                    current_reasoning.get_or_insert_default().push_str(&text);
356                }
357                MessageContent::RedactedThinking(_) => {}
358                MessageContent::Image(_) => {}
359                MessageContent::ToolUse(tool_use) => {
360                    let tool_call = deepseek::ToolCall {
361                        id: tool_use.id.to_string(),
362                        content: deepseek::ToolCallContent::Function {
363                            function: deepseek::FunctionContent {
364                                name: tool_use.name.to_string(),
365                                arguments: serde_json::to_string(&tool_use.input)
366                                    .unwrap_or_default(),
367                            },
368                        },
369                    };
370
371                    if let Some(deepseek::RequestMessage::Assistant { tool_calls, .. }) =
372                        messages.last_mut()
373                    {
374                        tool_calls.push(tool_call);
375                    } else {
376                        messages.push(deepseek::RequestMessage::Assistant {
377                            content: None,
378                            tool_calls: vec![tool_call],
379                            reasoning_content: current_reasoning.take(),
380                        });
381                    }
382                }
383                MessageContent::ToolResult(tool_result) => {
384                    match &tool_result.content {
385                        LanguageModelToolResultContent::Text(text) => {
386                            messages.push(deepseek::RequestMessage::Tool {
387                                content: text.to_string(),
388                                tool_call_id: tool_result.tool_use_id.to_string(),
389                            });
390                        }
391                        LanguageModelToolResultContent::Image(_) => {}
392                    };
393                }
394            }
395        }
396    }
397
398    deepseek::Request {
399        model: model.id().to_string(),
400        messages,
401        stream: true,
402        max_tokens: max_output_tokens,
403        temperature: if is_reasoner {
404            None
405        } else {
406            request.temperature
407        },
408        response_format: None,
409        tools: request
410            .tools
411            .into_iter()
412            .map(|tool| deepseek::ToolDefinition::Function {
413                function: deepseek::FunctionDefinition {
414                    name: tool.name,
415                    description: Some(tool.description),
416                    parameters: Some(tool.input_schema),
417                },
418            })
419            .collect(),
420    }
421}
422
/// Stateful translator from raw DeepSeek stream responses to completion events.
pub struct DeepSeekEventMapper {
    /// Tool calls still being assembled, keyed by the index reported in the stream.
    tool_calls_by_index: HashMap<usize, RawToolCall>,
}
426
427impl DeepSeekEventMapper {
428    pub fn new() -> Self {
429        Self {
430            tool_calls_by_index: HashMap::default(),
431        }
432    }
433
434    pub fn map_stream(
435        mut self,
436        events: Pin<Box<dyn Send + Stream<Item = Result<deepseek::StreamResponse>>>>,
437    ) -> impl Stream<Item = Result<LanguageModelCompletionEvent, LanguageModelCompletionError>>
438    {
439        events.flat_map(move |event| {
440            futures::stream::iter(match event {
441                Ok(event) => self.map_event(event),
442                Err(error) => vec![Err(LanguageModelCompletionError::from(error))],
443            })
444        })
445    }
446
447    pub fn map_event(
448        &mut self,
449        event: deepseek::StreamResponse,
450    ) -> Vec<Result<LanguageModelCompletionEvent, LanguageModelCompletionError>> {
451        let Some(choice) = event.choices.first() else {
452            return vec![Err(LanguageModelCompletionError::from(anyhow!(
453                "Response contained no choices"
454            )))];
455        };
456
457        let mut events = Vec::new();
458        if let Some(content) = choice.delta.content.clone()
459            && !content.is_empty()
460        {
461            events.push(Ok(LanguageModelCompletionEvent::Text(content)));
462        }
463
464        if let Some(reasoning_content) = choice.delta.reasoning_content.clone() {
465            events.push(Ok(LanguageModelCompletionEvent::Thinking {
466                text: reasoning_content,
467                signature: None,
468            }));
469        }
470
471        if let Some(tool_calls) = choice.delta.tool_calls.as_ref() {
472            for tool_call in tool_calls {
473                let entry = self.tool_calls_by_index.entry(tool_call.index).or_default();
474
475                if let Some(tool_id) = tool_call.id.clone() {
476                    entry.id = tool_id;
477                }
478
479                if let Some(function) = tool_call.function.as_ref() {
480                    if let Some(name) = function.name.clone() {
481                        entry.name = name;
482                    }
483
484                    if let Some(arguments) = function.arguments.clone() {
485                        entry.arguments.push_str(&arguments);
486                    }
487                }
488
489                if !entry.id.is_empty() && !entry.name.is_empty() {
490                    if let Ok(input) = serde_json::from_str::<serde_json::Value>(
491                        &fix_streamed_json(&entry.arguments),
492                    ) {
493                        events.push(Ok(LanguageModelCompletionEvent::ToolUse(
494                            LanguageModelToolUse {
495                                id: entry.id.clone().into(),
496                                name: entry.name.as_str().into(),
497                                is_input_complete: false,
498                                input,
499                                raw_input: entry.arguments.clone(),
500                                thought_signature: None,
501                            },
502                        )));
503                    }
504                }
505            }
506        }
507
508        if let Some(usage) = event.usage {
509            events.push(Ok(LanguageModelCompletionEvent::UsageUpdate(TokenUsage {
510                input_tokens: usage.prompt_tokens,
511                output_tokens: usage.completion_tokens,
512                cache_creation_input_tokens: 0,
513                cache_read_input_tokens: 0,
514            })));
515        }
516
517        match choice.finish_reason.as_deref() {
518            Some("stop") => {
519                events.push(Ok(LanguageModelCompletionEvent::Stop(StopReason::EndTurn)));
520            }
521            Some("tool_calls") => {
522                events.extend(self.tool_calls_by_index.drain().map(|(_, tool_call)| {
523                    match parse_tool_arguments(&tool_call.arguments) {
524                        Ok(input) => Ok(LanguageModelCompletionEvent::ToolUse(
525                            LanguageModelToolUse {
526                                id: tool_call.id.clone().into(),
527                                name: tool_call.name.as_str().into(),
528                                is_input_complete: true,
529                                input,
530                                raw_input: tool_call.arguments.clone(),
531                                thought_signature: None,
532                            },
533                        )),
534                        Err(error) => Ok(LanguageModelCompletionEvent::ToolUseJsonParseError {
535                            id: tool_call.id.clone().into(),
536                            tool_name: tool_call.name.as_str().into(),
537                            raw_input: tool_call.arguments.into(),
538                            json_parse_error: error.to_string(),
539                        }),
540                    }
541                }));
542
543                events.push(Ok(LanguageModelCompletionEvent::Stop(StopReason::ToolUse)));
544            }
545            Some(stop_reason) => {
546                log::error!("Unexpected DeepSeek stop_reason: {stop_reason:?}",);
547                events.push(Ok(LanguageModelCompletionEvent::Stop(StopReason::EndTurn)));
548            }
549            None => {}
550        }
551
552        events
553    }
554}
555
/// View for entering, displaying and resetting the DeepSeek API key.
struct ConfigurationView {
    /// Input field the user types the API key into.
    api_key_editor: Entity<InputField>,
    /// Credential state shared with the provider.
    state: Entity<State>,
    /// Present while the initial credential load is running; `None` afterwards.
    load_credentials_task: Option<Task<()>>,
}
561
562impl ConfigurationView {
563    fn new(state: Entity<State>, window: &mut Window, cx: &mut Context<Self>) -> Self {
564        let api_key_editor =
565            cx.new(|cx| InputField::new(window, cx, "sk-00000000000000000000000000000000"));
566
567        cx.observe(&state, |_, _, cx| {
568            cx.notify();
569        })
570        .detach();
571
572        let load_credentials_task = Some(cx.spawn({
573            let state = state.clone();
574            async move |this, cx| {
575                if let Some(task) = Some(state.update(cx, |state, cx| state.authenticate(cx))) {
576                    let _ = task.await;
577                }
578
579                this.update(cx, |this, cx| {
580                    this.load_credentials_task = None;
581                    cx.notify();
582                })
583                .log_err();
584            }
585        }));
586
587        Self {
588            api_key_editor,
589            state,
590            load_credentials_task,
591        }
592    }
593
594    fn save_api_key(&mut self, _: &menu::Confirm, _window: &mut Window, cx: &mut Context<Self>) {
595        let api_key = self.api_key_editor.read(cx).text(cx).trim().to_string();
596        if api_key.is_empty() {
597            return;
598        }
599
600        let state = self.state.clone();
601        cx.spawn(async move |_, cx| {
602            state
603                .update(cx, |state, cx| state.set_api_key(Some(api_key), cx))
604                .await
605        })
606        .detach_and_log_err(cx);
607    }
608
609    fn reset_api_key(&mut self, window: &mut Window, cx: &mut Context<Self>) {
610        self.api_key_editor
611            .update(cx, |editor, cx| editor.set_text("", window, cx));
612
613        let state = self.state.clone();
614        cx.spawn(async move |_, cx| {
615            state
616                .update(cx, |state, cx| state.set_api_key(None, cx))
617                .await
618        })
619        .detach_and_log_err(cx);
620    }
621
622    fn should_render_editor(&self, cx: &mut Context<Self>) -> bool {
623        !self.state.read(cx).is_authenticated()
624    }
625}
626
627impl Render for ConfigurationView {
628    fn render(&mut self, _window: &mut Window, cx: &mut Context<Self>) -> impl IntoElement {
629        let env_var_set = self.state.read(cx).api_key_state.is_from_env_var();
630        let configured_card_label = if env_var_set {
631            format!("API key set in {API_KEY_ENV_VAR_NAME} environment variable")
632        } else {
633            let api_url = DeepSeekLanguageModelProvider::api_url(cx);
634            if api_url == DEEPSEEK_API_URL {
635                "API key configured".to_string()
636            } else {
637                format!("API key configured for {}", api_url)
638            }
639        };
640
641        if self.load_credentials_task.is_some() {
642            div()
643                .child(Label::new("Loading credentials..."))
644                .into_any_element()
645        } else if self.should_render_editor(cx) {
646            v_flex()
647                .size_full()
648                .on_action(cx.listener(Self::save_api_key))
649                .child(Label::new("To use DeepSeek in Zed, you need an API key:"))
650                .child(
651                    List::new()
652                        .child(
653                            ListBulletItem::new("")
654                                .child(Label::new("Get your API key from the"))
655                                .child(ButtonLink::new(
656                                    "DeepSeek console",
657                                    "https://platform.deepseek.com/api_keys",
658                                )),
659                        )
660                        .child(ListBulletItem::new(
661                            "Paste your API key below and hit enter to start using the assistant",
662                        )),
663                )
664                .child(self.api_key_editor.clone())
665                .child(
666                    Label::new(format!(
667                        "You can also set the {API_KEY_ENV_VAR_NAME} environment variable and restart Zed."
668                    ))
669                    .size(LabelSize::Small)
670                    .color(Color::Muted),
671                )
672                .into_any_element()
673        } else {
674            ConfiguredApiCard::new(configured_card_label)
675                .disabled(env_var_set)
676                .on_click(cx.listener(|this, _, window, cx| this.reset_api_key(window, cx)))
677                .into_any_element()
678        }
679    }
680}