deepseek.rs

  1use anyhow::{Result, anyhow};
  2use collections::{BTreeMap, HashMap};
  3use credentials_provider::CredentialsProvider;
  4use deepseek::DEEPSEEK_API_URL;
  5
  6use futures::Stream;
  7use futures::{FutureExt, StreamExt, future::BoxFuture, stream::BoxStream};
  8use gpui::{AnyView, App, AsyncApp, Context, Entity, SharedString, Task, Window};
  9use http_client::HttpClient;
 10use language_model::{
 11    ApiKeyState, AuthenticateError, EnvVar, IconOrSvg, LanguageModel, LanguageModelCompletionError,
 12    LanguageModelCompletionEvent, LanguageModelId, LanguageModelName, LanguageModelProvider,
 13    LanguageModelProviderId, LanguageModelProviderName, LanguageModelProviderState,
 14    LanguageModelRequest, LanguageModelToolChoice, LanguageModelToolResultContent,
 15    LanguageModelToolUse, MessageContent, RateLimiter, Role, StopReason, TokenUsage, env_var,
 16};
 17pub use settings::DeepseekAvailableModel as AvailableModel;
 18use settings::{Settings, SettingsStore};
 19use std::pin::Pin;
 20use std::sync::{Arc, LazyLock};
 21
 22use ui::{ButtonLink, ConfiguredApiCard, List, ListBulletItem, prelude::*};
 23use ui_input::InputField;
 24use util::ResultExt;
 25
 26use language_model::util::{fix_streamed_json, parse_tool_arguments};
 27
 28const PROVIDER_ID: LanguageModelProviderId = LanguageModelProviderId::new("deepseek");
 29const PROVIDER_NAME: LanguageModelProviderName = LanguageModelProviderName::new("DeepSeek");
 30
 31const API_KEY_ENV_VAR_NAME: &str = "DEEPSEEK_API_KEY";
 32static API_KEY_ENV_VAR: LazyLock<EnvVar> = env_var!(API_KEY_ENV_VAR_NAME);
 33
 34#[derive(Default)]
 35struct RawToolCall {
 36    id: String,
 37    name: String,
 38    arguments: String,
 39}
 40
 41#[derive(Default, Clone, Debug, PartialEq)]
 42pub struct DeepSeekSettings {
 43    pub api_url: String,
 44    pub available_models: Vec<AvailableModel>,
 45}
 46pub struct DeepSeekLanguageModelProvider {
 47    http_client: Arc<dyn HttpClient>,
 48    state: Entity<State>,
 49}
 50
 51pub struct State {
 52    api_key_state: ApiKeyState,
 53    credentials_provider: Arc<dyn CredentialsProvider>,
 54}
 55
 56impl State {
 57    fn is_authenticated(&self) -> bool {
 58        self.api_key_state.has_key()
 59    }
 60
 61    fn set_api_key(&mut self, api_key: Option<String>, cx: &mut Context<Self>) -> Task<Result<()>> {
 62        let credentials_provider = self.credentials_provider.clone();
 63        let api_url = DeepSeekLanguageModelProvider::api_url(cx);
 64        self.api_key_state.store(
 65            api_url,
 66            api_key,
 67            |this| &mut this.api_key_state,
 68            credentials_provider,
 69            cx,
 70        )
 71    }
 72
 73    fn authenticate(&mut self, cx: &mut Context<Self>) -> Task<Result<(), AuthenticateError>> {
 74        let credentials_provider = self.credentials_provider.clone();
 75        let api_url = DeepSeekLanguageModelProvider::api_url(cx);
 76        self.api_key_state.load_if_needed(
 77            api_url,
 78            |this| &mut this.api_key_state,
 79            credentials_provider,
 80            cx,
 81        )
 82    }
 83}
 84
 85impl DeepSeekLanguageModelProvider {
 86    pub fn new(
 87        http_client: Arc<dyn HttpClient>,
 88        credentials_provider: Arc<dyn CredentialsProvider>,
 89        cx: &mut App,
 90    ) -> Self {
 91        let state = cx.new(|cx| {
 92            cx.observe_global::<SettingsStore>(|this: &mut State, cx| {
 93                let credentials_provider = this.credentials_provider.clone();
 94                let api_url = Self::api_url(cx);
 95                this.api_key_state.handle_url_change(
 96                    api_url,
 97                    |this| &mut this.api_key_state,
 98                    credentials_provider,
 99                    cx,
100                );
101                cx.notify();
102            })
103            .detach();
104            State {
105                api_key_state: ApiKeyState::new(Self::api_url(cx), (*API_KEY_ENV_VAR).clone()),
106                credentials_provider,
107            }
108        });
109
110        Self { http_client, state }
111    }
112
113    fn create_language_model(&self, model: deepseek::Model) -> Arc<dyn LanguageModel> {
114        Arc::new(DeepSeekLanguageModel {
115            id: LanguageModelId::from(model.id().to_string()),
116            model,
117            state: self.state.clone(),
118            http_client: self.http_client.clone(),
119            request_limiter: RateLimiter::new(4),
120        })
121    }
122
123    fn settings(cx: &App) -> &DeepSeekSettings {
124        &crate::AllLanguageModelSettings::get_global(cx).deepseek
125    }
126
127    fn api_url(cx: &App) -> SharedString {
128        let api_url = &Self::settings(cx).api_url;
129        if api_url.is_empty() {
130            DEEPSEEK_API_URL.into()
131        } else {
132            SharedString::new(api_url.as_str())
133        }
134    }
135}
136
137impl LanguageModelProviderState for DeepSeekLanguageModelProvider {
138    type ObservableEntity = State;
139
140    fn observable_entity(&self) -> Option<Entity<Self::ObservableEntity>> {
141        Some(self.state.clone())
142    }
143}
144
145impl LanguageModelProvider for DeepSeekLanguageModelProvider {
146    fn id(&self) -> LanguageModelProviderId {
147        PROVIDER_ID
148    }
149
150    fn name(&self) -> LanguageModelProviderName {
151        PROVIDER_NAME
152    }
153
154    fn icon(&self) -> IconOrSvg {
155        IconOrSvg::Icon(IconName::AiDeepSeek)
156    }
157
158    fn default_model(&self, _cx: &App) -> Option<Arc<dyn LanguageModel>> {
159        Some(self.create_language_model(deepseek::Model::default()))
160    }
161
162    fn default_fast_model(&self, _cx: &App) -> Option<Arc<dyn LanguageModel>> {
163        Some(self.create_language_model(deepseek::Model::default_fast()))
164    }
165
166    fn provided_models(&self, cx: &App) -> Vec<Arc<dyn LanguageModel>> {
167        let mut models = BTreeMap::default();
168
169        models.insert("deepseek-chat", deepseek::Model::Chat);
170        models.insert("deepseek-reasoner", deepseek::Model::Reasoner);
171
172        for available_model in &Self::settings(cx).available_models {
173            models.insert(
174                &available_model.name,
175                deepseek::Model::Custom {
176                    name: available_model.name.clone(),
177                    display_name: available_model.display_name.clone(),
178                    max_tokens: available_model.max_tokens,
179                    max_output_tokens: available_model.max_output_tokens,
180                },
181            );
182        }
183
184        models
185            .into_values()
186            .map(|model| self.create_language_model(model))
187            .collect()
188    }
189
190    fn is_authenticated(&self, cx: &App) -> bool {
191        self.state.read(cx).is_authenticated()
192    }
193
194    fn authenticate(&self, cx: &mut App) -> Task<Result<(), AuthenticateError>> {
195        self.state.update(cx, |state, cx| state.authenticate(cx))
196    }
197
198    fn configuration_view(
199        &self,
200        _target_agent: language_model::ConfigurationViewTargetAgent,
201        window: &mut Window,
202        cx: &mut App,
203    ) -> AnyView {
204        cx.new(|cx| ConfigurationView::new(self.state.clone(), window, cx))
205            .into()
206    }
207
208    fn reset_credentials(&self, cx: &mut App) -> Task<Result<()>> {
209        self.state
210            .update(cx, |state, cx| state.set_api_key(None, cx))
211    }
212}
213
214pub struct DeepSeekLanguageModel {
215    id: LanguageModelId,
216    model: deepseek::Model,
217    state: Entity<State>,
218    http_client: Arc<dyn HttpClient>,
219    request_limiter: RateLimiter,
220}
221
222impl DeepSeekLanguageModel {
223    fn stream_completion(
224        &self,
225        request: deepseek::Request,
226        cx: &AsyncApp,
227    ) -> BoxFuture<'static, Result<BoxStream<'static, Result<deepseek::StreamResponse>>>> {
228        let http_client = self.http_client.clone();
229
230        let (api_key, api_url) = self.state.read_with(cx, |state, cx| {
231            let api_url = DeepSeekLanguageModelProvider::api_url(cx);
232            (state.api_key_state.key(&api_url), api_url)
233        });
234
235        let future = self.request_limiter.stream(async move {
236            let Some(api_key) = api_key else {
237                return Err(LanguageModelCompletionError::NoApiKey {
238                    provider: PROVIDER_NAME,
239                });
240            };
241            let request =
242                deepseek::stream_completion(http_client.as_ref(), &api_url, &api_key, request);
243            let response = request.await?;
244            Ok(response)
245        });
246
247        async move { Ok(future.await?.boxed()) }.boxed()
248    }
249}
250
251impl LanguageModel for DeepSeekLanguageModel {
252    fn id(&self) -> LanguageModelId {
253        self.id.clone()
254    }
255
256    fn name(&self) -> LanguageModelName {
257        LanguageModelName::from(self.model.display_name().to_string())
258    }
259
260    fn provider_id(&self) -> LanguageModelProviderId {
261        PROVIDER_ID
262    }
263
264    fn provider_name(&self) -> LanguageModelProviderName {
265        PROVIDER_NAME
266    }
267
268    fn supports_tools(&self) -> bool {
269        true
270    }
271
272    fn supports_streaming_tools(&self) -> bool {
273        true
274    }
275
276    fn supports_tool_choice(&self, _choice: LanguageModelToolChoice) -> bool {
277        true
278    }
279
280    fn supports_images(&self) -> bool {
281        false
282    }
283
284    fn telemetry_id(&self) -> String {
285        format!("deepseek/{}", self.model.id())
286    }
287
288    fn max_token_count(&self) -> u64 {
289        self.model.max_token_count()
290    }
291
292    fn max_output_tokens(&self) -> Option<u64> {
293        self.model.max_output_tokens()
294    }
295
296    fn count_tokens(
297        &self,
298        request: LanguageModelRequest,
299        cx: &App,
300    ) -> BoxFuture<'static, Result<u64>> {
301        cx.background_spawn(async move {
302            let messages = request
303                .messages
304                .into_iter()
305                .map(|message| tiktoken_rs::ChatCompletionRequestMessage {
306                    role: match message.role {
307                        Role::User => "user".into(),
308                        Role::Assistant => "assistant".into(),
309                        Role::System => "system".into(),
310                    },
311                    content: Some(message.string_contents()),
312                    name: None,
313                    function_call: None,
314                })
315                .collect::<Vec<_>>();
316
317            tiktoken_rs::num_tokens_from_messages("gpt-4", &messages).map(|tokens| tokens as u64)
318        })
319        .boxed()
320    }
321
322    fn stream_completion(
323        &self,
324        request: LanguageModelRequest,
325        cx: &AsyncApp,
326    ) -> BoxFuture<
327        'static,
328        Result<
329            BoxStream<'static, Result<LanguageModelCompletionEvent, LanguageModelCompletionError>>,
330            LanguageModelCompletionError,
331        >,
332    > {
333        let request = into_deepseek(request, &self.model, self.max_output_tokens());
334        let stream = self.stream_completion(request, cx);
335
336        async move {
337            let mapper = DeepSeekEventMapper::new();
338            Ok(mapper.map_stream(stream.await?).boxed())
339        }
340        .boxed()
341    }
342}
343
344pub fn into_deepseek(
345    request: LanguageModelRequest,
346    model: &deepseek::Model,
347    max_output_tokens: Option<u64>,
348) -> deepseek::Request {
349    let is_reasoner = model == &deepseek::Model::Reasoner;
350
351    let mut messages = Vec::new();
352    let mut current_reasoning: Option<String> = None;
353
354    for message in request.messages {
355        for content in message.content {
356            match content {
357                MessageContent::Text(text) => {
358                    let should_add = if message.role == Role::User {
359                        !text.trim().is_empty()
360                    } else {
361                        !text.is_empty()
362                    };
363
364                    if should_add {
365                        messages.push(match message.role {
366                            Role::User => deepseek::RequestMessage::User { content: text },
367                            Role::Assistant => deepseek::RequestMessage::Assistant {
368                                content: Some(text),
369                                tool_calls: Vec::new(),
370                                reasoning_content: current_reasoning.take(),
371                            },
372                            Role::System => deepseek::RequestMessage::System { content: text },
373                        });
374                    }
375                }
376                MessageContent::Thinking { text, .. } => {
377                    // Accumulate reasoning content for next assistant message
378                    current_reasoning.get_or_insert_default().push_str(&text);
379                }
380                MessageContent::RedactedThinking(_) => {}
381                MessageContent::Image(_) => {}
382                MessageContent::ToolUse(tool_use) => {
383                    let tool_call = deepseek::ToolCall {
384                        id: tool_use.id.to_string(),
385                        content: deepseek::ToolCallContent::Function {
386                            function: deepseek::FunctionContent {
387                                name: tool_use.name.to_string(),
388                                arguments: serde_json::to_string(&tool_use.input)
389                                    .unwrap_or_default(),
390                            },
391                        },
392                    };
393
394                    if let Some(deepseek::RequestMessage::Assistant { tool_calls, .. }) =
395                        messages.last_mut()
396                    {
397                        tool_calls.push(tool_call);
398                    } else {
399                        messages.push(deepseek::RequestMessage::Assistant {
400                            content: None,
401                            tool_calls: vec![tool_call],
402                            reasoning_content: current_reasoning.take(),
403                        });
404                    }
405                }
406                MessageContent::ToolResult(tool_result) => {
407                    match &tool_result.content {
408                        LanguageModelToolResultContent::Text(text) => {
409                            messages.push(deepseek::RequestMessage::Tool {
410                                content: text.to_string(),
411                                tool_call_id: tool_result.tool_use_id.to_string(),
412                            });
413                        }
414                        LanguageModelToolResultContent::Image(_) => {}
415                    };
416                }
417            }
418        }
419    }
420
421    deepseek::Request {
422        model: model.id().to_string(),
423        messages,
424        stream: true,
425        max_tokens: max_output_tokens,
426        temperature: if is_reasoner {
427            None
428        } else {
429            request.temperature
430        },
431        response_format: None,
432        tools: request
433            .tools
434            .into_iter()
435            .map(|tool| deepseek::ToolDefinition::Function {
436                function: deepseek::FunctionDefinition {
437                    name: tool.name,
438                    description: Some(tool.description),
439                    parameters: Some(tool.input_schema),
440                },
441            })
442            .collect(),
443    }
444}
445
446pub struct DeepSeekEventMapper {
447    tool_calls_by_index: HashMap<usize, RawToolCall>,
448}
449
450impl DeepSeekEventMapper {
451    pub fn new() -> Self {
452        Self {
453            tool_calls_by_index: HashMap::default(),
454        }
455    }
456
457    pub fn map_stream(
458        mut self,
459        events: Pin<Box<dyn Send + Stream<Item = Result<deepseek::StreamResponse>>>>,
460    ) -> impl Stream<Item = Result<LanguageModelCompletionEvent, LanguageModelCompletionError>>
461    {
462        events.flat_map(move |event| {
463            futures::stream::iter(match event {
464                Ok(event) => self.map_event(event),
465                Err(error) => vec![Err(LanguageModelCompletionError::from(error))],
466            })
467        })
468    }
469
470    pub fn map_event(
471        &mut self,
472        event: deepseek::StreamResponse,
473    ) -> Vec<Result<LanguageModelCompletionEvent, LanguageModelCompletionError>> {
474        let Some(choice) = event.choices.first() else {
475            return vec![Err(LanguageModelCompletionError::from(anyhow!(
476                "Response contained no choices"
477            )))];
478        };
479
480        let mut events = Vec::new();
481        if let Some(content) = choice.delta.content.clone()
482            && !content.is_empty()
483        {
484            events.push(Ok(LanguageModelCompletionEvent::Text(content)));
485        }
486
487        if let Some(reasoning_content) = choice.delta.reasoning_content.clone() {
488            events.push(Ok(LanguageModelCompletionEvent::Thinking {
489                text: reasoning_content,
490                signature: None,
491            }));
492        }
493
494        if let Some(tool_calls) = choice.delta.tool_calls.as_ref() {
495            for tool_call in tool_calls {
496                let entry = self.tool_calls_by_index.entry(tool_call.index).or_default();
497
498                if let Some(tool_id) = tool_call.id.clone() {
499                    entry.id = tool_id;
500                }
501
502                if let Some(function) = tool_call.function.as_ref() {
503                    if let Some(name) = function.name.clone() {
504                        entry.name = name;
505                    }
506
507                    if let Some(arguments) = function.arguments.clone() {
508                        entry.arguments.push_str(&arguments);
509                    }
510                }
511
512                if !entry.id.is_empty() && !entry.name.is_empty() {
513                    if let Ok(input) = serde_json::from_str::<serde_json::Value>(
514                        &fix_streamed_json(&entry.arguments),
515                    ) {
516                        events.push(Ok(LanguageModelCompletionEvent::ToolUse(
517                            LanguageModelToolUse {
518                                id: entry.id.clone().into(),
519                                name: entry.name.as_str().into(),
520                                is_input_complete: false,
521                                input,
522                                raw_input: entry.arguments.clone(),
523                                thought_signature: None,
524                            },
525                        )));
526                    }
527                }
528            }
529        }
530
531        if let Some(usage) = event.usage {
532            events.push(Ok(LanguageModelCompletionEvent::UsageUpdate(TokenUsage {
533                input_tokens: usage.prompt_tokens,
534                output_tokens: usage.completion_tokens,
535                cache_creation_input_tokens: 0,
536                cache_read_input_tokens: 0,
537            })));
538        }
539
540        match choice.finish_reason.as_deref() {
541            Some("stop") => {
542                events.push(Ok(LanguageModelCompletionEvent::Stop(StopReason::EndTurn)));
543            }
544            Some("tool_calls") => {
545                events.extend(self.tool_calls_by_index.drain().map(|(_, tool_call)| {
546                    match parse_tool_arguments(&tool_call.arguments) {
547                        Ok(input) => Ok(LanguageModelCompletionEvent::ToolUse(
548                            LanguageModelToolUse {
549                                id: tool_call.id.clone().into(),
550                                name: tool_call.name.as_str().into(),
551                                is_input_complete: true,
552                                input,
553                                raw_input: tool_call.arguments.clone(),
554                                thought_signature: None,
555                            },
556                        )),
557                        Err(error) => Ok(LanguageModelCompletionEvent::ToolUseJsonParseError {
558                            id: tool_call.id.clone().into(),
559                            tool_name: tool_call.name.as_str().into(),
560                            raw_input: tool_call.arguments.into(),
561                            json_parse_error: error.to_string(),
562                        }),
563                    }
564                }));
565
566                events.push(Ok(LanguageModelCompletionEvent::Stop(StopReason::ToolUse)));
567            }
568            Some(stop_reason) => {
569                log::error!("Unexpected DeepSeek stop_reason: {stop_reason:?}",);
570                events.push(Ok(LanguageModelCompletionEvent::Stop(StopReason::EndTurn)));
571            }
572            None => {}
573        }
574
575        events
576    }
577}
578
579struct ConfigurationView {
580    api_key_editor: Entity<InputField>,
581    state: Entity<State>,
582    load_credentials_task: Option<Task<()>>,
583}
584
585impl ConfigurationView {
586    fn new(state: Entity<State>, window: &mut Window, cx: &mut Context<Self>) -> Self {
587        let api_key_editor =
588            cx.new(|cx| InputField::new(window, cx, "sk-00000000000000000000000000000000"));
589
590        cx.observe(&state, |_, _, cx| {
591            cx.notify();
592        })
593        .detach();
594
595        let load_credentials_task = Some(cx.spawn({
596            let state = state.clone();
597            async move |this, cx| {
598                if let Some(task) = Some(state.update(cx, |state, cx| state.authenticate(cx))) {
599                    let _ = task.await;
600                }
601
602                this.update(cx, |this, cx| {
603                    this.load_credentials_task = None;
604                    cx.notify();
605                })
606                .log_err();
607            }
608        }));
609
610        Self {
611            api_key_editor,
612            state,
613            load_credentials_task,
614        }
615    }
616
617    fn save_api_key(&mut self, _: &menu::Confirm, _window: &mut Window, cx: &mut Context<Self>) {
618        let api_key = self.api_key_editor.read(cx).text(cx).trim().to_string();
619        if api_key.is_empty() {
620            return;
621        }
622
623        let state = self.state.clone();
624        cx.spawn(async move |_, cx| {
625            state
626                .update(cx, |state, cx| state.set_api_key(Some(api_key), cx))
627                .await
628        })
629        .detach_and_log_err(cx);
630    }
631
632    fn reset_api_key(&mut self, window: &mut Window, cx: &mut Context<Self>) {
633        self.api_key_editor
634            .update(cx, |editor, cx| editor.set_text("", window, cx));
635
636        let state = self.state.clone();
637        cx.spawn(async move |_, cx| {
638            state
639                .update(cx, |state, cx| state.set_api_key(None, cx))
640                .await
641        })
642        .detach_and_log_err(cx);
643    }
644
645    fn should_render_editor(&self, cx: &mut Context<Self>) -> bool {
646        !self.state.read(cx).is_authenticated()
647    }
648}
649
650impl Render for ConfigurationView {
651    fn render(&mut self, _window: &mut Window, cx: &mut Context<Self>) -> impl IntoElement {
652        let env_var_set = self.state.read(cx).api_key_state.is_from_env_var();
653        let configured_card_label = if env_var_set {
654            format!("API key set in {API_KEY_ENV_VAR_NAME} environment variable")
655        } else {
656            let api_url = DeepSeekLanguageModelProvider::api_url(cx);
657            if api_url == DEEPSEEK_API_URL {
658                "API key configured".to_string()
659            } else {
660                format!("API key configured for {}", api_url)
661            }
662        };
663
664        if self.load_credentials_task.is_some() {
665            div()
666                .child(Label::new("Loading credentials..."))
667                .into_any_element()
668        } else if self.should_render_editor(cx) {
669            v_flex()
670                .size_full()
671                .on_action(cx.listener(Self::save_api_key))
672                .child(Label::new("To use DeepSeek in Zed, you need an API key:"))
673                .child(
674                    List::new()
675                        .child(
676                            ListBulletItem::new("")
677                                .child(Label::new("Get your API key from the"))
678                                .child(ButtonLink::new(
679                                    "DeepSeek console",
680                                    "https://platform.deepseek.com/api_keys",
681                                )),
682                        )
683                        .child(ListBulletItem::new(
684                            "Paste your API key below and hit enter to start using the assistant",
685                        )),
686                )
687                .child(self.api_key_editor.clone())
688                .child(
689                    Label::new(format!(
690                        "You can also set the {API_KEY_ENV_VAR_NAME} environment variable and restart Zed."
691                    ))
692                    .size(LabelSize::Small)
693                    .color(Color::Muted),
694                )
695                .into_any_element()
696        } else {
697            ConfiguredApiCard::new(configured_card_label)
698                .disabled(env_var_set)
699                .on_click(cx.listener(|this, _, window, cx| this.reset_api_key(window, cx)))
700                .into_any_element()
701        }
702    }
703}