deepseek.rs

  1use anyhow::{Result, anyhow};
  2use collections::{BTreeMap, HashMap};
  3use deepseek::DEEPSEEK_API_URL;
  4
  5use futures::Stream;
  6use futures::{FutureExt, StreamExt, future::BoxFuture, stream::BoxStream};
  7use gpui::{AnyView, App, AsyncApp, Context, Entity, SharedString, Task, Window};
  8use http_client::HttpClient;
  9use language_model::{
 10    ApiKeyState, AuthenticateError, EnvVar, IconOrSvg, LanguageModel, LanguageModelCompletionError,
 11    LanguageModelCompletionEvent, LanguageModelId, LanguageModelName, LanguageModelProvider,
 12    LanguageModelProviderId, LanguageModelProviderName, LanguageModelProviderState,
 13    LanguageModelRequest, LanguageModelToolChoice, LanguageModelToolResultContent,
 14    LanguageModelToolUse, MessageContent, RateLimiter, Role, StopReason, TokenUsage, env_var,
 15};
 16pub use settings::DeepseekAvailableModel as AvailableModel;
 17use settings::{Settings, SettingsStore};
 18use std::pin::Pin;
 19use std::sync::{Arc, LazyLock};
 20
 21use ui::{ButtonLink, ConfiguredApiCard, List, ListBulletItem, prelude::*};
 22use ui_input::InputField;
 23use util::ResultExt;
 24
 25use crate::provider::util::parse_tool_arguments;
 26
/// Provider identifier returned by `id()` / `provider_id()` in this file.
const PROVIDER_ID: LanguageModelProviderId = LanguageModelProviderId::new("deepseek");
/// Provider display name returned by `name()` / `provider_name()` in this file.
const PROVIDER_NAME: LanguageModelProviderName = LanguageModelProviderName::new("DeepSeek");

/// Name of the environment variable that can supply the API key.
const API_KEY_ENV_VAR_NAME: &str = "DEEPSEEK_API_KEY";
/// Lazily initialized `EnvVar` built from `API_KEY_ENV_VAR_NAME`; a clone is
/// handed to `ApiKeyState::new` when the provider state is created.
static API_KEY_ENV_VAR: LazyLock<EnvVar> = env_var!(API_KEY_ENV_VAR_NAME);
 32
/// Accumulator for a single tool call whose pieces arrive across several
/// streamed response chunks (filled in by `DeepSeekEventMapper::map_event`).
#[derive(Default)]
struct RawToolCall {
    /// Tool call id; stays empty until a chunk supplies one.
    id: String,
    /// Function name; stays empty until a chunk supplies one.
    name: String,
    /// Concatenation of every argument fragment received so far.
    arguments: String,
}
 39
/// DeepSeek-specific settings, read from `AllLanguageModelSettings::deepseek`.
#[derive(Default, Clone, Debug, PartialEq)]
pub struct DeepSeekSettings {
    /// API base URL; when empty, `DEEPSEEK_API_URL` is used instead.
    pub api_url: String,
    /// User-declared models offered in addition to the built-in ones.
    pub available_models: Vec<AvailableModel>,
}
/// Language model provider for DeepSeek.
pub struct DeepSeekLanguageModelProvider {
    /// HTTP client handed to every model this provider creates.
    http_client: Arc<dyn HttpClient>,
    /// Shared credential state, also exposed as the provider's observable entity.
    state: Entity<State>,
}
 49
/// Credential state shared by the provider, its models and the configuration view.
pub struct State {
    /// Tracks the API key for the currently configured API URL.
    api_key_state: ApiKeyState,
}
 53
 54impl State {
 55    fn is_authenticated(&self) -> bool {
 56        self.api_key_state.has_key()
 57    }
 58
 59    fn set_api_key(&mut self, api_key: Option<String>, cx: &mut Context<Self>) -> Task<Result<()>> {
 60        let api_url = DeepSeekLanguageModelProvider::api_url(cx);
 61        self.api_key_state
 62            .store(api_url, api_key, |this| &mut this.api_key_state, cx)
 63    }
 64
 65    fn authenticate(&mut self, cx: &mut Context<Self>) -> Task<Result<(), AuthenticateError>> {
 66        let api_url = DeepSeekLanguageModelProvider::api_url(cx);
 67        self.api_key_state
 68            .load_if_needed(api_url, |this| &mut this.api_key_state, cx)
 69    }
 70}
 71
 72impl DeepSeekLanguageModelProvider {
 73    pub fn new(http_client: Arc<dyn HttpClient>, cx: &mut App) -> Self {
 74        let state = cx.new(|cx| {
 75            cx.observe_global::<SettingsStore>(|this: &mut State, cx| {
 76                let api_url = Self::api_url(cx);
 77                this.api_key_state
 78                    .handle_url_change(api_url, |this| &mut this.api_key_state, cx);
 79                cx.notify();
 80            })
 81            .detach();
 82            State {
 83                api_key_state: ApiKeyState::new(Self::api_url(cx), (*API_KEY_ENV_VAR).clone()),
 84            }
 85        });
 86
 87        Self { http_client, state }
 88    }
 89
 90    fn create_language_model(&self, model: deepseek::Model) -> Arc<dyn LanguageModel> {
 91        Arc::new(DeepSeekLanguageModel {
 92            id: LanguageModelId::from(model.id().to_string()),
 93            model,
 94            state: self.state.clone(),
 95            http_client: self.http_client.clone(),
 96            request_limiter: RateLimiter::new(4),
 97        })
 98    }
 99
100    fn settings(cx: &App) -> &DeepSeekSettings {
101        &crate::AllLanguageModelSettings::get_global(cx).deepseek
102    }
103
104    fn api_url(cx: &App) -> SharedString {
105        let api_url = &Self::settings(cx).api_url;
106        if api_url.is_empty() {
107            DEEPSEEK_API_URL.into()
108        } else {
109            SharedString::new(api_url.as_str())
110        }
111    }
112}
113
114impl LanguageModelProviderState for DeepSeekLanguageModelProvider {
115    type ObservableEntity = State;
116
117    fn observable_entity(&self) -> Option<Entity<Self::ObservableEntity>> {
118        Some(self.state.clone())
119    }
120}
121
122impl LanguageModelProvider for DeepSeekLanguageModelProvider {
123    fn id(&self) -> LanguageModelProviderId {
124        PROVIDER_ID
125    }
126
127    fn name(&self) -> LanguageModelProviderName {
128        PROVIDER_NAME
129    }
130
131    fn icon(&self) -> IconOrSvg {
132        IconOrSvg::Icon(IconName::AiDeepSeek)
133    }
134
135    fn default_model(&self, _cx: &App) -> Option<Arc<dyn LanguageModel>> {
136        Some(self.create_language_model(deepseek::Model::default()))
137    }
138
139    fn default_fast_model(&self, _cx: &App) -> Option<Arc<dyn LanguageModel>> {
140        Some(self.create_language_model(deepseek::Model::default_fast()))
141    }
142
143    fn provided_models(&self, cx: &App) -> Vec<Arc<dyn LanguageModel>> {
144        let mut models = BTreeMap::default();
145
146        models.insert("deepseek-chat", deepseek::Model::Chat);
147        models.insert("deepseek-reasoner", deepseek::Model::Reasoner);
148
149        for available_model in &Self::settings(cx).available_models {
150            models.insert(
151                &available_model.name,
152                deepseek::Model::Custom {
153                    name: available_model.name.clone(),
154                    display_name: available_model.display_name.clone(),
155                    max_tokens: available_model.max_tokens,
156                    max_output_tokens: available_model.max_output_tokens,
157                },
158            );
159        }
160
161        models
162            .into_values()
163            .map(|model| self.create_language_model(model))
164            .collect()
165    }
166
167    fn is_authenticated(&self, cx: &App) -> bool {
168        self.state.read(cx).is_authenticated()
169    }
170
171    fn authenticate(&self, cx: &mut App) -> Task<Result<(), AuthenticateError>> {
172        self.state.update(cx, |state, cx| state.authenticate(cx))
173    }
174
175    fn configuration_view(
176        &self,
177        _target_agent: language_model::ConfigurationViewTargetAgent,
178        window: &mut Window,
179        cx: &mut App,
180    ) -> AnyView {
181        cx.new(|cx| ConfigurationView::new(self.state.clone(), window, cx))
182            .into()
183    }
184
185    fn reset_credentials(&self, cx: &mut App) -> Task<Result<()>> {
186        self.state
187            .update(cx, |state, cx| state.set_api_key(None, cx))
188    }
189}
190
/// A single DeepSeek model exposed through the `LanguageModel` trait.
pub struct DeepSeekLanguageModel {
    /// Identifier derived from `model.id()`.
    id: LanguageModelId,
    /// The underlying DeepSeek model description.
    model: deepseek::Model,
    /// Shared credential state; the API key is read from it for each request.
    state: Entity<State>,
    /// HTTP client used to issue completion requests.
    http_client: Arc<dyn HttpClient>,
    /// Limiter that completion requests are routed through (created with `4`;
    /// presumably the maximum number of concurrent requests — confirm).
    request_limiter: RateLimiter,
}
198
199impl DeepSeekLanguageModel {
200    fn stream_completion(
201        &self,
202        request: deepseek::Request,
203        cx: &AsyncApp,
204    ) -> BoxFuture<'static, Result<BoxStream<'static, Result<deepseek::StreamResponse>>>> {
205        let http_client = self.http_client.clone();
206
207        let (api_key, api_url) = self.state.read_with(cx, |state, cx| {
208            let api_url = DeepSeekLanguageModelProvider::api_url(cx);
209            (state.api_key_state.key(&api_url), api_url)
210        });
211
212        let future = self.request_limiter.stream(async move {
213            let Some(api_key) = api_key else {
214                return Err(LanguageModelCompletionError::NoApiKey {
215                    provider: PROVIDER_NAME,
216                });
217            };
218            let request =
219                deepseek::stream_completion(http_client.as_ref(), &api_url, &api_key, request);
220            let response = request.await?;
221            Ok(response)
222        });
223
224        async move { Ok(future.await?.boxed()) }.boxed()
225    }
226}
227
228impl LanguageModel for DeepSeekLanguageModel {
229    fn id(&self) -> LanguageModelId {
230        self.id.clone()
231    }
232
233    fn name(&self) -> LanguageModelName {
234        LanguageModelName::from(self.model.display_name().to_string())
235    }
236
237    fn provider_id(&self) -> LanguageModelProviderId {
238        PROVIDER_ID
239    }
240
241    fn provider_name(&self) -> LanguageModelProviderName {
242        PROVIDER_NAME
243    }
244
245    fn supports_tools(&self) -> bool {
246        true
247    }
248
249    fn supports_streaming_tools(&self) -> bool {
250        true
251    }
252
253    fn supports_tool_choice(&self, _choice: LanguageModelToolChoice) -> bool {
254        true
255    }
256
257    fn supports_images(&self) -> bool {
258        false
259    }
260
261    fn telemetry_id(&self) -> String {
262        format!("deepseek/{}", self.model.id())
263    }
264
265    fn max_token_count(&self) -> u64 {
266        self.model.max_token_count()
267    }
268
269    fn max_output_tokens(&self) -> Option<u64> {
270        self.model.max_output_tokens()
271    }
272
273    fn count_tokens(
274        &self,
275        request: LanguageModelRequest,
276        cx: &App,
277    ) -> BoxFuture<'static, Result<u64>> {
278        cx.background_spawn(async move {
279            let messages = request
280                .messages
281                .into_iter()
282                .map(|message| tiktoken_rs::ChatCompletionRequestMessage {
283                    role: match message.role {
284                        Role::User => "user".into(),
285                        Role::Assistant => "assistant".into(),
286                        Role::System => "system".into(),
287                    },
288                    content: Some(message.string_contents()),
289                    name: None,
290                    function_call: None,
291                })
292                .collect::<Vec<_>>();
293
294            tiktoken_rs::num_tokens_from_messages("gpt-4", &messages).map(|tokens| tokens as u64)
295        })
296        .boxed()
297    }
298
299    fn stream_completion(
300        &self,
301        request: LanguageModelRequest,
302        cx: &AsyncApp,
303    ) -> BoxFuture<
304        'static,
305        Result<
306            BoxStream<'static, Result<LanguageModelCompletionEvent, LanguageModelCompletionError>>,
307            LanguageModelCompletionError,
308        >,
309    > {
310        let request = into_deepseek(request, &self.model, self.max_output_tokens());
311        let stream = self.stream_completion(request, cx);
312
313        async move {
314            let mapper = DeepSeekEventMapper::new();
315            Ok(mapper.map_stream(stream.await?).boxed())
316        }
317        .boxed()
318    }
319}
320
321pub fn into_deepseek(
322    request: LanguageModelRequest,
323    model: &deepseek::Model,
324    max_output_tokens: Option<u64>,
325) -> deepseek::Request {
326    let is_reasoner = model == &deepseek::Model::Reasoner;
327
328    let mut messages = Vec::new();
329    let mut current_reasoning: Option<String> = None;
330
331    for message in request.messages {
332        for content in message.content {
333            match content {
334                MessageContent::Text(text) => messages.push(match message.role {
335                    Role::User => deepseek::RequestMessage::User { content: text },
336                    Role::Assistant => deepseek::RequestMessage::Assistant {
337                        content: Some(text),
338                        tool_calls: Vec::new(),
339                        reasoning_content: current_reasoning.take(),
340                    },
341                    Role::System => deepseek::RequestMessage::System { content: text },
342                }),
343                MessageContent::Thinking { text, .. } => {
344                    // Accumulate reasoning content for next assistant message
345                    current_reasoning.get_or_insert_default().push_str(&text);
346                }
347                MessageContent::RedactedThinking(_) => {}
348                MessageContent::Image(_) => {}
349                MessageContent::ToolUse(tool_use) => {
350                    let tool_call = deepseek::ToolCall {
351                        id: tool_use.id.to_string(),
352                        content: deepseek::ToolCallContent::Function {
353                            function: deepseek::FunctionContent {
354                                name: tool_use.name.to_string(),
355                                arguments: serde_json::to_string(&tool_use.input)
356                                    .unwrap_or_default(),
357                            },
358                        },
359                    };
360
361                    if let Some(deepseek::RequestMessage::Assistant { tool_calls, .. }) =
362                        messages.last_mut()
363                    {
364                        tool_calls.push(tool_call);
365                    } else {
366                        messages.push(deepseek::RequestMessage::Assistant {
367                            content: None,
368                            tool_calls: vec![tool_call],
369                            reasoning_content: current_reasoning.take(),
370                        });
371                    }
372                }
373                MessageContent::ToolResult(tool_result) => {
374                    match &tool_result.content {
375                        LanguageModelToolResultContent::Text(text) => {
376                            messages.push(deepseek::RequestMessage::Tool {
377                                content: text.to_string(),
378                                tool_call_id: tool_result.tool_use_id.to_string(),
379                            });
380                        }
381                        LanguageModelToolResultContent::Image(_) => {}
382                    };
383                }
384            }
385        }
386    }
387
388    deepseek::Request {
389        model: model.id().to_string(),
390        messages,
391        stream: true,
392        max_tokens: max_output_tokens,
393        temperature: if is_reasoner {
394            None
395        } else {
396            request.temperature
397        },
398        response_format: None,
399        tools: request
400            .tools
401            .into_iter()
402            .map(|tool| deepseek::ToolDefinition::Function {
403                function: deepseek::FunctionDefinition {
404                    name: tool.name,
405                    description: Some(tool.description),
406                    parameters: Some(tool.input_schema),
407                },
408            })
409            .collect(),
410    }
411}
412
/// Stateful converter from streamed DeepSeek responses to completion events.
pub struct DeepSeekEventMapper {
    /// Tool calls still being assembled, keyed by the `index` reported in the
    /// stream deltas.
    tool_calls_by_index: HashMap<usize, RawToolCall>,
}
416
417impl DeepSeekEventMapper {
418    pub fn new() -> Self {
419        Self {
420            tool_calls_by_index: HashMap::default(),
421        }
422    }
423
424    pub fn map_stream(
425        mut self,
426        events: Pin<Box<dyn Send + Stream<Item = Result<deepseek::StreamResponse>>>>,
427    ) -> impl Stream<Item = Result<LanguageModelCompletionEvent, LanguageModelCompletionError>>
428    {
429        events.flat_map(move |event| {
430            futures::stream::iter(match event {
431                Ok(event) => self.map_event(event),
432                Err(error) => vec![Err(LanguageModelCompletionError::from(error))],
433            })
434        })
435    }
436
437    pub fn map_event(
438        &mut self,
439        event: deepseek::StreamResponse,
440    ) -> Vec<Result<LanguageModelCompletionEvent, LanguageModelCompletionError>> {
441        let Some(choice) = event.choices.first() else {
442            return vec![Err(LanguageModelCompletionError::from(anyhow!(
443                "Response contained no choices"
444            )))];
445        };
446
447        let mut events = Vec::new();
448        if let Some(content) = choice.delta.content.clone() {
449            events.push(Ok(LanguageModelCompletionEvent::Text(content)));
450        }
451
452        if let Some(reasoning_content) = choice.delta.reasoning_content.clone() {
453            events.push(Ok(LanguageModelCompletionEvent::Thinking {
454                text: reasoning_content,
455                signature: None,
456            }));
457        }
458
459        if let Some(tool_calls) = choice.delta.tool_calls.as_ref() {
460            for tool_call in tool_calls {
461                let entry = self.tool_calls_by_index.entry(tool_call.index).or_default();
462
463                if let Some(tool_id) = tool_call.id.clone() {
464                    entry.id = tool_id;
465                }
466
467                if let Some(function) = tool_call.function.as_ref() {
468                    if let Some(name) = function.name.clone() {
469                        entry.name = name;
470                    }
471
472                    if let Some(arguments) = function.arguments.clone() {
473                        entry.arguments.push_str(&arguments);
474                    }
475                }
476
477                if !entry.id.is_empty() && !entry.name.is_empty() {
478                    if let Ok(input) = serde_json::from_str::<serde_json::Value>(
479                        &partial_json_fixer::fix_json(&entry.arguments),
480                    ) {
481                        events.push(Ok(LanguageModelCompletionEvent::ToolUse(
482                            LanguageModelToolUse {
483                                id: entry.id.clone().into(),
484                                name: entry.name.as_str().into(),
485                                is_input_complete: false,
486                                input,
487                                raw_input: entry.arguments.clone(),
488                                thought_signature: None,
489                            },
490                        )));
491                    }
492                }
493            }
494        }
495
496        if let Some(usage) = event.usage {
497            events.push(Ok(LanguageModelCompletionEvent::UsageUpdate(TokenUsage {
498                input_tokens: usage.prompt_tokens,
499                output_tokens: usage.completion_tokens,
500                cache_creation_input_tokens: 0,
501                cache_read_input_tokens: 0,
502            })));
503        }
504
505        match choice.finish_reason.as_deref() {
506            Some("stop") => {
507                events.push(Ok(LanguageModelCompletionEvent::Stop(StopReason::EndTurn)));
508            }
509            Some("tool_calls") => {
510                events.extend(self.tool_calls_by_index.drain().map(|(_, tool_call)| {
511                    match parse_tool_arguments(&tool_call.arguments) {
512                        Ok(input) => Ok(LanguageModelCompletionEvent::ToolUse(
513                            LanguageModelToolUse {
514                                id: tool_call.id.clone().into(),
515                                name: tool_call.name.as_str().into(),
516                                is_input_complete: true,
517                                input,
518                                raw_input: tool_call.arguments.clone(),
519                                thought_signature: None,
520                            },
521                        )),
522                        Err(error) => Ok(LanguageModelCompletionEvent::ToolUseJsonParseError {
523                            id: tool_call.id.clone().into(),
524                            tool_name: tool_call.name.as_str().into(),
525                            raw_input: tool_call.arguments.into(),
526                            json_parse_error: error.to_string(),
527                        }),
528                    }
529                }));
530
531                events.push(Ok(LanguageModelCompletionEvent::Stop(StopReason::ToolUse)));
532            }
533            Some(stop_reason) => {
534                log::error!("Unexpected DeepSeek stop_reason: {stop_reason:?}",);
535                events.push(Ok(LanguageModelCompletionEvent::Stop(StopReason::EndTurn)));
536            }
537            None => {}
538        }
539
540        events
541    }
542}
543
/// Settings UI for entering or resetting the DeepSeek API key.
struct ConfigurationView {
    /// Input field the user pastes the API key into.
    api_key_editor: Entity<InputField>,
    /// Shared credential state that this view observes and updates.
    state: Entity<State>,
    /// `Some` while the initial credential load is in flight; set back to
    /// `None` by that task when it finishes.
    load_credentials_task: Option<Task<()>>,
}
549
550impl ConfigurationView {
551    fn new(state: Entity<State>, window: &mut Window, cx: &mut Context<Self>) -> Self {
552        let api_key_editor =
553            cx.new(|cx| InputField::new(window, cx, "sk-00000000000000000000000000000000"));
554
555        cx.observe(&state, |_, _, cx| {
556            cx.notify();
557        })
558        .detach();
559
560        let load_credentials_task = Some(cx.spawn({
561            let state = state.clone();
562            async move |this, cx| {
563                if let Some(task) = Some(state.update(cx, |state, cx| state.authenticate(cx))) {
564                    let _ = task.await;
565                }
566
567                this.update(cx, |this, cx| {
568                    this.load_credentials_task = None;
569                    cx.notify();
570                })
571                .log_err();
572            }
573        }));
574
575        Self {
576            api_key_editor,
577            state,
578            load_credentials_task,
579        }
580    }
581
582    fn save_api_key(&mut self, _: &menu::Confirm, _window: &mut Window, cx: &mut Context<Self>) {
583        let api_key = self.api_key_editor.read(cx).text(cx).trim().to_string();
584        if api_key.is_empty() {
585            return;
586        }
587
588        let state = self.state.clone();
589        cx.spawn(async move |_, cx| {
590            state
591                .update(cx, |state, cx| state.set_api_key(Some(api_key), cx))
592                .await
593        })
594        .detach_and_log_err(cx);
595    }
596
597    fn reset_api_key(&mut self, window: &mut Window, cx: &mut Context<Self>) {
598        self.api_key_editor
599            .update(cx, |editor, cx| editor.set_text("", window, cx));
600
601        let state = self.state.clone();
602        cx.spawn(async move |_, cx| {
603            state
604                .update(cx, |state, cx| state.set_api_key(None, cx))
605                .await
606        })
607        .detach_and_log_err(cx);
608    }
609
610    fn should_render_editor(&self, cx: &mut Context<Self>) -> bool {
611        !self.state.read(cx).is_authenticated()
612    }
613}
614
615impl Render for ConfigurationView {
616    fn render(&mut self, _window: &mut Window, cx: &mut Context<Self>) -> impl IntoElement {
617        let env_var_set = self.state.read(cx).api_key_state.is_from_env_var();
618        let configured_card_label = if env_var_set {
619            format!("API key set in {API_KEY_ENV_VAR_NAME} environment variable")
620        } else {
621            let api_url = DeepSeekLanguageModelProvider::api_url(cx);
622            if api_url == DEEPSEEK_API_URL {
623                "API key configured".to_string()
624            } else {
625                format!("API key configured for {}", api_url)
626            }
627        };
628
629        if self.load_credentials_task.is_some() {
630            div()
631                .child(Label::new("Loading credentials..."))
632                .into_any_element()
633        } else if self.should_render_editor(cx) {
634            v_flex()
635                .size_full()
636                .on_action(cx.listener(Self::save_api_key))
637                .child(Label::new("To use DeepSeek in Zed, you need an API key:"))
638                .child(
639                    List::new()
640                        .child(
641                            ListBulletItem::new("")
642                                .child(Label::new("Get your API key from the"))
643                                .child(ButtonLink::new(
644                                    "DeepSeek console",
645                                    "https://platform.deepseek.com/api_keys",
646                                )),
647                        )
648                        .child(ListBulletItem::new(
649                            "Paste your API key below and hit enter to start using the assistant",
650                        )),
651                )
652                .child(self.api_key_editor.clone())
653                .child(
654                    Label::new(format!(
655                        "You can also set the {API_KEY_ENV_VAR_NAME} environment variable and restart Zed."
656                    ))
657                    .size(LabelSize::Small)
658                    .color(Color::Muted),
659                )
660                .into_any_element()
661        } else {
662            ConfiguredApiCard::new(configured_card_label)
663                .disabled(env_var_set)
664                .on_click(cx.listener(|this, _, window, cx| this.reset_api_key(window, cx)))
665                .into_any_element()
666        }
667    }
668}