deepseek.rs

  1use anyhow::{Result, anyhow};
  2use collections::{BTreeMap, HashMap};
  3use deepseek::DEEPSEEK_API_URL;
  4use editor::{Editor, EditorElement, EditorStyle};
  5use futures::Stream;
  6use futures::{FutureExt, StreamExt, future, future::BoxFuture, stream::BoxStream};
  7use gpui::{
  8    AnyView, App, AsyncApp, Context, Entity, FontStyle, SharedString, Task, TextStyle, WhiteSpace,
  9    Window,
 10};
 11use http_client::HttpClient;
 12use language_model::{
 13    AuthenticateError, LanguageModel, LanguageModelCompletionError, LanguageModelCompletionEvent,
 14    LanguageModelId, LanguageModelName, LanguageModelProvider, LanguageModelProviderId,
 15    LanguageModelProviderName, LanguageModelProviderState, LanguageModelRequest,
 16    LanguageModelToolChoice, LanguageModelToolResultContent, LanguageModelToolUse, MessageContent,
 17    RateLimiter, Role, StopReason, TokenUsage,
 18};
 19pub use settings::DeepseekAvailableModel as AvailableModel;
 20use settings::{Settings, SettingsStore};
 21use std::pin::Pin;
 22use std::str::FromStr;
 23use std::sync::{Arc, LazyLock};
 24use theme::ThemeSettings;
 25use ui::{Icon, IconName, List, prelude::*};
 26use util::{ResultExt, truncate_and_trailoff};
 27use zed_env_vars::{EnvVar, env_var};
 28
 29use crate::{api_key::ApiKeyState, ui::InstructionListItem};
 30
// Identifier and display name reported by both the provider and every model it creates.
const PROVIDER_ID: LanguageModelProviderId = LanguageModelProviderId::new("deepseek");
const PROVIDER_NAME: LanguageModelProviderName = LanguageModelProviderName::new("DeepSeek");

// Name of the environment variable that can supply the API key; also shown in the
// configuration view.
const API_KEY_ENV_VAR_NAME: &str = "DEEPSEEK_API_KEY";
// Lazily initialized handle for that variable, passed to the API key state when loading
// credentials and when the API URL changes.
static API_KEY_ENV_VAR: LazyLock<EnvVar> = env_var!(API_KEY_ENV_VAR_NAME);
 36
/// A tool call being assembled from streamed response deltas.
///
/// `DeepSeekEventMapper` keeps one of these per tool-call index and turns it into a
/// completion event once the stream reports the `tool_calls` finish reason.
#[derive(Default)]
struct RawToolCall {
    /// Tool call id; overwritten whenever a delta carries one.
    id: String,
    /// Tool (function) name; overwritten whenever a delta carries one.
    name: String,
    /// Argument text, built by appending each delta's fragment; parsed as JSON at the end.
    arguments: String,
}
 43
/// User-configurable settings for the DeepSeek provider.
#[derive(Default, Clone, Debug, PartialEq)]
pub struct DeepSeekSettings {
    /// API base URL. When empty, the provider falls back to `DEEPSEEK_API_URL`.
    pub api_url: String,
    /// Extra models exposed alongside the built-in ones, as custom models keyed by name.
    pub available_models: Vec<AvailableModel>,
}
/// Language model provider for DeepSeek.
pub struct DeepSeekLanguageModelProvider {
    /// HTTP client cloned into every model this provider creates.
    http_client: Arc<dyn HttpClient>,
    /// API key state shared with the created models and the configuration view.
    state: Entity<State>,
}
 53
 54pub struct State {
 55    api_key_state: ApiKeyState,
 56}
 57
 58impl State {
 59    fn is_authenticated(&self) -> bool {
 60        self.api_key_state.has_key()
 61    }
 62
 63    fn set_api_key(&mut self, api_key: Option<String>, cx: &mut Context<Self>) -> Task<Result<()>> {
 64        let api_url = DeepSeekLanguageModelProvider::api_url(cx);
 65        self.api_key_state
 66            .store(api_url, api_key, |this| &mut this.api_key_state, cx)
 67    }
 68
 69    fn authenticate(&mut self, cx: &mut Context<Self>) -> Task<Result<(), AuthenticateError>> {
 70        let api_url = DeepSeekLanguageModelProvider::api_url(cx);
 71        self.api_key_state.load_if_needed(
 72            api_url,
 73            &API_KEY_ENV_VAR,
 74            |this| &mut this.api_key_state,
 75            cx,
 76        )
 77    }
 78}
 79
 80impl DeepSeekLanguageModelProvider {
 81    pub fn new(http_client: Arc<dyn HttpClient>, cx: &mut App) -> Self {
 82        let state = cx.new(|cx| {
 83            cx.observe_global::<SettingsStore>(|this: &mut State, cx| {
 84                let api_url = Self::api_url(cx);
 85                this.api_key_state.handle_url_change(
 86                    api_url,
 87                    &API_KEY_ENV_VAR,
 88                    |this| &mut this.api_key_state,
 89                    cx,
 90                );
 91                cx.notify();
 92            })
 93            .detach();
 94            State {
 95                api_key_state: ApiKeyState::new(Self::api_url(cx)),
 96            }
 97        });
 98
 99        Self { http_client, state }
100    }
101
102    fn create_language_model(&self, model: deepseek::Model) -> Arc<dyn LanguageModel> {
103        Arc::new(DeepSeekLanguageModel {
104            id: LanguageModelId::from(model.id().to_string()),
105            model,
106            state: self.state.clone(),
107            http_client: self.http_client.clone(),
108            request_limiter: RateLimiter::new(4),
109        })
110    }
111
112    fn settings(cx: &App) -> &DeepSeekSettings {
113        &crate::AllLanguageModelSettings::get_global(cx).deepseek
114    }
115
116    fn api_url(cx: &App) -> SharedString {
117        let api_url = &Self::settings(cx).api_url;
118        if api_url.is_empty() {
119            DEEPSEEK_API_URL.into()
120        } else {
121            SharedString::new(api_url.as_str())
122        }
123    }
124}
125
126impl LanguageModelProviderState for DeepSeekLanguageModelProvider {
127    type ObservableEntity = State;
128
129    fn observable_entity(&self) -> Option<Entity<Self::ObservableEntity>> {
130        Some(self.state.clone())
131    }
132}
133
134impl LanguageModelProvider for DeepSeekLanguageModelProvider {
135    fn id(&self) -> LanguageModelProviderId {
136        PROVIDER_ID
137    }
138
139    fn name(&self) -> LanguageModelProviderName {
140        PROVIDER_NAME
141    }
142
143    fn icon(&self) -> IconName {
144        IconName::AiDeepSeek
145    }
146
147    fn default_model(&self, _cx: &App) -> Option<Arc<dyn LanguageModel>> {
148        Some(self.create_language_model(deepseek::Model::default()))
149    }
150
151    fn default_fast_model(&self, _cx: &App) -> Option<Arc<dyn LanguageModel>> {
152        Some(self.create_language_model(deepseek::Model::default_fast()))
153    }
154
155    fn provided_models(&self, cx: &App) -> Vec<Arc<dyn LanguageModel>> {
156        let mut models = BTreeMap::default();
157
158        models.insert("deepseek-chat", deepseek::Model::Chat);
159        models.insert("deepseek-reasoner", deepseek::Model::Reasoner);
160
161        for available_model in &Self::settings(cx).available_models {
162            models.insert(
163                &available_model.name,
164                deepseek::Model::Custom {
165                    name: available_model.name.clone(),
166                    display_name: available_model.display_name.clone(),
167                    max_tokens: available_model.max_tokens,
168                    max_output_tokens: available_model.max_output_tokens,
169                },
170            );
171        }
172
173        models
174            .into_values()
175            .map(|model| self.create_language_model(model))
176            .collect()
177    }
178
179    fn is_authenticated(&self, cx: &App) -> bool {
180        self.state.read(cx).is_authenticated()
181    }
182
183    fn authenticate(&self, cx: &mut App) -> Task<Result<(), AuthenticateError>> {
184        self.state.update(cx, |state, cx| state.authenticate(cx))
185    }
186
187    fn configuration_view(
188        &self,
189        _target_agent: language_model::ConfigurationViewTargetAgent,
190        window: &mut Window,
191        cx: &mut App,
192    ) -> AnyView {
193        cx.new(|cx| ConfigurationView::new(self.state.clone(), window, cx))
194            .into()
195    }
196
197    fn reset_credentials(&self, cx: &mut App) -> Task<Result<()>> {
198        self.state
199            .update(cx, |state, cx| state.set_api_key(None, cx))
200    }
201}
202
203pub struct DeepSeekLanguageModel {
204    id: LanguageModelId,
205    model: deepseek::Model,
206    state: Entity<State>,
207    http_client: Arc<dyn HttpClient>,
208    request_limiter: RateLimiter,
209}
210
211impl DeepSeekLanguageModel {
212    fn stream_completion(
213        &self,
214        request: deepseek::Request,
215        cx: &AsyncApp,
216    ) -> BoxFuture<'static, Result<BoxStream<'static, Result<deepseek::StreamResponse>>>> {
217        let http_client = self.http_client.clone();
218
219        let Ok((api_key, api_url)) = self.state.read_with(cx, |state, cx| {
220            let api_url = DeepSeekLanguageModelProvider::api_url(cx);
221            (state.api_key_state.key(&api_url), api_url)
222        }) else {
223            return future::ready(Err(anyhow!("App state dropped"))).boxed();
224        };
225
226        let future = self.request_limiter.stream(async move {
227            let Some(api_key) = api_key else {
228                return Err(LanguageModelCompletionError::NoApiKey {
229                    provider: PROVIDER_NAME,
230                });
231            };
232            let request =
233                deepseek::stream_completion(http_client.as_ref(), &api_url, &api_key, request);
234            let response = request.await?;
235            Ok(response)
236        });
237
238        async move { Ok(future.await?.boxed()) }.boxed()
239    }
240}
241
242impl LanguageModel for DeepSeekLanguageModel {
243    fn id(&self) -> LanguageModelId {
244        self.id.clone()
245    }
246
247    fn name(&self) -> LanguageModelName {
248        LanguageModelName::from(self.model.display_name().to_string())
249    }
250
251    fn provider_id(&self) -> LanguageModelProviderId {
252        PROVIDER_ID
253    }
254
255    fn provider_name(&self) -> LanguageModelProviderName {
256        PROVIDER_NAME
257    }
258
259    fn supports_tools(&self) -> bool {
260        true
261    }
262
263    fn supports_tool_choice(&self, _choice: LanguageModelToolChoice) -> bool {
264        true
265    }
266
267    fn supports_images(&self) -> bool {
268        false
269    }
270
271    fn telemetry_id(&self) -> String {
272        format!("deepseek/{}", self.model.id())
273    }
274
275    fn max_token_count(&self) -> u64 {
276        self.model.max_token_count()
277    }
278
279    fn max_output_tokens(&self) -> Option<u64> {
280        self.model.max_output_tokens()
281    }
282
283    fn count_tokens(
284        &self,
285        request: LanguageModelRequest,
286        cx: &App,
287    ) -> BoxFuture<'static, Result<u64>> {
288        cx.background_spawn(async move {
289            let messages = request
290                .messages
291                .into_iter()
292                .map(|message| tiktoken_rs::ChatCompletionRequestMessage {
293                    role: match message.role {
294                        Role::User => "user".into(),
295                        Role::Assistant => "assistant".into(),
296                        Role::System => "system".into(),
297                    },
298                    content: Some(message.string_contents()),
299                    name: None,
300                    function_call: None,
301                })
302                .collect::<Vec<_>>();
303
304            tiktoken_rs::num_tokens_from_messages("gpt-4", &messages).map(|tokens| tokens as u64)
305        })
306        .boxed()
307    }
308
309    fn stream_completion(
310        &self,
311        request: LanguageModelRequest,
312        cx: &AsyncApp,
313    ) -> BoxFuture<
314        'static,
315        Result<
316            BoxStream<'static, Result<LanguageModelCompletionEvent, LanguageModelCompletionError>>,
317            LanguageModelCompletionError,
318        >,
319    > {
320        let request = into_deepseek(request, &self.model, self.max_output_tokens());
321        let stream = self.stream_completion(request, cx);
322
323        async move {
324            let mapper = DeepSeekEventMapper::new();
325            Ok(mapper.map_stream(stream.await?).boxed())
326        }
327        .boxed()
328    }
329}
330
331pub fn into_deepseek(
332    request: LanguageModelRequest,
333    model: &deepseek::Model,
334    max_output_tokens: Option<u64>,
335) -> deepseek::Request {
336    let is_reasoner = *model == deepseek::Model::Reasoner;
337
338    let mut messages = Vec::new();
339    for message in request.messages {
340        for content in message.content {
341            match content {
342                MessageContent::Text(text) => messages.push(match message.role {
343                    Role::User => deepseek::RequestMessage::User { content: text },
344                    Role::Assistant => deepseek::RequestMessage::Assistant {
345                        content: Some(text),
346                        tool_calls: Vec::new(),
347                    },
348                    Role::System => deepseek::RequestMessage::System { content: text },
349                }),
350                MessageContent::Thinking { .. } => {}
351                MessageContent::RedactedThinking(_) => {}
352                MessageContent::Image(_) => {}
353                MessageContent::ToolUse(tool_use) => {
354                    let tool_call = deepseek::ToolCall {
355                        id: tool_use.id.to_string(),
356                        content: deepseek::ToolCallContent::Function {
357                            function: deepseek::FunctionContent {
358                                name: tool_use.name.to_string(),
359                                arguments: serde_json::to_string(&tool_use.input)
360                                    .unwrap_or_default(),
361                            },
362                        },
363                    };
364
365                    if let Some(deepseek::RequestMessage::Assistant { tool_calls, .. }) =
366                        messages.last_mut()
367                    {
368                        tool_calls.push(tool_call);
369                    } else {
370                        messages.push(deepseek::RequestMessage::Assistant {
371                            content: None,
372                            tool_calls: vec![tool_call],
373                        });
374                    }
375                }
376                MessageContent::ToolResult(tool_result) => {
377                    match &tool_result.content {
378                        LanguageModelToolResultContent::Text(text) => {
379                            messages.push(deepseek::RequestMessage::Tool {
380                                content: text.to_string(),
381                                tool_call_id: tool_result.tool_use_id.to_string(),
382                            });
383                        }
384                        LanguageModelToolResultContent::Image(_) => {}
385                    };
386                }
387            }
388        }
389    }
390
391    deepseek::Request {
392        model: model.id().to_string(),
393        messages,
394        stream: true,
395        max_tokens: max_output_tokens,
396        temperature: if is_reasoner {
397            None
398        } else {
399            request.temperature
400        },
401        response_format: None,
402        tools: request
403            .tools
404            .into_iter()
405            .map(|tool| deepseek::ToolDefinition::Function {
406                function: deepseek::FunctionDefinition {
407                    name: tool.name,
408                    description: Some(tool.description),
409                    parameters: Some(tool.input_schema),
410                },
411            })
412            .collect(),
413    }
414}
415
416pub struct DeepSeekEventMapper {
417    tool_calls_by_index: HashMap<usize, RawToolCall>,
418}
419
420impl DeepSeekEventMapper {
421    pub fn new() -> Self {
422        Self {
423            tool_calls_by_index: HashMap::default(),
424        }
425    }
426
427    pub fn map_stream(
428        mut self,
429        events: Pin<Box<dyn Send + Stream<Item = Result<deepseek::StreamResponse>>>>,
430    ) -> impl Stream<Item = Result<LanguageModelCompletionEvent, LanguageModelCompletionError>>
431    {
432        events.flat_map(move |event| {
433            futures::stream::iter(match event {
434                Ok(event) => self.map_event(event),
435                Err(error) => vec![Err(LanguageModelCompletionError::from(error))],
436            })
437        })
438    }
439
440    pub fn map_event(
441        &mut self,
442        event: deepseek::StreamResponse,
443    ) -> Vec<Result<LanguageModelCompletionEvent, LanguageModelCompletionError>> {
444        let Some(choice) = event.choices.first() else {
445            return vec![Err(LanguageModelCompletionError::from(anyhow!(
446                "Response contained no choices"
447            )))];
448        };
449
450        let mut events = Vec::new();
451        if let Some(content) = choice.delta.content.clone() {
452            events.push(Ok(LanguageModelCompletionEvent::Text(content)));
453        }
454
455        if let Some(reasoning_content) = choice.delta.reasoning_content.clone() {
456            events.push(Ok(LanguageModelCompletionEvent::Thinking {
457                text: reasoning_content,
458                signature: None,
459            }));
460        }
461
462        if let Some(tool_calls) = choice.delta.tool_calls.as_ref() {
463            for tool_call in tool_calls {
464                let entry = self.tool_calls_by_index.entry(tool_call.index).or_default();
465
466                if let Some(tool_id) = tool_call.id.clone() {
467                    entry.id = tool_id;
468                }
469
470                if let Some(function) = tool_call.function.as_ref() {
471                    if let Some(name) = function.name.clone() {
472                        entry.name = name;
473                    }
474
475                    if let Some(arguments) = function.arguments.clone() {
476                        entry.arguments.push_str(&arguments);
477                    }
478                }
479            }
480        }
481
482        if let Some(usage) = event.usage {
483            events.push(Ok(LanguageModelCompletionEvent::UsageUpdate(TokenUsage {
484                input_tokens: usage.prompt_tokens,
485                output_tokens: usage.completion_tokens,
486                cache_creation_input_tokens: 0,
487                cache_read_input_tokens: 0,
488            })));
489        }
490
491        match choice.finish_reason.as_deref() {
492            Some("stop") => {
493                events.push(Ok(LanguageModelCompletionEvent::Stop(StopReason::EndTurn)));
494            }
495            Some("tool_calls") => {
496                events.extend(self.tool_calls_by_index.drain().map(|(_, tool_call)| {
497                    match serde_json::Value::from_str(&tool_call.arguments) {
498                        Ok(input) => Ok(LanguageModelCompletionEvent::ToolUse(
499                            LanguageModelToolUse {
500                                id: tool_call.id.clone().into(),
501                                name: tool_call.name.as_str().into(),
502                                is_input_complete: true,
503                                input,
504                                raw_input: tool_call.arguments.clone(),
505                            },
506                        )),
507                        Err(error) => Ok(LanguageModelCompletionEvent::ToolUseJsonParseError {
508                            id: tool_call.id.clone().into(),
509                            tool_name: tool_call.name.as_str().into(),
510                            raw_input: tool_call.arguments.into(),
511                            json_parse_error: error.to_string(),
512                        }),
513                    }
514                }));
515
516                events.push(Ok(LanguageModelCompletionEvent::Stop(StopReason::ToolUse)));
517            }
518            Some(stop_reason) => {
519                log::error!("Unexpected DeepSeek stop_reason: {stop_reason:?}",);
520                events.push(Ok(LanguageModelCompletionEvent::Stop(StopReason::EndTurn)));
521            }
522            None => {}
523        }
524
525        events
526    }
527}
528
529struct ConfigurationView {
530    api_key_editor: Entity<Editor>,
531    state: Entity<State>,
532    load_credentials_task: Option<Task<()>>,
533}
534
535impl ConfigurationView {
536    fn new(state: Entity<State>, window: &mut Window, cx: &mut Context<Self>) -> Self {
537        let api_key_editor = cx.new(|cx| {
538            let mut editor = Editor::single_line(window, cx);
539            editor.set_placeholder_text("sk-00000000000000000000000000000000", window, cx);
540            editor
541        });
542
543        cx.observe(&state, |_, _, cx| {
544            cx.notify();
545        })
546        .detach();
547
548        let load_credentials_task = Some(cx.spawn({
549            let state = state.clone();
550            async move |this, cx| {
551                if let Some(task) = state
552                    .update(cx, |state, cx| state.authenticate(cx))
553                    .log_err()
554                {
555                    let _ = task.await;
556                }
557
558                this.update(cx, |this, cx| {
559                    this.load_credentials_task = None;
560                    cx.notify();
561                })
562                .log_err();
563            }
564        }));
565
566        Self {
567            api_key_editor,
568            state,
569            load_credentials_task,
570        }
571    }
572
573    fn save_api_key(&mut self, _: &menu::Confirm, _window: &mut Window, cx: &mut Context<Self>) {
574        let api_key = self.api_key_editor.read(cx).text(cx).trim().to_string();
575        if api_key.is_empty() {
576            return;
577        }
578
579        let state = self.state.clone();
580        cx.spawn(async move |_, cx| {
581            state
582                .update(cx, |state, cx| state.set_api_key(Some(api_key), cx))?
583                .await
584        })
585        .detach_and_log_err(cx);
586    }
587
588    fn reset_api_key(&mut self, window: &mut Window, cx: &mut Context<Self>) {
589        self.api_key_editor
590            .update(cx, |editor, cx| editor.set_text("", window, cx));
591
592        let state = self.state.clone();
593        cx.spawn(async move |_, cx| {
594            state
595                .update(cx, |state, cx| state.set_api_key(None, cx))?
596                .await
597        })
598        .detach_and_log_err(cx);
599    }
600
601    fn render_api_key_editor(&self, cx: &mut Context<Self>) -> impl IntoElement {
602        let settings = ThemeSettings::get_global(cx);
603        let text_style = TextStyle {
604            color: cx.theme().colors().text,
605            font_family: settings.ui_font.family.clone(),
606            font_features: settings.ui_font.features.clone(),
607            font_fallbacks: settings.ui_font.fallbacks.clone(),
608            font_size: rems(0.875).into(),
609            font_weight: settings.ui_font.weight,
610            font_style: FontStyle::Normal,
611            line_height: relative(1.3),
612            background_color: None,
613            underline: None,
614            strikethrough: None,
615            white_space: WhiteSpace::Normal,
616            ..Default::default()
617        };
618        EditorElement::new(
619            &self.api_key_editor,
620            EditorStyle {
621                background: cx.theme().colors().editor_background,
622                local_player: cx.theme().players().local(),
623                text: text_style,
624                ..Default::default()
625            },
626        )
627    }
628
629    fn should_render_editor(&self, cx: &mut Context<Self>) -> bool {
630        !self.state.read(cx).is_authenticated()
631    }
632}
633
634impl Render for ConfigurationView {
635    fn render(&mut self, _window: &mut Window, cx: &mut Context<Self>) -> impl IntoElement {
636        let env_var_set = self.state.read(cx).api_key_state.is_from_env_var();
637
638        if self.load_credentials_task.is_some() {
639            div().child(Label::new("Loading credentials...")).into_any()
640        } else if self.should_render_editor(cx) {
641            v_flex()
642                .size_full()
643                .on_action(cx.listener(Self::save_api_key))
644                .child(Label::new("To use DeepSeek in Zed, you need an API key:"))
645                .child(
646                    List::new()
647                        .child(InstructionListItem::new(
648                            "Get your API key from the",
649                            Some("DeepSeek console"),
650                            Some("https://platform.deepseek.com/api_keys"),
651                        ))
652                        .child(InstructionListItem::text_only(
653                            "Paste your API key below and hit enter to start using the assistant",
654                        )),
655                )
656                .child(
657                    h_flex()
658                        .w_full()
659                        .my_2()
660                        .px_2()
661                        .py_1()
662                        .bg(cx.theme().colors().editor_background)
663                        .border_1()
664                        .border_color(cx.theme().colors().border)
665                        .rounded_sm()
666                        .child(self.render_api_key_editor(cx)),
667                )
668                .child(
669                    Label::new(format!(
670                        "Or set the {API_KEY_ENV_VAR_NAME} environment variable."
671                    ))
672                    .size(LabelSize::Small)
673                    .color(Color::Muted),
674                )
675                .into_any()
676        } else {
677            h_flex()
678                .mt_1()
679                .p_1()
680                .justify_between()
681                .rounded_md()
682                .border_1()
683                .border_color(cx.theme().colors().border)
684                .bg(cx.theme().colors().background)
685                .child(
686                    h_flex()
687                        .gap_1()
688                        .child(Icon::new(IconName::Check).color(Color::Success))
689                        .child(Label::new(if env_var_set {
690                            format!("API key set in {API_KEY_ENV_VAR_NAME} environment variable")
691                        } else {
692                            let api_url = DeepSeekLanguageModelProvider::api_url(cx);
693                            if api_url == DEEPSEEK_API_URL {
694                                "API key configured".to_string()
695                            } else {
696                                format!(
697                                    "API key configured for {}",
698                                    truncate_and_trailoff(&api_url, 32)
699                                )
700                            }
701                        })),
702                )
703                .child(
704                    Button::new("reset-key", "Reset Key")
705                        .label_size(LabelSize::Small)
706                        .icon(Some(IconName::Trash))
707                        .icon_size(IconSize::Small)
708                        .icon_position(IconPosition::Start)
709                        .disabled(env_var_set)
710                        .on_click(
711                            cx.listener(|this, _, window, cx| this.reset_api_key(window, cx)),
712                        ),
713                )
714                .into_any()
715        }
716    }
717}