deepseek.rs

  1use anyhow::{Result, anyhow};
  2use collections::{BTreeMap, HashMap};
  3use editor::{Editor, EditorElement, EditorStyle};
  4use futures::Stream;
  5use futures::{FutureExt, StreamExt, future, future::BoxFuture, stream::BoxStream};
  6use gpui::{
  7    AnyView, App, AsyncApp, Context, Entity, FontStyle, SharedString, Task, TextStyle, WhiteSpace,
  8    Window,
  9};
 10use http_client::HttpClient;
 11use language_model::{
 12    AuthenticateError, LanguageModel, LanguageModelCompletionError, LanguageModelCompletionEvent,
 13    LanguageModelId, LanguageModelName, LanguageModelProvider, LanguageModelProviderId,
 14    LanguageModelProviderName, LanguageModelProviderState, LanguageModelRequest,
 15    LanguageModelToolChoice, LanguageModelToolResultContent, LanguageModelToolUse, MessageContent,
 16    RateLimiter, Role, StopReason, TokenUsage,
 17};
 18use schemars::JsonSchema;
 19use serde::{Deserialize, Serialize};
 20use settings::{Settings, SettingsStore};
 21use std::pin::Pin;
 22use std::str::FromStr;
 23use std::sync::{Arc, LazyLock};
 24use theme::ThemeSettings;
 25use ui::{Icon, IconName, List, prelude::*};
 26use util::ResultExt;
 27use zed_env_vars::{EnvVar, env_var};
 28
 29use crate::{api_key::ApiKeyState, ui::InstructionListItem};
 30
/// Identifier returned by this provider and its models from `id()` / `provider_id()`.
const PROVIDER_ID: LanguageModelProviderId = LanguageModelProviderId::new("deepseek");
/// Display name returned from `name()` / `provider_name()` and attached to the
/// "no API key" completion error.
const PROVIDER_NAME: LanguageModelProviderName = LanguageModelProviderName::new("DeepSeek");

/// Name of the environment variable mentioned in the configuration UI as an
/// alternative source for the API key.
const API_KEY_ENV_VAR_NAME: &str = "DEEPSEEK_API_KEY";
/// Environment-variable handle built from [`API_KEY_ENV_VAR_NAME`]; handed to the
/// API key state when credentials are loaded or the API URL changes.
static API_KEY_ENV_VAR: LazyLock<EnvVar> = env_var!(API_KEY_ENV_VAR_NAME);
 36
/// Accumulator for a single tool call whose pieces arrive across several
/// streamed response chunks (see `DeepSeekEventMapper::map_event`).
#[derive(Default)]
struct RawToolCall {
    /// Tool call id; overwritten whenever a chunk carries one.
    id: String,
    /// Function name; overwritten whenever a chunk carries one.
    name: String,
    /// Argument text, built by appending each chunk's fragment; parsed as JSON
    /// once the call is finished.
    arguments: String,
}
 43
/// Settings for the DeepSeek provider, read from the global language model settings.
#[derive(Default, Clone, Debug, PartialEq)]
pub struct DeepSeekSettings {
    /// API URL passed to the DeepSeek client for completion requests; it is also
    /// passed to the API key state when storing, loading and reading the key.
    pub api_url: String,
    /// Extra models exposed by the provider as `deepseek::Model::Custom` entries.
    pub available_models: Vec<AvailableModel>,
}
 49
/// A user-configured model; its fields are copied verbatim into a
/// `deepseek::Model::Custom` by `provided_models`.
#[derive(Clone, Debug, PartialEq, Serialize, Deserialize, JsonSchema)]
pub struct AvailableModel {
    /// Model name; also the key under which the model is listed, so an entry whose
    /// name equals a built-in model's name replaces that built-in entry.
    pub name: String,
    /// Optional display name forwarded to the custom model.
    pub display_name: Option<String>,
    /// Forwarded as the custom model's `max_tokens` (presumably the context window
    /// size — confirm against the `deepseek` crate).
    pub max_tokens: u64,
    /// Optional limit forwarded as the custom model's `max_output_tokens`.
    pub max_output_tokens: Option<u64>,
}
 57
/// Language model provider for DeepSeek.
pub struct DeepSeekLanguageModelProvider {
    /// HTTP client cloned into every language model created by this provider.
    http_client: Arc<dyn HttpClient>,
    /// Credential state shared with the created models and the configuration view.
    state: Entity<State>,
}
 62
/// Observable provider state; currently only the API key bookkeeping.
pub struct State {
    /// Tracks the API key for the currently configured API URL.
    api_key_state: ApiKeyState,
}
 66
 67impl State {
 68    fn is_authenticated(&self) -> bool {
 69        self.api_key_state.has_key()
 70    }
 71
 72    fn set_api_key(&mut self, api_key: Option<String>, cx: &mut Context<Self>) -> Task<Result<()>> {
 73        let api_url = SharedString::new(DeepSeekLanguageModelProvider::api_url(cx));
 74        self.api_key_state
 75            .store(api_url, api_key, |this| &mut this.api_key_state, cx)
 76    }
 77
 78    fn authenticate(&mut self, cx: &mut Context<Self>) -> Task<Result<(), AuthenticateError>> {
 79        let api_url = SharedString::new(DeepSeekLanguageModelProvider::api_url(cx));
 80        self.api_key_state.load_if_needed(
 81            api_url,
 82            &API_KEY_ENV_VAR,
 83            |this| &mut this.api_key_state,
 84            cx,
 85        )
 86    }
 87}
 88
 89impl DeepSeekLanguageModelProvider {
 90    pub fn new(http_client: Arc<dyn HttpClient>, cx: &mut App) -> Self {
 91        let state = cx.new(|cx| {
 92            cx.observe_global::<SettingsStore>(|this: &mut State, cx| {
 93                let api_url = SharedString::new(Self::api_url(cx));
 94                this.api_key_state.handle_url_change(
 95                    api_url,
 96                    &API_KEY_ENV_VAR,
 97                    |this| &mut this.api_key_state,
 98                    cx,
 99                );
100                cx.notify();
101            })
102            .detach();
103            State {
104                api_key_state: ApiKeyState::new(SharedString::new(Self::api_url(cx))),
105            }
106        });
107
108        Self { http_client, state }
109    }
110
111    fn create_language_model(&self, model: deepseek::Model) -> Arc<dyn LanguageModel> {
112        Arc::new(DeepSeekLanguageModel {
113            id: LanguageModelId::from(model.id().to_string()),
114            model,
115            state: self.state.clone(),
116            http_client: self.http_client.clone(),
117            request_limiter: RateLimiter::new(4),
118        })
119    }
120
121    fn settings(cx: &App) -> &DeepSeekSettings {
122        &crate::AllLanguageModelSettings::get_global(cx).deepseek
123    }
124
125    fn api_url(cx: &App) -> &str {
126        &Self::settings(cx).api_url
127    }
128}
129
130impl LanguageModelProviderState for DeepSeekLanguageModelProvider {
131    type ObservableEntity = State;
132
133    fn observable_entity(&self) -> Option<Entity<Self::ObservableEntity>> {
134        Some(self.state.clone())
135    }
136}
137
138impl LanguageModelProvider for DeepSeekLanguageModelProvider {
139    fn id(&self) -> LanguageModelProviderId {
140        PROVIDER_ID
141    }
142
143    fn name(&self) -> LanguageModelProviderName {
144        PROVIDER_NAME
145    }
146
147    fn icon(&self) -> IconName {
148        IconName::AiDeepSeek
149    }
150
151    fn default_model(&self, _cx: &App) -> Option<Arc<dyn LanguageModel>> {
152        Some(self.create_language_model(deepseek::Model::default()))
153    }
154
155    fn default_fast_model(&self, _cx: &App) -> Option<Arc<dyn LanguageModel>> {
156        Some(self.create_language_model(deepseek::Model::default_fast()))
157    }
158
159    fn provided_models(&self, cx: &App) -> Vec<Arc<dyn LanguageModel>> {
160        let mut models = BTreeMap::default();
161
162        models.insert("deepseek-chat", deepseek::Model::Chat);
163        models.insert("deepseek-reasoner", deepseek::Model::Reasoner);
164
165        for available_model in &Self::settings(cx).available_models {
166            models.insert(
167                &available_model.name,
168                deepseek::Model::Custom {
169                    name: available_model.name.clone(),
170                    display_name: available_model.display_name.clone(),
171                    max_tokens: available_model.max_tokens,
172                    max_output_tokens: available_model.max_output_tokens,
173                },
174            );
175        }
176
177        models
178            .into_values()
179            .map(|model| self.create_language_model(model))
180            .collect()
181    }
182
183    fn is_authenticated(&self, cx: &App) -> bool {
184        self.state.read(cx).is_authenticated()
185    }
186
187    fn authenticate(&self, cx: &mut App) -> Task<Result<(), AuthenticateError>> {
188        self.state.update(cx, |state, cx| state.authenticate(cx))
189    }
190
191    fn configuration_view(
192        &self,
193        _target_agent: language_model::ConfigurationViewTargetAgent,
194        window: &mut Window,
195        cx: &mut App,
196    ) -> AnyView {
197        cx.new(|cx| ConfigurationView::new(self.state.clone(), window, cx))
198            .into()
199    }
200
201    fn reset_credentials(&self, cx: &mut App) -> Task<Result<()>> {
202        self.state
203            .update(cx, |state, cx| state.set_api_key(None, cx))
204    }
205}
206
/// A single DeepSeek model exposed through the `LanguageModel` trait.
pub struct DeepSeekLanguageModel {
    /// Identifier derived from the model's id string.
    id: LanguageModelId,
    /// The underlying DeepSeek model description.
    model: deepseek::Model,
    /// Provider state shared with the provider; the API key is read from it.
    state: Entity<State>,
    /// HTTP client used to issue completion requests.
    http_client: Arc<dyn HttpClient>,
    /// Limiter every streaming request goes through; created with `RateLimiter::new(4)`
    /// (presumably a cap of four concurrent requests — confirm against `RateLimiter`).
    request_limiter: RateLimiter,
}
214
215impl DeepSeekLanguageModel {
216    fn stream_completion(
217        &self,
218        request: deepseek::Request,
219        cx: &AsyncApp,
220    ) -> BoxFuture<'static, Result<BoxStream<'static, Result<deepseek::StreamResponse>>>> {
221        let http_client = self.http_client.clone();
222
223        let Ok((api_key, api_url)) = self.state.read_with(cx, |state, cx| {
224            let api_url = DeepSeekLanguageModelProvider::api_url(cx);
225            (state.api_key_state.key(api_url), api_url.to_string())
226        }) else {
227            return future::ready(Err(anyhow!("App state dropped"))).boxed();
228        };
229
230        let future = self.request_limiter.stream(async move {
231            let Some(api_key) = api_key else {
232                return Err(LanguageModelCompletionError::NoApiKey {
233                    provider: PROVIDER_NAME,
234                });
235            };
236            let request =
237                deepseek::stream_completion(http_client.as_ref(), &api_url, &api_key, request);
238            let response = request.await?;
239            Ok(response)
240        });
241
242        async move { Ok(future.await?.boxed()) }.boxed()
243    }
244}
245
246impl LanguageModel for DeepSeekLanguageModel {
247    fn id(&self) -> LanguageModelId {
248        self.id.clone()
249    }
250
251    fn name(&self) -> LanguageModelName {
252        LanguageModelName::from(self.model.display_name().to_string())
253    }
254
255    fn provider_id(&self) -> LanguageModelProviderId {
256        PROVIDER_ID
257    }
258
259    fn provider_name(&self) -> LanguageModelProviderName {
260        PROVIDER_NAME
261    }
262
263    fn supports_tools(&self) -> bool {
264        true
265    }
266
267    fn supports_tool_choice(&self, _choice: LanguageModelToolChoice) -> bool {
268        true
269    }
270
271    fn supports_images(&self) -> bool {
272        false
273    }
274
275    fn telemetry_id(&self) -> String {
276        format!("deepseek/{}", self.model.id())
277    }
278
279    fn max_token_count(&self) -> u64 {
280        self.model.max_token_count()
281    }
282
283    fn max_output_tokens(&self) -> Option<u64> {
284        self.model.max_output_tokens()
285    }
286
287    fn count_tokens(
288        &self,
289        request: LanguageModelRequest,
290        cx: &App,
291    ) -> BoxFuture<'static, Result<u64>> {
292        cx.background_spawn(async move {
293            let messages = request
294                .messages
295                .into_iter()
296                .map(|message| tiktoken_rs::ChatCompletionRequestMessage {
297                    role: match message.role {
298                        Role::User => "user".into(),
299                        Role::Assistant => "assistant".into(),
300                        Role::System => "system".into(),
301                    },
302                    content: Some(message.string_contents()),
303                    name: None,
304                    function_call: None,
305                })
306                .collect::<Vec<_>>();
307
308            tiktoken_rs::num_tokens_from_messages("gpt-4", &messages).map(|tokens| tokens as u64)
309        })
310        .boxed()
311    }
312
313    fn stream_completion(
314        &self,
315        request: LanguageModelRequest,
316        cx: &AsyncApp,
317    ) -> BoxFuture<
318        'static,
319        Result<
320            BoxStream<'static, Result<LanguageModelCompletionEvent, LanguageModelCompletionError>>,
321            LanguageModelCompletionError,
322        >,
323    > {
324        let request = into_deepseek(request, &self.model, self.max_output_tokens());
325        let stream = self.stream_completion(request, cx);
326
327        async move {
328            let mapper = DeepSeekEventMapper::new();
329            Ok(mapper.map_stream(stream.await?).boxed())
330        }
331        .boxed()
332    }
333}
334
335pub fn into_deepseek(
336    request: LanguageModelRequest,
337    model: &deepseek::Model,
338    max_output_tokens: Option<u64>,
339) -> deepseek::Request {
340    let is_reasoner = *model == deepseek::Model::Reasoner;
341
342    let mut messages = Vec::new();
343    for message in request.messages {
344        for content in message.content {
345            match content {
346                MessageContent::Text(text) => messages.push(match message.role {
347                    Role::User => deepseek::RequestMessage::User { content: text },
348                    Role::Assistant => deepseek::RequestMessage::Assistant {
349                        content: Some(text),
350                        tool_calls: Vec::new(),
351                    },
352                    Role::System => deepseek::RequestMessage::System { content: text },
353                }),
354                MessageContent::Thinking { .. } => {}
355                MessageContent::RedactedThinking(_) => {}
356                MessageContent::Image(_) => {}
357                MessageContent::ToolUse(tool_use) => {
358                    let tool_call = deepseek::ToolCall {
359                        id: tool_use.id.to_string(),
360                        content: deepseek::ToolCallContent::Function {
361                            function: deepseek::FunctionContent {
362                                name: tool_use.name.to_string(),
363                                arguments: serde_json::to_string(&tool_use.input)
364                                    .unwrap_or_default(),
365                            },
366                        },
367                    };
368
369                    if let Some(deepseek::RequestMessage::Assistant { tool_calls, .. }) =
370                        messages.last_mut()
371                    {
372                        tool_calls.push(tool_call);
373                    } else {
374                        messages.push(deepseek::RequestMessage::Assistant {
375                            content: None,
376                            tool_calls: vec![tool_call],
377                        });
378                    }
379                }
380                MessageContent::ToolResult(tool_result) => {
381                    match &tool_result.content {
382                        LanguageModelToolResultContent::Text(text) => {
383                            messages.push(deepseek::RequestMessage::Tool {
384                                content: text.to_string(),
385                                tool_call_id: tool_result.tool_use_id.to_string(),
386                            });
387                        }
388                        LanguageModelToolResultContent::Image(_) => {}
389                    };
390                }
391            }
392        }
393    }
394
395    deepseek::Request {
396        model: model.id().to_string(),
397        messages,
398        stream: true,
399        max_tokens: max_output_tokens,
400        temperature: if is_reasoner {
401            None
402        } else {
403            request.temperature
404        },
405        response_format: None,
406        tools: request
407            .tools
408            .into_iter()
409            .map(|tool| deepseek::ToolDefinition::Function {
410                function: deepseek::FunctionDefinition {
411                    name: tool.name,
412                    description: Some(tool.description),
413                    parameters: Some(tool.input_schema),
414                },
415            })
416            .collect(),
417    }
418}
419
420pub struct DeepSeekEventMapper {
421    tool_calls_by_index: HashMap<usize, RawToolCall>,
422}
423
424impl DeepSeekEventMapper {
425    pub fn new() -> Self {
426        Self {
427            tool_calls_by_index: HashMap::default(),
428        }
429    }
430
431    pub fn map_stream(
432        mut self,
433        events: Pin<Box<dyn Send + Stream<Item = Result<deepseek::StreamResponse>>>>,
434    ) -> impl Stream<Item = Result<LanguageModelCompletionEvent, LanguageModelCompletionError>>
435    {
436        events.flat_map(move |event| {
437            futures::stream::iter(match event {
438                Ok(event) => self.map_event(event),
439                Err(error) => vec![Err(LanguageModelCompletionError::from(error))],
440            })
441        })
442    }
443
444    pub fn map_event(
445        &mut self,
446        event: deepseek::StreamResponse,
447    ) -> Vec<Result<LanguageModelCompletionEvent, LanguageModelCompletionError>> {
448        let Some(choice) = event.choices.first() else {
449            return vec![Err(LanguageModelCompletionError::from(anyhow!(
450                "Response contained no choices"
451            )))];
452        };
453
454        let mut events = Vec::new();
455        if let Some(content) = choice.delta.content.clone() {
456            events.push(Ok(LanguageModelCompletionEvent::Text(content)));
457        }
458
459        if let Some(reasoning_content) = choice.delta.reasoning_content.clone() {
460            events.push(Ok(LanguageModelCompletionEvent::Thinking {
461                text: reasoning_content,
462                signature: None,
463            }));
464        }
465
466        if let Some(tool_calls) = choice.delta.tool_calls.as_ref() {
467            for tool_call in tool_calls {
468                let entry = self.tool_calls_by_index.entry(tool_call.index).or_default();
469
470                if let Some(tool_id) = tool_call.id.clone() {
471                    entry.id = tool_id;
472                }
473
474                if let Some(function) = tool_call.function.as_ref() {
475                    if let Some(name) = function.name.clone() {
476                        entry.name = name;
477                    }
478
479                    if let Some(arguments) = function.arguments.clone() {
480                        entry.arguments.push_str(&arguments);
481                    }
482                }
483            }
484        }
485
486        if let Some(usage) = event.usage {
487            events.push(Ok(LanguageModelCompletionEvent::UsageUpdate(TokenUsage {
488                input_tokens: usage.prompt_tokens,
489                output_tokens: usage.completion_tokens,
490                cache_creation_input_tokens: 0,
491                cache_read_input_tokens: 0,
492            })));
493        }
494
495        match choice.finish_reason.as_deref() {
496            Some("stop") => {
497                events.push(Ok(LanguageModelCompletionEvent::Stop(StopReason::EndTurn)));
498            }
499            Some("tool_calls") => {
500                events.extend(self.tool_calls_by_index.drain().map(|(_, tool_call)| {
501                    match serde_json::Value::from_str(&tool_call.arguments) {
502                        Ok(input) => Ok(LanguageModelCompletionEvent::ToolUse(
503                            LanguageModelToolUse {
504                                id: tool_call.id.clone().into(),
505                                name: tool_call.name.as_str().into(),
506                                is_input_complete: true,
507                                input,
508                                raw_input: tool_call.arguments.clone(),
509                            },
510                        )),
511                        Err(error) => Ok(LanguageModelCompletionEvent::ToolUseJsonParseError {
512                            id: tool_call.id.clone().into(),
513                            tool_name: tool_call.name.as_str().into(),
514                            raw_input: tool_call.arguments.into(),
515                            json_parse_error: error.to_string(),
516                        }),
517                    }
518                }));
519
520                events.push(Ok(LanguageModelCompletionEvent::Stop(StopReason::ToolUse)));
521            }
522            Some(stop_reason) => {
523                log::error!("Unexpected DeepSeek stop_reason: {stop_reason:?}",);
524                events.push(Ok(LanguageModelCompletionEvent::Stop(StopReason::EndTurn)));
525            }
526            None => {}
527        }
528
529        events
530    }
531}
532
/// View that lets the user enter or reset the DeepSeek API key.
struct ConfigurationView {
    /// Single-line editor the API key is typed or pasted into.
    api_key_editor: Entity<Editor>,
    /// Provider state holding the API key; observed so the view re-renders on change.
    state: Entity<State>,
    /// Task performing the initial credential load; `Some` while it is still running,
    /// during which a loading label is rendered.
    load_credentials_task: Option<Task<()>>,
}
538
539impl ConfigurationView {
540    fn new(state: Entity<State>, window: &mut Window, cx: &mut Context<Self>) -> Self {
541        let api_key_editor = cx.new(|cx| {
542            let mut editor = Editor::single_line(window, cx);
543            editor.set_placeholder_text("sk-00000000000000000000000000000000", window, cx);
544            editor
545        });
546
547        cx.observe(&state, |_, _, cx| {
548            cx.notify();
549        })
550        .detach();
551
552        let load_credentials_task = Some(cx.spawn({
553            let state = state.clone();
554            async move |this, cx| {
555                if let Some(task) = state
556                    .update(cx, |state, cx| state.authenticate(cx))
557                    .log_err()
558                {
559                    let _ = task.await;
560                }
561
562                this.update(cx, |this, cx| {
563                    this.load_credentials_task = None;
564                    cx.notify();
565                })
566                .log_err();
567            }
568        }));
569
570        Self {
571            api_key_editor,
572            state,
573            load_credentials_task,
574        }
575    }
576
577    fn save_api_key(&mut self, _: &menu::Confirm, _window: &mut Window, cx: &mut Context<Self>) {
578        let api_key = self.api_key_editor.read(cx).text(cx).trim().to_string();
579        if api_key.is_empty() {
580            return;
581        }
582
583        let state = self.state.clone();
584        cx.spawn(async move |_, cx| {
585            state
586                .update(cx, |state, cx| state.set_api_key(Some(api_key), cx))?
587                .await
588        })
589        .detach_and_log_err(cx);
590    }
591
592    fn reset_api_key(&mut self, window: &mut Window, cx: &mut Context<Self>) {
593        self.api_key_editor
594            .update(cx, |editor, cx| editor.set_text("", window, cx));
595
596        let state = self.state.clone();
597        cx.spawn(async move |_, cx| {
598            state
599                .update(cx, |state, cx| state.set_api_key(None, cx))?
600                .await
601        })
602        .detach_and_log_err(cx);
603    }
604
605    fn render_api_key_editor(&self, cx: &mut Context<Self>) -> impl IntoElement {
606        let settings = ThemeSettings::get_global(cx);
607        let text_style = TextStyle {
608            color: cx.theme().colors().text,
609            font_family: settings.ui_font.family.clone(),
610            font_features: settings.ui_font.features.clone(),
611            font_fallbacks: settings.ui_font.fallbacks.clone(),
612            font_size: rems(0.875).into(),
613            font_weight: settings.ui_font.weight,
614            font_style: FontStyle::Normal,
615            line_height: relative(1.3),
616            background_color: None,
617            underline: None,
618            strikethrough: None,
619            white_space: WhiteSpace::Normal,
620            ..Default::default()
621        };
622        EditorElement::new(
623            &self.api_key_editor,
624            EditorStyle {
625                background: cx.theme().colors().editor_background,
626                local_player: cx.theme().players().local(),
627                text: text_style,
628                ..Default::default()
629            },
630        )
631    }
632
633    fn should_render_editor(&self, cx: &mut Context<Self>) -> bool {
634        !self.state.read(cx).is_authenticated()
635    }
636}
637
638impl Render for ConfigurationView {
639    fn render(&mut self, _window: &mut Window, cx: &mut Context<Self>) -> impl IntoElement {
640        let env_var_set = self.state.read(cx).api_key_state.is_from_env_var();
641
642        if self.load_credentials_task.is_some() {
643            div().child(Label::new("Loading credentials...")).into_any()
644        } else if self.should_render_editor(cx) {
645            v_flex()
646                .size_full()
647                .on_action(cx.listener(Self::save_api_key))
648                .child(Label::new("To use DeepSeek in Zed, you need an API key:"))
649                .child(
650                    List::new()
651                        .child(InstructionListItem::new(
652                            "Get your API key from the",
653                            Some("DeepSeek console"),
654                            Some("https://platform.deepseek.com/api_keys"),
655                        ))
656                        .child(InstructionListItem::text_only(
657                            "Paste your API key below and hit enter to start using the assistant",
658                        )),
659                )
660                .child(
661                    h_flex()
662                        .w_full()
663                        .my_2()
664                        .px_2()
665                        .py_1()
666                        .bg(cx.theme().colors().editor_background)
667                        .border_1()
668                        .border_color(cx.theme().colors().border)
669                        .rounded_sm()
670                        .child(self.render_api_key_editor(cx)),
671                )
672                .child(
673                    Label::new(format!(
674                        "Or set the {API_KEY_ENV_VAR_NAME} environment variable."
675                    ))
676                    .size(LabelSize::Small)
677                    .color(Color::Muted),
678                )
679                .into_any()
680        } else {
681            h_flex()
682                .mt_1()
683                .p_1()
684                .justify_between()
685                .rounded_md()
686                .border_1()
687                .border_color(cx.theme().colors().border)
688                .bg(cx.theme().colors().background)
689                .child(
690                    h_flex()
691                        .gap_1()
692                        .child(Icon::new(IconName::Check).color(Color::Success))
693                        .child(Label::new(if env_var_set {
694                            format!("API key set in {API_KEY_ENV_VAR_NAME}")
695                        } else {
696                            "API key configured".to_string()
697                        })),
698                )
699                .child(
700                    Button::new("reset-key", "Reset Key")
701                        .label_size(LabelSize::Small)
702                        .icon(Some(IconName::Trash))
703                        .icon_size(IconSize::Small)
704                        .icon_position(IconPosition::Start)
705                        .disabled(env_var_set)
706                        .on_click(
707                            cx.listener(|this, _, window, cx| this.reset_api_key(window, cx)),
708                        ),
709                )
710                .into_any()
711        }
712    }
713}