1use std::pin::Pin;
2use std::str::FromStr;
3use std::sync::Arc;
4
5use crate::ui::InstructionListItem;
6use anyhow::{Context as _, Result, anyhow};
7use aws_config::stalled_stream_protection::StalledStreamProtectionConfig;
8use aws_config::{BehaviorVersion, Region};
9use aws_credential_types::Credentials;
10use aws_http_client::AwsHttpClient;
11use bedrock::bedrock_client::Client as BedrockClient;
12use bedrock::bedrock_client::config::timeout::TimeoutConfig;
13use bedrock::bedrock_client::types::{
14 ContentBlockDelta, ContentBlockStart, ConverseStreamOutput, ReasoningContentBlockDelta,
15 StopReason,
16};
17use bedrock::{
18 BedrockAnyToolChoice, BedrockAutoToolChoice, BedrockBlob, BedrockError, BedrockInnerContent,
19 BedrockMessage, BedrockModelMode, BedrockStreamingResponse, BedrockThinkingBlock,
20 BedrockThinkingTextBlock, BedrockTool, BedrockToolChoice, BedrockToolConfig,
21 BedrockToolInputSchema, BedrockToolResultBlock, BedrockToolResultContentBlock,
22 BedrockToolResultStatus, BedrockToolSpec, BedrockToolUseBlock, Model, value_to_aws_document,
23};
24use collections::{BTreeMap, HashMap};
25use credentials_provider::CredentialsProvider;
26use editor::{Editor, EditorElement, EditorStyle};
27use futures::{FutureExt, Stream, StreamExt, future::BoxFuture, stream::BoxStream};
28use gpui::{
29 AnyView, App, AsyncApp, Context, Entity, FontStyle, FontWeight, Subscription, Task, TextStyle,
30 WhiteSpace,
31};
32use gpui_tokio::Tokio;
33use http_client::HttpClient;
34use language_model::{
35 AuthenticateError, LanguageModel, LanguageModelCacheConfiguration,
36 LanguageModelCompletionError, LanguageModelCompletionEvent, LanguageModelId, LanguageModelName,
37 LanguageModelProvider, LanguageModelProviderId, LanguageModelProviderName,
38 LanguageModelProviderState, LanguageModelRequest, LanguageModelToolChoice,
39 LanguageModelToolResultContent, LanguageModelToolUse, MessageContent, RateLimiter, Role,
40 TokenUsage,
41};
42use schemars::JsonSchema;
43use serde::{Deserialize, Serialize};
44use serde_json::Value;
45use settings::{Settings, SettingsStore};
46use smol::lock::OnceCell;
47use strum::{EnumIter, IntoEnumIterator, IntoStaticStr};
48use theme::ThemeSettings;
49use tokio::runtime::Handle;
50use ui::{Icon, IconName, List, Tooltip, prelude::*};
51use util::{ResultExt, default};
52
53use crate::AllLanguageModelSettings;
54
/// Identifier this provider (and each of its models) reports as its `LanguageModelProviderId`.
const PROVIDER_ID: &str = "amazon-bedrock";
/// Human-readable name this provider reports as its `LanguageModelProviderName`.
const PROVIDER_NAME: &str = "Amazon Bedrock";
57
/// Static AWS credentials plus the region they should be used with.
///
/// Values of this type are serialized to JSON before being written to the
/// credentials provider, and are parsed back from JSON when read from the
/// credentials provider or from the `ZED_AWS_CREDENTIALS` environment variable.
#[derive(Default, Clone, Deserialize, Serialize, PartialEq, Debug)]
pub struct BedrockCredentials {
    /// AWS access key id handed to the SDK `Credentials`.
    pub access_key_id: String,
    /// AWS secret access key handed to the SDK `Credentials`.
    pub secret_access_key: String,
    /// Optional session token handed to the SDK `Credentials`.
    pub session_token: Option<String>,
    /// Region used for requests; takes precedence over the region from settings.
    pub region: String,
}
65
/// User-configurable settings for the Amazon Bedrock provider.
#[derive(Default, Clone, Debug, PartialEq)]
pub struct AmazonBedrockSettings {
    /// Extra models exposed as `bedrock::Model::Custom`; an entry overrides a
    /// built-in model that has the same id as its `name`.
    pub available_models: Vec<AvailableModel>,
    /// Region used when the stored credentials do not supply one.
    pub region: Option<String>,
    /// Custom endpoint URL; ignored when empty.
    pub endpoint: Option<String>,
    /// AWS profile used by the `NamedProfile` and `SingleSignOn` auth methods
    /// (falls back to `"default"` when unset).
    pub profile_name: Option<String>,
    /// NOTE(review): not read anywhere in the visible part of this file — confirm usage.
    pub role_arn: Option<String>,
    /// When set, the provider is considered authenticated without stored credentials.
    pub authentication_method: Option<BedrockAuthMethod>,
}
75
// How credentials are resolved when the Bedrock client is built.
//
// NOTE: the comments added here are plain `//` comments on purpose: this type
// derives `JsonSchema`, and `///` doc comments may be surfaced as schema
// descriptions, which would change generated output.
#[derive(Clone, Debug, PartialEq, Serialize, Deserialize, EnumIter, IntoStaticStr, JsonSchema)]
pub enum BedrockAuthMethod {
    // Sets a profile name on the AWS config builder.
    #[serde(rename = "named_profile")]
    NamedProfile,
    // Currently configured exactly like `NamedProfile` when the client is built.
    #[serde(rename = "sso")]
    SingleSignOn,
    /// IMDSv2, PodIdentity, env vars, etc.
    #[serde(rename = "default")]
    Automatic,
}
86
// A user-declared model from settings.
//
// `provided_models` copies `name`, `display_name`, `max_tokens`,
// `max_output_tokens` and `default_temperature` into `bedrock::Model::Custom`.
// NOTE(review): `cache_configuration` and `mode` are not forwarded in the
// visible part of this file — confirm whether that is intended.
//
// Plain `//` comments are used because this type derives `JsonSchema` and
// `///` doc comments may end up in the generated schema.
#[derive(Clone, Debug, PartialEq, Serialize, Deserialize, JsonSchema)]
pub struct AvailableModel {
    // Model identifier; also the key under which the model is registered.
    pub name: String,
    pub display_name: Option<String>,
    pub max_tokens: u64,
    pub cache_configuration: Option<LanguageModelCacheConfiguration>,
    pub max_output_tokens: Option<u64>,
    pub default_temperature: Option<f32>,
    pub mode: Option<ModelMode>,
}
97
// Settings-facing mirror of `BedrockModelMode`; the two convert into each
// other through the `From` impls below.
//
// Serialized as an internally tagged enum: the variant name is stored
// lowercase under the `type` key.
#[derive(Clone, Debug, Default, PartialEq, Serialize, Deserialize, JsonSchema)]
#[serde(tag = "type", rename_all = "lowercase")]
pub enum ModelMode {
    #[default]
    Default,
    Thinking {
        /// The maximum number of tokens to use for reasoning. Must be lower than the model's `max_output_tokens`.
        budget_tokens: Option<u64>,
    },
}
108
109impl From<ModelMode> for BedrockModelMode {
110 fn from(value: ModelMode) -> Self {
111 match value {
112 ModelMode::Default => BedrockModelMode::Default,
113 ModelMode::Thinking { budget_tokens } => BedrockModelMode::Thinking { budget_tokens },
114 }
115 }
116}
117
118impl From<BedrockModelMode> for ModelMode {
119 fn from(value: BedrockModelMode) -> Self {
120 match value {
121 BedrockModelMode::Default => ModelMode::Default,
122 BedrockModelMode::Thinking { budget_tokens } => ModelMode::Thinking { budget_tokens },
123 }
124 }
125}
126
/// The URL of the base AWS service.
///
/// Right now we're just using this as the key to store the AWS credentials
/// under in the keychain.
const AMAZON_AWS_URL: &str = "https://amazonaws.com";

// These environment variables all use a `ZED_` prefix because we don't want to overwrite the user's AWS credentials.
// NOTE(review): within the visible part of this file only `ZED_AWS_CREDENTIALS_VAR`
// is read (by `State::authenticate`, which expects JSON-encoded `BedrockCredentials`);
// the remaining names are presumably consumed further down — confirm.
const ZED_BEDROCK_ACCESS_KEY_ID_VAR: &str = "ZED_ACCESS_KEY_ID";
const ZED_BEDROCK_SECRET_ACCESS_KEY_VAR: &str = "ZED_SECRET_ACCESS_KEY";
const ZED_BEDROCK_SESSION_TOKEN_VAR: &str = "ZED_SESSION_TOKEN";
const ZED_AWS_PROFILE_VAR: &str = "ZED_AWS_PROFILE";
const ZED_BEDROCK_REGION_VAR: &str = "ZED_AWS_REGION";
const ZED_AWS_CREDENTIALS_VAR: &str = "ZED_AWS_CREDENTIALS";
const ZED_AWS_ENDPOINT_VAR: &str = "ZED_AWS_ENDPOINT";
141
/// Shared authentication state for the Bedrock provider and all of its models.
pub struct State {
    /// Static credentials loaded from the environment or the credentials provider, if any.
    credentials: Option<BedrockCredentials>,
    /// Snapshot of the Bedrock settings taken when the provider was created;
    /// cleared by `reset_credentials`.
    settings: Option<AmazonBedrockSettings>,
    /// Whether `credentials` came from the `ZED_AWS_CREDENTIALS` environment variable.
    credentials_from_env: bool,
    /// Keeps the `SettingsStore` observation alive for as long as the state exists.
    _subscription: Subscription,
}
148
149impl State {
150 fn reset_credentials(&self, cx: &mut Context<Self>) -> Task<Result<()>> {
151 let credentials_provider = <dyn CredentialsProvider>::global(cx);
152 cx.spawn(async move |this, cx| {
153 credentials_provider
154 .delete_credentials(AMAZON_AWS_URL, &cx)
155 .await
156 .log_err();
157 this.update(cx, |this, cx| {
158 this.credentials = None;
159 this.credentials_from_env = false;
160 this.settings = None;
161 cx.notify();
162 })
163 })
164 }
165
166 fn set_credentials(
167 &mut self,
168 credentials: BedrockCredentials,
169 cx: &mut Context<Self>,
170 ) -> Task<Result<()>> {
171 let credentials_provider = <dyn CredentialsProvider>::global(cx);
172 cx.spawn(async move |this, cx| {
173 credentials_provider
174 .write_credentials(
175 AMAZON_AWS_URL,
176 "Bearer",
177 &serde_json::to_vec(&credentials)?,
178 &cx,
179 )
180 .await?;
181 this.update(cx, |this, cx| {
182 this.credentials = Some(credentials);
183 cx.notify();
184 })
185 })
186 }
187
188 fn is_authenticated(&self) -> bool {
189 let derived = self
190 .settings
191 .as_ref()
192 .and_then(|s| s.authentication_method.as_ref());
193 let creds = self.credentials.as_ref();
194
195 derived.is_some() || creds.is_some()
196 }
197
198 fn authenticate(&self, cx: &mut Context<Self>) -> Task<Result<(), AuthenticateError>> {
199 if self.is_authenticated() {
200 return Task::ready(Ok(()));
201 }
202
203 let credentials_provider = <dyn CredentialsProvider>::global(cx);
204 cx.spawn(async move |this, cx| {
205 let (credentials, from_env) =
206 if let Ok(credentials) = std::env::var(ZED_AWS_CREDENTIALS_VAR) {
207 (credentials, true)
208 } else {
209 let (_, credentials) = credentials_provider
210 .read_credentials(AMAZON_AWS_URL, &cx)
211 .await?
212 .ok_or_else(|| AuthenticateError::CredentialsNotFound)?;
213 (
214 String::from_utf8(credentials)
215 .context("invalid {PROVIDER_NAME} credentials")?,
216 false,
217 )
218 };
219
220 let credentials: BedrockCredentials =
221 serde_json::from_str(&credentials).context("failed to parse credentials")?;
222
223 this.update(cx, |this, cx| {
224 this.credentials = Some(credentials);
225 this.credentials_from_env = from_env;
226 cx.notify();
227 })?;
228
229 Ok(())
230 })
231 }
232
233 fn get_region(&self) -> String {
234 // Get region - from credentials or directly from settings
235 let credentials_region = self.credentials.as_ref().map(|s| s.region.clone());
236 let settings_region = self.settings.as_ref().and_then(|s| s.region.clone());
237
238 // Use credentials region if available, otherwise use settings region, finally fall back to default
239 credentials_region
240 .or(settings_region)
241 .unwrap_or(String::from("us-east-1"))
242 }
243}
244
/// Language-model provider backed by Amazon Bedrock.
pub struct BedrockLanguageModelProvider {
    /// HTTP client adapter handed to the AWS SDK configuration.
    http_client: AwsHttpClient,
    /// Handle to the Tokio runtime; cloned into every model created by this provider.
    handler: tokio::runtime::Handle,
    /// Authentication state shared with every model and the configuration view.
    state: gpui::Entity<State>,
}
250
251impl BedrockLanguageModelProvider {
252 pub fn new(http_client: Arc<dyn HttpClient>, cx: &mut App) -> Self {
253 let state = cx.new(|cx| State {
254 credentials: None,
255 settings: Some(AllLanguageModelSettings::get_global(cx).bedrock.clone()),
256 credentials_from_env: false,
257 _subscription: cx.observe_global::<SettingsStore>(|_, cx| {
258 cx.notify();
259 }),
260 });
261
262 let tokio_handle = Tokio::handle(cx);
263
264 let coerced_client = AwsHttpClient::new(http_client.clone(), tokio_handle.clone());
265
266 Self {
267 http_client: coerced_client,
268 handler: tokio_handle.clone(),
269 state,
270 }
271 }
272
273 fn create_language_model(&self, model: bedrock::Model) -> Arc<dyn LanguageModel> {
274 Arc::new(BedrockModel {
275 id: LanguageModelId::from(model.id().to_string()),
276 model,
277 http_client: self.http_client.clone(),
278 handler: self.handler.clone(),
279 state: self.state.clone(),
280 client: OnceCell::new(),
281 request_limiter: RateLimiter::new(4),
282 })
283 }
284}
285
286impl LanguageModelProvider for BedrockLanguageModelProvider {
287 fn id(&self) -> LanguageModelProviderId {
288 LanguageModelProviderId(PROVIDER_ID.into())
289 }
290
291 fn name(&self) -> LanguageModelProviderName {
292 LanguageModelProviderName(PROVIDER_NAME.into())
293 }
294
295 fn icon(&self) -> IconName {
296 IconName::AiBedrock
297 }
298
299 fn default_model(&self, _cx: &App) -> Option<Arc<dyn LanguageModel>> {
300 Some(self.create_language_model(bedrock::Model::default()))
301 }
302
303 fn default_fast_model(&self, cx: &App) -> Option<Arc<dyn LanguageModel>> {
304 let region = self.state.read(cx).get_region();
305 Some(self.create_language_model(bedrock::Model::default_fast(region.as_str())))
306 }
307
308 fn provided_models(&self, cx: &App) -> Vec<Arc<dyn LanguageModel>> {
309 let mut models = BTreeMap::default();
310
311 for model in bedrock::Model::iter() {
312 if !matches!(model, bedrock::Model::Custom { .. }) {
313 // TODO: Sonnet 3.7 vs. 3.7 Thinking bug is here.
314 models.insert(model.id().to_string(), model);
315 }
316 }
317
318 // Override with available models from settings
319 for model in AllLanguageModelSettings::get_global(cx)
320 .bedrock
321 .available_models
322 .iter()
323 {
324 models.insert(
325 model.name.clone(),
326 bedrock::Model::Custom {
327 name: model.name.clone(),
328 display_name: model.display_name.clone(),
329 max_tokens: model.max_tokens,
330 max_output_tokens: model.max_output_tokens,
331 default_temperature: model.default_temperature,
332 },
333 );
334 }
335
336 models
337 .into_values()
338 .map(|model| self.create_language_model(model))
339 .collect()
340 }
341
342 fn is_authenticated(&self, cx: &App) -> bool {
343 self.state.read(cx).is_authenticated()
344 }
345
346 fn authenticate(&self, cx: &mut App) -> Task<Result<(), AuthenticateError>> {
347 self.state.update(cx, |state, cx| state.authenticate(cx))
348 }
349
350 fn configuration_view(&self, window: &mut Window, cx: &mut App) -> AnyView {
351 cx.new(|cx| ConfigurationView::new(self.state.clone(), window, cx))
352 .into()
353 }
354
355 fn reset_credentials(&self, cx: &mut App) -> Task<Result<()>> {
356 self.state
357 .update(cx, |state, cx| state.reset_credentials(cx))
358 }
359}
360
361impl LanguageModelProviderState for BedrockLanguageModelProvider {
362 type ObservableEntity = State;
363
364 fn observable_entity(&self) -> Option<gpui::Entity<Self::ObservableEntity>> {
365 Some(self.state.clone())
366 }
367}
368
/// A single Bedrock model exposed through the `LanguageModel` trait.
struct BedrockModel {
    /// Model id derived from `model.id()` when the model was created.
    id: LanguageModelId,
    /// The underlying Bedrock model description.
    model: Model,
    /// HTTP client adapter passed to the AWS SDK configuration.
    http_client: AwsHttpClient,
    /// Tokio runtime handle used to load the AWS config and to drive streaming.
    handler: tokio::runtime::Handle,
    /// Lazily initialized Bedrock client; built on first use from the state at that time.
    client: OnceCell<BedrockClient>,
    /// Shared authentication state.
    state: gpui::Entity<State>,
    /// Rate limiter wrapped around streaming completion requests.
    request_limiter: RateLimiter,
}
378
379impl BedrockModel {
380 fn get_or_init_client(&self, cx: &AsyncApp) -> anyhow::Result<&BedrockClient> {
381 self.client
382 .get_or_try_init_blocking(|| {
383 let (auth_method, credentials, endpoint, region, settings) =
384 cx.read_entity(&self.state, |state, _cx| {
385 let auth_method = state
386 .settings
387 .as_ref()
388 .and_then(|s| s.authentication_method.clone());
389
390 let endpoint = state.settings.as_ref().and_then(|s| s.endpoint.clone());
391
392 let region = state.get_region();
393
394 (
395 auth_method,
396 state.credentials.clone(),
397 endpoint,
398 region,
399 state.settings.clone(),
400 )
401 })?;
402
403 let mut config_builder = aws_config::defaults(BehaviorVersion::latest())
404 .stalled_stream_protection(StalledStreamProtectionConfig::disabled())
405 .http_client(self.http_client.clone())
406 .region(Region::new(region))
407 .timeout_config(TimeoutConfig::disabled());
408
409 if let Some(endpoint_url) = endpoint {
410 if !endpoint_url.is_empty() {
411 config_builder = config_builder.endpoint_url(endpoint_url);
412 }
413 }
414
415 match auth_method {
416 None => {
417 if let Some(creds) = credentials {
418 let aws_creds = Credentials::new(
419 creds.access_key_id,
420 creds.secret_access_key,
421 creds.session_token,
422 None,
423 "zed-bedrock-provider",
424 );
425 config_builder = config_builder.credentials_provider(aws_creds);
426 }
427 }
428 Some(BedrockAuthMethod::NamedProfile)
429 | Some(BedrockAuthMethod::SingleSignOn) => {
430 // Currently NamedProfile and SSO behave the same way but only the instructions change
431 // Until we support BearerAuth through SSO, this will not change.
432 let profile_name = settings
433 .and_then(|s| s.profile_name)
434 .unwrap_or_else(|| "default".to_string());
435
436 if !profile_name.is_empty() {
437 config_builder = config_builder.profile_name(profile_name);
438 }
439 }
440 Some(BedrockAuthMethod::Automatic) => {
441 // Use default credential provider chain
442 }
443 }
444
445 let config = self.handler.block_on(config_builder.load());
446 anyhow::Ok(BedrockClient::new(&config))
447 })
448 .context("initializing Bedrock client")?;
449
450 self.client.get().context("Bedrock client not initialized")
451 }
452
453 fn stream_completion(
454 &self,
455 request: bedrock::Request,
456 cx: &AsyncApp,
457 ) -> Result<
458 BoxFuture<'static, BoxStream<'static, Result<BedrockStreamingResponse, BedrockError>>>,
459 > {
460 let runtime_client = self
461 .get_or_init_client(cx)
462 .cloned()
463 .context("Bedrock client not initialized")?;
464 let owned_handle = self.handler.clone();
465
466 Ok(async move {
467 let request = bedrock::stream_completion(runtime_client, request, owned_handle);
468 request.await.unwrap_or_else(|e| {
469 futures::stream::once(async move { Err(BedrockError::ClientError(e)) }).boxed()
470 })
471 }
472 .boxed())
473 }
474}
475
476impl LanguageModel for BedrockModel {
477 fn id(&self) -> LanguageModelId {
478 self.id.clone()
479 }
480
481 fn name(&self) -> LanguageModelName {
482 LanguageModelName::from(self.model.display_name().to_string())
483 }
484
485 fn provider_id(&self) -> LanguageModelProviderId {
486 LanguageModelProviderId(PROVIDER_ID.into())
487 }
488
489 fn provider_name(&self) -> LanguageModelProviderName {
490 LanguageModelProviderName(PROVIDER_NAME.into())
491 }
492
493 fn supports_tools(&self) -> bool {
494 self.model.supports_tool_use()
495 }
496
497 fn supports_images(&self) -> bool {
498 false
499 }
500
501 fn supports_tool_choice(&self, choice: LanguageModelToolChoice) -> bool {
502 match choice {
503 LanguageModelToolChoice::Auto | LanguageModelToolChoice::Any => {
504 self.model.supports_tool_use()
505 }
506 LanguageModelToolChoice::None => false,
507 }
508 }
509
510 fn telemetry_id(&self) -> String {
511 format!("bedrock/{}", self.model.id())
512 }
513
514 fn max_token_count(&self) -> u64 {
515 self.model.max_token_count()
516 }
517
518 fn max_output_tokens(&self) -> Option<u64> {
519 Some(self.model.max_output_tokens())
520 }
521
522 fn count_tokens(
523 &self,
524 request: LanguageModelRequest,
525 cx: &App,
526 ) -> BoxFuture<'static, Result<u64>> {
527 get_bedrock_tokens(request, cx)
528 }
529
530 fn stream_completion(
531 &self,
532 request: LanguageModelRequest,
533 cx: &AsyncApp,
534 ) -> BoxFuture<
535 'static,
536 Result<
537 BoxStream<'static, Result<LanguageModelCompletionEvent, LanguageModelCompletionError>>,
538 LanguageModelCompletionError,
539 >,
540 > {
541 let Ok(region) = cx.read_entity(&self.state, |state, _cx| state.get_region()) else {
542 return async move { Err(anyhow::anyhow!("App State Dropped").into()) }.boxed();
543 };
544
545 let model_id = match self.model.cross_region_inference_id(®ion) {
546 Ok(s) => s,
547 Err(e) => {
548 return async move { Err(e.into()) }.boxed();
549 }
550 };
551
552 let request = match into_bedrock(
553 request,
554 model_id,
555 self.model.default_temperature(),
556 self.model.max_output_tokens(),
557 self.model.mode(),
558 ) {
559 Ok(request) => request,
560 Err(err) => return futures::future::ready(Err(err.into())).boxed(),
561 };
562
563 let owned_handle = self.handler.clone();
564
565 let request = self.stream_completion(request, cx);
566 let future = self.request_limiter.stream(async move {
567 let response = request.map_err(|err| anyhow!(err))?.await;
568 Ok(map_to_language_model_completion_events(
569 response,
570 owned_handle,
571 ))
572 });
573 async move { Ok(future.await?.boxed()) }.boxed()
574 }
575
576 fn cache_configuration(&self) -> Option<LanguageModelCacheConfiguration> {
577 None
578 }
579}
580
581pub fn into_bedrock(
582 request: LanguageModelRequest,
583 model: String,
584 default_temperature: f32,
585 max_output_tokens: u64,
586 mode: BedrockModelMode,
587) -> Result<bedrock::Request> {
588 let mut new_messages: Vec<BedrockMessage> = Vec::new();
589 let mut system_message = String::new();
590
591 for message in request.messages {
592 if message.contents_empty() {
593 continue;
594 }
595
596 match message.role {
597 Role::User | Role::Assistant => {
598 let bedrock_message_content: Vec<BedrockInnerContent> = message
599 .content
600 .into_iter()
601 .filter_map(|content| match content {
602 MessageContent::Text(text) => {
603 if !text.is_empty() {
604 Some(BedrockInnerContent::Text(text))
605 } else {
606 None
607 }
608 }
609 MessageContent::Thinking { text, signature } => {
610 let thinking = BedrockThinkingTextBlock::builder()
611 .text(text)
612 .set_signature(signature)
613 .build()
614 .context("failed to build reasoning block")
615 .log_err()?;
616
617 Some(BedrockInnerContent::ReasoningContent(
618 BedrockThinkingBlock::ReasoningText(thinking),
619 ))
620 }
621 MessageContent::RedactedThinking(blob) => {
622 let redacted =
623 BedrockThinkingBlock::RedactedContent(BedrockBlob::new(blob));
624
625 Some(BedrockInnerContent::ReasoningContent(redacted))
626 }
627 MessageContent::ToolUse(tool_use) => BedrockToolUseBlock::builder()
628 .name(tool_use.name.to_string())
629 .tool_use_id(tool_use.id.to_string())
630 .input(value_to_aws_document(&tool_use.input))
631 .build()
632 .context("failed to build Bedrock tool use block")
633 .log_err()
634 .map(BedrockInnerContent::ToolUse),
635 MessageContent::ToolResult(tool_result) => {
636 BedrockToolResultBlock::builder()
637 .tool_use_id(tool_result.tool_use_id.to_string())
638 .content(match tool_result.content {
639 LanguageModelToolResultContent::Text(text) => {
640 BedrockToolResultContentBlock::Text(text.to_string())
641 }
642 LanguageModelToolResultContent::Image(_) => {
643 BedrockToolResultContentBlock::Text(
644 // TODO: Bedrock image support
645 "[Tool responded with an image, but Zed doesn't support these in Bedrock models yet]".to_string()
646 )
647 }
648 })
649 .status({
650 if tool_result.is_error {
651 BedrockToolResultStatus::Error
652 } else {
653 BedrockToolResultStatus::Success
654 }
655 })
656 .build()
657 .context("failed to build Bedrock tool result block")
658 .log_err()
659 .map(BedrockInnerContent::ToolResult)
660 }
661 _ => None,
662 })
663 .collect();
664 let bedrock_role = match message.role {
665 Role::User => bedrock::BedrockRole::User,
666 Role::Assistant => bedrock::BedrockRole::Assistant,
667 Role::System => unreachable!("System role should never occur here"),
668 };
669 if let Some(last_message) = new_messages.last_mut() {
670 if last_message.role == bedrock_role {
671 last_message.content.extend(bedrock_message_content);
672 continue;
673 }
674 }
675 new_messages.push(
676 BedrockMessage::builder()
677 .role(bedrock_role)
678 .set_content(Some(bedrock_message_content))
679 .build()
680 .context("failed to build Bedrock message")?,
681 );
682 }
683 Role::System => {
684 if !system_message.is_empty() {
685 system_message.push_str("\n\n");
686 }
687 system_message.push_str(&message.string_contents());
688 }
689 }
690 }
691
692 let tool_spec: Vec<BedrockTool> = request
693 .tools
694 .iter()
695 .filter_map(|tool| {
696 Some(BedrockTool::ToolSpec(
697 BedrockToolSpec::builder()
698 .name(tool.name.clone())
699 .description(tool.description.clone())
700 .input_schema(BedrockToolInputSchema::Json(value_to_aws_document(
701 &tool.input_schema,
702 )))
703 .build()
704 .log_err()?,
705 ))
706 })
707 .collect();
708
709 let tool_choice = match request.tool_choice {
710 Some(LanguageModelToolChoice::Auto) | None => {
711 BedrockToolChoice::Auto(BedrockAutoToolChoice::builder().build())
712 }
713 Some(LanguageModelToolChoice::Any) => {
714 BedrockToolChoice::Any(BedrockAnyToolChoice::builder().build())
715 }
716 Some(LanguageModelToolChoice::None) => {
717 anyhow::bail!("LanguageModelToolChoice::None is not supported");
718 }
719 };
720 let tool_config: BedrockToolConfig = BedrockToolConfig::builder()
721 .set_tools(Some(tool_spec))
722 .tool_choice(tool_choice)
723 .build()?;
724
725 Ok(bedrock::Request {
726 model,
727 messages: new_messages,
728 max_tokens: max_output_tokens,
729 system: Some(system_message),
730 tools: Some(tool_config),
731 thinking: if let BedrockModelMode::Thinking { budget_tokens } = mode {
732 Some(bedrock::Thinking::Enabled { budget_tokens })
733 } else {
734 None
735 },
736 metadata: None,
737 stop_sequences: Vec::new(),
738 temperature: request.temperature.or(Some(default_temperature)),
739 top_k: None,
740 top_p: None,
741 })
742}
743
744// TODO: just call the ConverseOutput.usage() method:
745// https://docs.rs/aws-sdk-bedrockruntime/latest/aws_sdk_bedrockruntime/operation/converse/struct.ConverseOutput.html#method.output
746pub fn get_bedrock_tokens(
747 request: LanguageModelRequest,
748 cx: &App,
749) -> BoxFuture<'static, Result<u64>> {
750 cx.background_executor()
751 .spawn(async move {
752 let messages = request.messages;
753 let mut tokens_from_images = 0;
754 let mut string_messages = Vec::with_capacity(messages.len());
755
756 for message in messages {
757 use language_model::MessageContent;
758
759 let mut string_contents = String::new();
760
761 for content in message.content {
762 match content {
763 MessageContent::Text(text) | MessageContent::Thinking { text, .. } => {
764 string_contents.push_str(&text);
765 }
766 MessageContent::RedactedThinking(_) => {}
767 MessageContent::Image(image) => {
768 tokens_from_images += image.estimate_tokens();
769 }
770 MessageContent::ToolUse(_tool_use) => {
771 // TODO: Estimate token usage from tool uses.
772 }
773 MessageContent::ToolResult(tool_result) => match tool_result.content {
774 LanguageModelToolResultContent::Text(text) => {
775 string_contents.push_str(&text);
776 }
777 LanguageModelToolResultContent::Image(image) => {
778 tokens_from_images += image.estimate_tokens();
779 }
780 },
781 }
782 }
783
784 if !string_contents.is_empty() {
785 string_messages.push(tiktoken_rs::ChatCompletionRequestMessage {
786 role: match message.role {
787 Role::User => "user".into(),
788 Role::Assistant => "assistant".into(),
789 Role::System => "system".into(),
790 },
791 content: Some(string_contents),
792 name: None,
793 function_call: None,
794 });
795 }
796 }
797
798 // Tiktoken doesn't yet support these models, so we manually use the
799 // same tokenizer as GPT-4.
800 tiktoken_rs::num_tokens_from_messages("gpt-4", &string_messages)
801 .map(|tokens| (tokens + tokens_from_images) as u64)
802 })
803 .boxed()
804}
805
806pub fn map_to_language_model_completion_events(
807 events: Pin<Box<dyn Send + Stream<Item = Result<BedrockStreamingResponse, BedrockError>>>>,
808 handle: Handle,
809) -> impl Stream<Item = Result<LanguageModelCompletionEvent, LanguageModelCompletionError>> {
810 struct RawToolUse {
811 id: String,
812 name: String,
813 input_json: String,
814 }
815
816 struct State {
817 events: Pin<Box<dyn Send + Stream<Item = Result<BedrockStreamingResponse, BedrockError>>>>,
818 tool_uses_by_index: HashMap<i32, RawToolUse>,
819 }
820
821 futures::stream::unfold(
822 State {
823 events,
824 tool_uses_by_index: HashMap::default(),
825 },
826 move |mut state: State| {
827 let inner_handle = handle.clone();
828 async move {
829 inner_handle
830 .spawn(async {
831 while let Some(event) = state.events.next().await {
832 match event {
833 Ok(event) => match event {
834 ConverseStreamOutput::ContentBlockDelta(cb_delta) => {
835 match cb_delta.delta {
836 Some(ContentBlockDelta::Text(text_out)) => {
837 let completion_event =
838 LanguageModelCompletionEvent::Text(text_out);
839 return Some((Some(Ok(completion_event)), state));
840 }
841
842 Some(ContentBlockDelta::ToolUse(text_out)) => {
843 if let Some(tool_use) = state
844 .tool_uses_by_index
845 .get_mut(&cb_delta.content_block_index)
846 {
847 tool_use.input_json.push_str(text_out.input());
848 }
849 }
850
851 Some(ContentBlockDelta::ReasoningContent(thinking)) => {
852 match thinking {
853 ReasoningContentBlockDelta::RedactedContent(
854 redacted,
855 ) => {
856 let thinking_event =
857 LanguageModelCompletionEvent::Thinking {
858 text: String::from_utf8(
859 redacted.into_inner(),
860 )
861 .unwrap_or("REDACTED".to_string()),
862 signature: None,
863 };
864
865 return Some((
866 Some(Ok(thinking_event)),
867 state,
868 ));
869 }
870 ReasoningContentBlockDelta::Signature(
871 signature,
872 ) => {
873 return Some((
874 Some(Ok(LanguageModelCompletionEvent::Thinking {
875 text: "".to_string(),
876 signature: Some(signature)
877 })),
878 state,
879 ));
880 }
881 ReasoningContentBlockDelta::Text(thoughts) => {
882 let thinking_event =
883 LanguageModelCompletionEvent::Thinking {
884 text: thoughts.to_string(),
885 signature: None
886 };
887
888 return Some((
889 Some(Ok(thinking_event)),
890 state,
891 ));
892 }
893 _ => {}
894 }
895 }
896 _ => {}
897 }
898 }
899 ConverseStreamOutput::ContentBlockStart(cb_start) => {
900 if let Some(ContentBlockStart::ToolUse(text_out)) =
901 cb_start.start
902 {
903 let tool_use = RawToolUse {
904 id: text_out.tool_use_id,
905 name: text_out.name,
906 input_json: String::new(),
907 };
908
909 state
910 .tool_uses_by_index
911 .insert(cb_start.content_block_index, tool_use);
912 }
913 }
914 ConverseStreamOutput::ContentBlockStop(cb_stop) => {
915 if let Some(tool_use) = state
916 .tool_uses_by_index
917 .remove(&cb_stop.content_block_index)
918 {
919 let tool_use_event = LanguageModelToolUse {
920 id: tool_use.id.into(),
921 name: tool_use.name.into(),
922 is_input_complete: true,
923 raw_input: tool_use.input_json.clone(),
924 input: if tool_use.input_json.is_empty() {
925 Value::Null
926 } else {
927 serde_json::Value::from_str(
928 &tool_use.input_json,
929 )
930 .map_err(|err| anyhow!(err))
931 .unwrap()
932 },
933 };
934
935 return Some((
936 Some(Ok(LanguageModelCompletionEvent::ToolUse(
937 tool_use_event,
938 ))),
939 state,
940 ));
941 }
942 }
943
944 ConverseStreamOutput::Metadata(cb_meta) => {
945 if let Some(metadata) = cb_meta.usage {
946 let completion_event =
947 LanguageModelCompletionEvent::UsageUpdate(
948 TokenUsage {
949 input_tokens: metadata.input_tokens as u64,
950 output_tokens: metadata.output_tokens
951 as u64,
952 cache_creation_input_tokens: default(),
953 cache_read_input_tokens: default(),
954 },
955 );
956 return Some((Some(Ok(completion_event)), state));
957 }
958 }
959 ConverseStreamOutput::MessageStop(message_stop) => {
960 let reason = match message_stop.stop_reason {
961 StopReason::ContentFiltered => {
962 LanguageModelCompletionEvent::Stop(
963 language_model::StopReason::EndTurn,
964 )
965 }
966 StopReason::EndTurn => {
967 LanguageModelCompletionEvent::Stop(
968 language_model::StopReason::EndTurn,
969 )
970 }
971 StopReason::GuardrailIntervened => {
972 LanguageModelCompletionEvent::Stop(
973 language_model::StopReason::EndTurn,
974 )
975 }
976 StopReason::MaxTokens => {
977 LanguageModelCompletionEvent::Stop(
978 language_model::StopReason::EndTurn,
979 )
980 }
981 StopReason::StopSequence => {
982 LanguageModelCompletionEvent::Stop(
983 language_model::StopReason::EndTurn,
984 )
985 }
986 StopReason::ToolUse => {
987 LanguageModelCompletionEvent::Stop(
988 language_model::StopReason::ToolUse,
989 )
990 }
991 _ => LanguageModelCompletionEvent::Stop(
992 language_model::StopReason::EndTurn,
993 ),
994 };
995 return Some((Some(Ok(reason)), state));
996 }
997 _ => {}
998 },
999
1000 Err(err) => return Some((Some(Err(anyhow!(err).into())), state)),
1001 }
1002 }
1003 None
1004 })
1005 .await
1006 .log_err()
1007 .flatten()
1008 }
1009 },
1010 )
1011 .filter_map(|event| async move { event })
1012}
1013
/// Settings UI for entering static AWS credentials for the Bedrock provider.
struct ConfigurationView {
    /// Single-line editor for the AWS access key id.
    access_key_id_editor: Entity<Editor>,
    /// Single-line editor for the AWS secret access key.
    secret_access_key_editor: Entity<Editor>,
    /// Single-line editor for the optional session token.
    session_token_editor: Entity<Editor>,
    /// Single-line editor for the region; an empty value is saved as `us-east-1`.
    region_editor: Entity<Editor>,
    /// Shared provider state that this view observes and updates.
    state: gpui::Entity<State>,
    /// `Some` while the initial authentication attempt is running; reset to
    /// `None` once it has finished.
    load_credentials_task: Option<Task<()>>,
}
1022
1023impl ConfigurationView {
    // Placeholder texts shown in the corresponding (empty) credential editors.
    const PLACEHOLDER_ACCESS_KEY_ID_TEXT: &'static str = "XXXXXXXXXXXXXXXX";
    const PLACEHOLDER_SECRET_ACCESS_KEY_TEXT: &'static str =
        "XXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXX";
    const PLACEHOLDER_SESSION_TOKEN_TEXT: &'static str = "XXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXXX";
    const PLACEHOLDER_REGION: &'static str = "us-east-1";
1029
1030 fn new(state: gpui::Entity<State>, window: &mut Window, cx: &mut Context<Self>) -> Self {
1031 cx.observe(&state, |_, _, cx| {
1032 cx.notify();
1033 })
1034 .detach();
1035
1036 let load_credentials_task = Some(cx.spawn({
1037 let state = state.clone();
1038 async move |this, cx| {
1039 if let Some(task) = state
1040 .update(cx, |state, cx| state.authenticate(cx))
1041 .log_err()
1042 {
1043 // We don't log an error, because "not signed in" is also an error.
1044 let _ = task.await;
1045 }
1046 this.update(cx, |this, cx| {
1047 this.load_credentials_task = None;
1048 cx.notify();
1049 })
1050 .log_err();
1051 }
1052 }));
1053
1054 Self {
1055 access_key_id_editor: cx.new(|cx| {
1056 let mut editor = Editor::single_line(window, cx);
1057 editor.set_placeholder_text(Self::PLACEHOLDER_ACCESS_KEY_ID_TEXT, cx);
1058 editor
1059 }),
1060 secret_access_key_editor: cx.new(|cx| {
1061 let mut editor = Editor::single_line(window, cx);
1062 editor.set_placeholder_text(Self::PLACEHOLDER_SECRET_ACCESS_KEY_TEXT, cx);
1063 editor
1064 }),
1065 session_token_editor: cx.new(|cx| {
1066 let mut editor = Editor::single_line(window, cx);
1067 editor.set_placeholder_text(Self::PLACEHOLDER_SESSION_TOKEN_TEXT, cx);
1068 editor
1069 }),
1070 region_editor: cx.new(|cx| {
1071 let mut editor = Editor::single_line(window, cx);
1072 editor.set_placeholder_text(Self::PLACEHOLDER_REGION, cx);
1073 editor
1074 }),
1075 state,
1076 load_credentials_task,
1077 }
1078 }
1079
1080 fn save_credentials(
1081 &mut self,
1082 _: &menu::Confirm,
1083 _window: &mut Window,
1084 cx: &mut Context<Self>,
1085 ) {
1086 let access_key_id = self
1087 .access_key_id_editor
1088 .read(cx)
1089 .text(cx)
1090 .to_string()
1091 .trim()
1092 .to_string();
1093 let secret_access_key = self
1094 .secret_access_key_editor
1095 .read(cx)
1096 .text(cx)
1097 .to_string()
1098 .trim()
1099 .to_string();
1100 let session_token = self
1101 .session_token_editor
1102 .read(cx)
1103 .text(cx)
1104 .to_string()
1105 .trim()
1106 .to_string();
1107 let session_token = if session_token.is_empty() {
1108 None
1109 } else {
1110 Some(session_token)
1111 };
1112 let region = self
1113 .region_editor
1114 .read(cx)
1115 .text(cx)
1116 .to_string()
1117 .trim()
1118 .to_string();
1119 let region = if region.is_empty() {
1120 "us-east-1".to_string()
1121 } else {
1122 region
1123 };
1124
1125 let state = self.state.clone();
1126 cx.spawn(async move |_, cx| {
1127 state
1128 .update(cx, |state, cx| {
1129 let credentials: BedrockCredentials = BedrockCredentials {
1130 region: region.clone(),
1131 access_key_id: access_key_id.clone(),
1132 secret_access_key: secret_access_key.clone(),
1133 session_token: session_token.clone(),
1134 };
1135
1136 state.set_credentials(credentials, cx)
1137 })?
1138 .await
1139 })
1140 .detach_and_log_err(cx);
1141 }
1142
1143 fn reset_credentials(&mut self, window: &mut Window, cx: &mut Context<Self>) {
1144 self.access_key_id_editor
1145 .update(cx, |editor, cx| editor.set_text("", window, cx));
1146 self.secret_access_key_editor
1147 .update(cx, |editor, cx| editor.set_text("", window, cx));
1148 self.session_token_editor
1149 .update(cx, |editor, cx| editor.set_text("", window, cx));
1150 self.region_editor
1151 .update(cx, |editor, cx| editor.set_text("", window, cx));
1152
1153 let state = self.state.clone();
1154 cx.spawn(async move |_, cx| {
1155 state
1156 .update(cx, |state, cx| state.reset_credentials(cx))?
1157 .await
1158 })
1159 .detach_and_log_err(cx);
1160 }
1161
1162 fn make_text_style(&self, cx: &Context<Self>) -> TextStyle {
1163 let settings = ThemeSettings::get_global(cx);
1164 TextStyle {
1165 color: cx.theme().colors().text,
1166 font_family: settings.ui_font.family.clone(),
1167 font_features: settings.ui_font.features.clone(),
1168 font_fallbacks: settings.ui_font.fallbacks.clone(),
1169 font_size: rems(0.875).into(),
1170 font_weight: settings.ui_font.weight,
1171 font_style: FontStyle::Normal,
1172 line_height: relative(1.3),
1173 background_color: None,
1174 underline: None,
1175 strikethrough: None,
1176 white_space: WhiteSpace::Normal,
1177 text_overflow: None,
1178 text_align: Default::default(),
1179 line_clamp: None,
1180 }
1181 }
1182
1183 fn make_input_styles(&self, cx: &Context<Self>) -> Div {
1184 let bg_color = cx.theme().colors().editor_background;
1185 let border_color = cx.theme().colors().border;
1186
1187 h_flex()
1188 .w_full()
1189 .px_2()
1190 .py_1()
1191 .bg(bg_color)
1192 .border_1()
1193 .border_color(border_color)
1194 .rounded_sm()
1195 }
1196
1197 fn should_render_editor(&self, cx: &Context<Self>) -> bool {
1198 self.state.read(cx).is_authenticated()
1199 }
1200}
1201
1202impl Render for ConfigurationView {
1203 fn render(&mut self, _window: &mut Window, cx: &mut Context<Self>) -> impl IntoElement {
1204 let env_var_set = self.state.read(cx).credentials_from_env;
1205 let bedrock_settings = self.state.read(cx).settings.as_ref();
1206 let bedrock_method = bedrock_settings
1207 .as_ref()
1208 .and_then(|s| s.authentication_method.clone());
1209
1210 if self.load_credentials_task.is_some() {
1211 return div().child(Label::new("Loading credentials...")).into_any();
1212 }
1213
1214 if self.should_render_editor(cx) {
1215 return h_flex()
1216 .mt_1()
1217 .p_1()
1218 .justify_between()
1219 .rounded_md()
1220 .border_1()
1221 .border_color(cx.theme().colors().border)
1222 .bg(cx.theme().colors().background)
1223 .child(
1224 h_flex()
1225 .gap_1()
1226 .child(Icon::new(IconName::Check).color(Color::Success))
1227 .child(Label::new(if env_var_set {
1228 format!("Access Key ID is set in {ZED_BEDROCK_ACCESS_KEY_ID_VAR}, Secret Key is set in {ZED_BEDROCK_SECRET_ACCESS_KEY_VAR}, Region is set in {ZED_BEDROCK_REGION_VAR} environment variables.")
1229 } else {
1230 match bedrock_method {
1231 Some(BedrockAuthMethod::Automatic) => "You are using automatic credentials".into(),
1232 Some(BedrockAuthMethod::NamedProfile) => {
1233 "You are using named profile".into()
1234 },
1235 Some(BedrockAuthMethod::SingleSignOn) => "You are using a single sign on profile".into(),
1236 None => "You are using static credentials".into(),
1237 }
1238 })),
1239 )
1240 .child(
1241 Button::new("reset-key", "Reset Key")
1242 .icon(Some(IconName::Trash))
1243 .icon_size(IconSize::Small)
1244 .icon_position(IconPosition::Start)
1245 .disabled(env_var_set || bedrock_method.is_some())
1246 .when(env_var_set, |this| {
1247 this.tooltip(Tooltip::text(format!("To reset your credentials, unset the {ZED_BEDROCK_ACCESS_KEY_ID_VAR}, {ZED_BEDROCK_SECRET_ACCESS_KEY_VAR}, and {ZED_BEDROCK_REGION_VAR} environment variables.")))
1248 })
1249 .when(bedrock_method.is_some(), |this| {
1250 this.tooltip(Tooltip::text("You cannot reset credentials as they're being derived, check Zed settings to understand how"))
1251 })
1252 .on_click(cx.listener(|this, _, window, cx| this.reset_credentials(window, cx))),
1253 )
1254 .into_any();
1255 }
1256
1257 v_flex()
1258 .size_full()
1259 .on_action(cx.listener(ConfigurationView::save_credentials))
1260 .child(Label::new("To use Zed's assistant with Bedrock, you can set a custom authentication strategy through the settings.json, or use static credentials."))
1261 .child(Label::new("But, to access models on AWS, you need to:").mt_1())
1262 .child(
1263 List::new()
1264 .child(
1265 InstructionListItem::new(
1266 "Grant permissions to the strategy you'll use according to the:",
1267 Some("Prerequisites"),
1268 Some("https://docs.aws.amazon.com/bedrock/latest/userguide/inference-prereq.html"),
1269 )
1270 )
1271 .child(
1272 InstructionListItem::new(
1273 "Select the models you would like access to:",
1274 Some("Bedrock Model Catalog"),
1275 Some("https://us-east-1.console.aws.amazon.com/bedrock/home?region=us-east-1#/modelaccess"),
1276 )
1277 )
1278 )
1279 .child(self.render_static_credentials_ui(cx))
1280 .child(self.render_common_fields(cx))
1281 .child(
1282 Label::new(
1283 format!("You can also assign the {ZED_BEDROCK_ACCESS_KEY_ID_VAR}, {ZED_BEDROCK_SECRET_ACCESS_KEY_VAR} AND {ZED_BEDROCK_REGION_VAR} environment variables and restart Zed."),
1284 )
1285 .size(LabelSize::Small)
1286 .color(Color::Muted)
1287 .my_1(),
1288 )
1289 .child(
1290 Label::new(
1291 format!("Optionally, if your environment uses AWS CLI profiles, you can set {ZED_AWS_PROFILE_VAR}; if it requires a custom endpoint, you can set {ZED_AWS_ENDPOINT_VAR}; and if it requires a Session Token, you can set {ZED_BEDROCK_SESSION_TOKEN_VAR}."),
1292 )
1293 .size(LabelSize::Small)
1294 .color(Color::Muted),
1295 )
1296 .into_any()
1297 }
1298}
1299
1300impl ConfigurationView {
1301 fn render_access_key_id_editor(&self, cx: &mut Context<Self>) -> impl IntoElement {
1302 let text_style = self.make_text_style(cx);
1303
1304 EditorElement::new(
1305 &self.access_key_id_editor,
1306 EditorStyle {
1307 background: cx.theme().colors().editor_background,
1308 local_player: cx.theme().players().local(),
1309 text: text_style,
1310 ..Default::default()
1311 },
1312 )
1313 }
1314
1315 fn render_secret_key_editor(&self, cx: &mut Context<Self>) -> impl IntoElement {
1316 let text_style = self.make_text_style(cx);
1317
1318 EditorElement::new(
1319 &self.secret_access_key_editor,
1320 EditorStyle {
1321 background: cx.theme().colors().editor_background,
1322 local_player: cx.theme().players().local(),
1323 text: text_style,
1324 ..Default::default()
1325 },
1326 )
1327 }
1328
1329 fn render_session_token_editor(&self, cx: &mut Context<Self>) -> impl IntoElement {
1330 let text_style = self.make_text_style(cx);
1331
1332 EditorElement::new(
1333 &self.session_token_editor,
1334 EditorStyle {
1335 background: cx.theme().colors().editor_background,
1336 local_player: cx.theme().players().local(),
1337 text: text_style,
1338 ..Default::default()
1339 },
1340 )
1341 }
1342
1343 fn render_region_editor(&self, cx: &mut Context<Self>) -> impl IntoElement {
1344 let text_style = self.make_text_style(cx);
1345
1346 EditorElement::new(
1347 &self.region_editor,
1348 EditorStyle {
1349 background: cx.theme().colors().editor_background,
1350 local_player: cx.theme().players().local(),
1351 text: text_style,
1352 ..Default::default()
1353 },
1354 )
1355 }
1356
1357 fn render_static_credentials_ui(&self, cx: &mut Context<Self>) -> AnyElement {
1358 v_flex()
1359 .my_2()
1360 .gap_1p5()
1361 .child(
1362 Label::new("Static Keys")
1363 .size(LabelSize::Default)
1364 .weight(FontWeight::BOLD),
1365 )
1366 .child(
1367 Label::new(
1368 "This method uses your AWS access key ID and secret access key directly.",
1369 )
1370 )
1371 .child(
1372 List::new()
1373 .child(InstructionListItem::new(
1374 "Create an IAM user in the AWS console with programmatic access",
1375 Some("IAM Console"),
1376 Some("https://us-east-1.console.aws.amazon.com/iam/home?region=us-east-1#/users"),
1377 ))
1378 .child(InstructionListItem::new(
1379 "Attach the necessary Bedrock permissions to this ",
1380 Some("user"),
1381 Some("https://docs.aws.amazon.com/bedrock/latest/userguide/inference-prereq.html"),
1382 ))
1383 .child(InstructionListItem::text_only(
1384 "Copy the access key ID and secret access key when provided",
1385 ))
1386 .child(InstructionListItem::text_only(
1387 "Enter these credentials below",
1388 )),
1389 )
1390 .child(
1391 v_flex()
1392 .gap_0p5()
1393 .child(Label::new("Access Key ID").size(LabelSize::Small))
1394 .child(
1395 self.make_input_styles(cx)
1396 .child(self.render_access_key_id_editor(cx)),
1397 ),
1398 )
1399 .child(
1400 v_flex()
1401 .gap_0p5()
1402 .child(Label::new("Secret Access Key").size(LabelSize::Small))
1403 .child(self.make_input_styles(cx).child(self.render_secret_key_editor(cx))),
1404 )
1405 .child(
1406 v_flex()
1407 .gap_0p5()
1408 .child(Label::new("Session Token (Optional)").size(LabelSize::Small))
1409 .child(
1410 self.make_input_styles(cx)
1411 .child(self.render_session_token_editor(cx)),
1412 ),
1413 )
1414 .into_any_element()
1415 }
1416
1417 fn render_common_fields(&self, cx: &mut Context<Self>) -> AnyElement {
1418 v_flex()
1419 .gap_0p5()
1420 .child(Label::new("Region").size(LabelSize::Small))
1421 .child(
1422 self.make_input_styles(cx)
1423 .child(self.render_region_editor(cx)),
1424 )
1425 .into_any_element()
1426 }
1427}