1use anyhow::{Result, anyhow, bail};
2use futures::{AsyncBufReadExt, AsyncReadExt, StreamExt, io::BufReader, stream::BoxStream};
3use http_client::{AsyncBody, HttpClient, Method, Request as HttpRequest};
4use serde::{Deserialize, Serialize};
5
/// Base URL of the Google Generative Language API.
///
/// The request helpers in this file take an `api_url` argument and append a
/// `/v1beta/models/...` path to it; this constant is presumably the default
/// value callers pass there.
pub const API_URL: &str = "https://generativelanguage.googleapis.com";
7
8pub async fn stream_generate_content(
9 client: &dyn HttpClient,
10 api_url: &str,
11 api_key: &str,
12 mut request: GenerateContentRequest,
13) -> Result<BoxStream<'static, Result<GenerateContentResponse>>> {
14 if request.contents.is_empty() {
15 bail!("Request must contain at least one content item");
16 }
17
18 if let Some(user_content) = request
19 .contents
20 .iter()
21 .find(|content| content.role == Role::User)
22 {
23 if user_content.parts.is_empty() {
24 bail!("User content must contain at least one part");
25 }
26 }
27
28 let uri = format!(
29 "{api_url}/v1beta/models/{model}:streamGenerateContent?alt=sse&key={api_key}",
30 model = request.model
31 );
32 request.model.clear();
33
34 let request_builder = HttpRequest::builder()
35 .method(Method::POST)
36 .uri(uri)
37 .header("Content-Type", "application/json");
38
39 let request = request_builder.body(AsyncBody::from(serde_json::to_string(&request)?))?;
40 let mut response = client.send(request).await?;
41 if response.status().is_success() {
42 let reader = BufReader::new(response.into_body());
43 Ok(reader
44 .lines()
45 .filter_map(|line| async move {
46 match line {
47 Ok(line) => {
48 if let Some(line) = line.strip_prefix("data: ") {
49 match serde_json::from_str(line) {
50 Ok(response) => Some(Ok(response)),
51 Err(error) => Some(Err(anyhow!(format!(
52 "Error parsing JSON: {:?}\n{:?}",
53 error, line
54 )))),
55 }
56 } else {
57 None
58 }
59 }
60 Err(error) => Some(Err(anyhow!(error))),
61 }
62 })
63 .boxed())
64 } else {
65 let mut text = String::new();
66 response.body_mut().read_to_string(&mut text).await?;
67 Err(anyhow!(
68 "error during streamGenerateContent, status code: {:?}, body: {}",
69 response.status(),
70 text
71 ))
72 }
73}
74
75pub async fn count_tokens(
76 client: &dyn HttpClient,
77 api_url: &str,
78 api_key: &str,
79 request: CountTokensRequest,
80) -> Result<CountTokensResponse> {
81 let uri = format!(
82 "{}/v1beta/models/gemini-pro:countTokens?key={}",
83 api_url, api_key
84 );
85 let request = serde_json::to_string(&request)?;
86
87 let request_builder = HttpRequest::builder()
88 .method(Method::POST)
89 .uri(&uri)
90 .header("Content-Type", "application/json");
91
92 let http_request = request_builder.body(AsyncBody::from(request))?;
93 let mut response = client.send(http_request).await?;
94 let mut text = String::new();
95 response.body_mut().read_to_string(&mut text).await?;
96 if response.status().is_success() {
97 Ok(serde_json::from_str::<CountTokensResponse>(&text)?)
98 } else {
99 Err(anyhow!(
100 "error during countTokens, status code: {:?}, body: {}",
101 response.status(),
102 text
103 ))
104 }
105}
106
/// Names of API operations.
///
/// Each variant (de)serializes as the camelCase string given in its `rename`
/// attribute.
#[derive(Debug, Serialize, Deserialize)]
pub enum Task {
    #[serde(rename = "generateContent")]
    GenerateContent,
    #[serde(rename = "streamGenerateContent")]
    StreamGenerateContent,
    #[serde(rename = "countTokens")]
    CountTokens,
    #[serde(rename = "embedContent")]
    EmbedContent,
    #[serde(rename = "batchEmbedContents")]
    BatchEmbedContents,
}
120
/// Body of a generate-content request, (de)serialized with camelCase keys.
///
/// Every `Option` field is omitted from the serialized JSON when it is `None`.
#[derive(Debug, Serialize, Deserialize)]
#[serde(rename_all = "camelCase")]
pub struct GenerateContentRequest {
    /// Model id. Omitted from the JSON when empty, and defaults to an empty
    /// string when the key is absent. `stream_generate_content` puts it in the
    /// request URL and empties it before serializing the body.
    #[serde(default, skip_serializing_if = "String::is_empty")]
    pub model: String,
    /// Conversation contents. `stream_generate_content` rejects an empty list.
    pub contents: Vec<Content>,
    /// Optional system instruction parts.
    #[serde(skip_serializing_if = "Option::is_none")]
    pub system_instruction: Option<SystemInstruction>,
    /// Optional generation parameters.
    #[serde(skip_serializing_if = "Option::is_none")]
    pub generation_config: Option<GenerationConfig>,
    /// Optional per-category safety thresholds.
    #[serde(skip_serializing_if = "Option::is_none")]
    pub safety_settings: Option<Vec<SafetySetting>>,
    /// Optional tool (function declaration) list.
    #[serde(skip_serializing_if = "Option::is_none")]
    pub tools: Option<Vec<Tool>>,
    /// Optional function-calling configuration.
    #[serde(skip_serializing_if = "Option::is_none")]
    pub tool_config: Option<ToolConfig>,
}
138
/// One generate-content response message, (de)serialized with camelCase keys.
///
/// `stream_generate_content` yields one of these for every `data: ` line it
/// parses. All fields are optional and are omitted from serialized JSON when
/// `None`.
#[derive(Debug, Serialize, Deserialize)]
#[serde(rename_all = "camelCase")]
pub struct GenerateContentResponse {
    /// Candidate outputs carried by this message, if any.
    #[serde(skip_serializing_if = "Option::is_none")]
    pub candidates: Option<Vec<GenerateContentCandidate>>,
    /// Feedback about the prompt, if reported.
    #[serde(skip_serializing_if = "Option::is_none")]
    pub prompt_feedback: Option<PromptFeedback>,
    /// Token usage counters, if reported.
    #[serde(skip_serializing_if = "Option::is_none")]
    pub usage_metadata: Option<UsageMetadata>,
}
149
/// A single candidate inside a `GenerateContentResponse`, with camelCase keys.
///
/// `content` is the only required key; every `Option` field is omitted from
/// serialized JSON when `None`.
#[derive(Debug, Serialize, Deserialize)]
#[serde(rename_all = "camelCase")]
pub struct GenerateContentCandidate {
    /// Position of this candidate, when reported.
    #[serde(skip_serializing_if = "Option::is_none")]
    pub index: Option<usize>,
    /// The candidate's content. Deserialization fails if this key is missing.
    pub content: Content,
    /// Finish reason, kept as the raw string.
    #[serde(skip_serializing_if = "Option::is_none")]
    pub finish_reason: Option<String>,
    /// Message accompanying the finish reason, when present.
    #[serde(skip_serializing_if = "Option::is_none")]
    pub finish_message: Option<String>,
    /// Safety ratings for this candidate, when reported.
    #[serde(skip_serializing_if = "Option::is_none")]
    pub safety_ratings: Option<Vec<SafetyRating>>,
    /// Citation information for this candidate, when reported.
    #[serde(skip_serializing_if = "Option::is_none")]
    pub citation_metadata: Option<CitationMetadata>,
}
165
/// A list of parts attributed to one role; used in both requests and responses.
#[derive(Debug, Serialize, Deserialize)]
#[serde(rename_all = "camelCase")]
pub struct Content {
    /// Parts making up this content. Defaults to an empty list when the key is
    /// absent during deserialization.
    #[serde(default)]
    pub parts: Vec<Part>,
    /// Who produced this content. Required when deserializing.
    pub role: Role,
}
173
/// System instruction attached to a `GenerateContentRequest`: a list of parts
/// with no role.
#[derive(Debug, Serialize, Deserialize)]
#[serde(rename_all = "camelCase")]
pub struct SystemInstruction {
    /// Parts making up the instruction.
    pub parts: Vec<Part>,
}
179
/// Author of a `Content` entry.
///
/// With `rename_all = "camelCase"` the variants (de)serialize as `"user"` and
/// `"model"`.
#[derive(Debug, PartialEq, Deserialize, Serialize)]
#[serde(rename_all = "camelCase")]
pub enum Role {
    User,
    Model,
}
186
/// One piece of a `Content`.
///
/// The enum is untagged: no variant name appears in the JSON. On
/// deserialization serde tries the variants in declaration order and keeps the
/// first one that matches, so the variants are told apart by the key each
/// wrapper struct requires (`text`, `inlineData`, `functionCall`,
/// `functionResponse`).
#[derive(Debug, Serialize, Deserialize)]
#[serde(untagged)]
pub enum Part {
    TextPart(TextPart),
    InlineDataPart(InlineDataPart),
    FunctionCallPart(FunctionCallPart),
    FunctionResponsePart(FunctionResponsePart),
}
195
/// A `Part` holding plain text under the `text` key.
#[derive(Debug, Serialize, Deserialize)]
#[serde(rename_all = "camelCase")]
pub struct TextPart {
    pub text: String,
}
201
/// A `Part` holding an inline blob under the `inlineData` key.
#[derive(Debug, Serialize, Deserialize)]
#[serde(rename_all = "camelCase")]
pub struct InlineDataPart {
    pub inline_data: GenerativeContentBlob,
}
207
/// Inline data carried by an `InlineDataPart`, with keys `mimeType` and `data`.
#[derive(Debug, Serialize, Deserialize)]
#[serde(rename_all = "camelCase")]
pub struct GenerativeContentBlob {
    /// MIME type of `data`.
    pub mime_type: String,
    /// The payload as a string. NOTE(review): presumably base64-encoded —
    /// confirm against the API documentation.
    pub data: String,
}
214
/// A `Part` holding a function call under the `functionCall` key.
#[derive(Debug, Serialize, Deserialize)]
#[serde(rename_all = "camelCase")]
pub struct FunctionCallPart {
    pub function_call: FunctionCall,
}
220
/// A `Part` holding a function result under the `functionResponse` key.
#[derive(Debug, Serialize, Deserialize)]
#[serde(rename_all = "camelCase")]
pub struct FunctionResponsePart {
    pub function_response: FunctionResponse,
}
226
/// One citation entry inside `CitationMetadata`, with camelCase keys.
///
/// Every field is optional and is omitted from serialized JSON when `None`.
#[derive(Debug, Serialize, Deserialize)]
#[serde(rename_all = "camelCase")]
pub struct CitationSource {
    /// Start of the cited span (`startIndex`).
    #[serde(skip_serializing_if = "Option::is_none")]
    pub start_index: Option<usize>,
    /// End of the cited span (`endIndex`).
    #[serde(skip_serializing_if = "Option::is_none")]
    pub end_index: Option<usize>,
    /// URI of the cited source.
    #[serde(skip_serializing_if = "Option::is_none")]
    pub uri: Option<String>,
    /// License of the cited source.
    #[serde(skip_serializing_if = "Option::is_none")]
    pub license: Option<String>,
}
239
/// Citation information attached to a candidate.
#[derive(Debug, Serialize, Deserialize)]
#[serde(rename_all = "camelCase")]
pub struct CitationMetadata {
    /// Citation entries (`citationSources`). Required when deserializing.
    pub citation_sources: Vec<CitationSource>,
}
245
246#[derive(Debug, Serialize, Deserialize)]
247#[serde(rename_all = "camelCase")]
248pub struct PromptFeedback {
249 #[serde(skip_serializing_if = "Option::is_none")]
250 pub block_reason: Option<String>,
251 pub safety_ratings: Vec<SafetyRating>,
252 #[serde(skip_serializing_if = "Option::is_none")]
253 pub block_reason_message: Option<String>,
254}
255
/// Token counters reported with a response, with camelCase keys.
///
/// Every counter is optional and is omitted from serialized JSON when `None`;
/// the derived `Default` leaves all of them `None`.
#[derive(Debug, Serialize, Deserialize, Default)]
#[serde(rename_all = "camelCase")]
pub struct UsageMetadata {
    /// `promptTokenCount`.
    #[serde(skip_serializing_if = "Option::is_none")]
    pub prompt_token_count: Option<usize>,
    /// `cachedContentTokenCount`.
    #[serde(skip_serializing_if = "Option::is_none")]
    pub cached_content_token_count: Option<usize>,
    /// `candidatesTokenCount`.
    #[serde(skip_serializing_if = "Option::is_none")]
    pub candidates_token_count: Option<usize>,
    /// `toolUsePromptTokenCount`.
    #[serde(skip_serializing_if = "Option::is_none")]
    pub tool_use_prompt_token_count: Option<usize>,
    /// `thoughtsTokenCount`.
    #[serde(skip_serializing_if = "Option::is_none")]
    pub thoughts_token_count: Option<usize>,
    /// `totalTokenCount`.
    #[serde(skip_serializing_if = "Option::is_none")]
    pub total_token_count: Option<usize>,
}
272
/// Optional generation parameters for a `GenerateContentRequest`, with
/// camelCase keys.
///
/// Each field is omitted from serialized JSON when `None`.
#[derive(Debug, Deserialize, Serialize)]
#[serde(rename_all = "camelCase")]
pub struct GenerationConfig {
    /// `candidateCount`.
    #[serde(skip_serializing_if = "Option::is_none")]
    pub candidate_count: Option<usize>,
    /// `stopSequences`.
    #[serde(skip_serializing_if = "Option::is_none")]
    pub stop_sequences: Option<Vec<String>>,
    /// `maxOutputTokens`.
    #[serde(skip_serializing_if = "Option::is_none")]
    pub max_output_tokens: Option<usize>,
    /// `temperature`.
    #[serde(skip_serializing_if = "Option::is_none")]
    pub temperature: Option<f64>,
    /// `topP`.
    #[serde(skip_serializing_if = "Option::is_none")]
    pub top_p: Option<f64>,
    /// `topK`.
    #[serde(skip_serializing_if = "Option::is_none")]
    pub top_k: Option<usize>,
}
289
/// Pairs a harm category with the blocking threshold to apply to it.
#[derive(Debug, Serialize, Deserialize)]
#[serde(rename_all = "camelCase")]
pub struct SafetySetting {
    pub category: HarmCategory,
    pub threshold: HarmBlockThreshold,
}
296
/// Harm categories used in safety settings and safety ratings.
///
/// Each variant (de)serializes as the `HARM_CATEGORY_*` string in its `rename`
/// attribute. There is no catch-all variant, so a string outside this list
/// fails to deserialize.
#[derive(Debug, Serialize, Deserialize)]
pub enum HarmCategory {
    #[serde(rename = "HARM_CATEGORY_UNSPECIFIED")]
    Unspecified,
    #[serde(rename = "HARM_CATEGORY_DEROGATORY")]
    Derogatory,
    #[serde(rename = "HARM_CATEGORY_TOXICITY")]
    Toxicity,
    #[serde(rename = "HARM_CATEGORY_VIOLENCE")]
    Violence,
    #[serde(rename = "HARM_CATEGORY_SEXUAL")]
    Sexual,
    #[serde(rename = "HARM_CATEGORY_MEDICAL")]
    Medical,
    #[serde(rename = "HARM_CATEGORY_DANGEROUS")]
    Dangerous,
    #[serde(rename = "HARM_CATEGORY_HARASSMENT")]
    Harassment,
    #[serde(rename = "HARM_CATEGORY_HATE_SPEECH")]
    HateSpeech,
    #[serde(rename = "HARM_CATEGORY_SEXUALLY_EXPLICIT")]
    SexuallyExplicit,
    #[serde(rename = "HARM_CATEGORY_DANGEROUS_CONTENT")]
    DangerousContent,
}
322
/// Blocking threshold for a `SafetySetting`.
///
/// Variants (de)serialize in SCREAMING_SNAKE_CASE (for example
/// `BLOCK_LOW_AND_ABOVE`), except `Unspecified`, which uses the explicit
/// `HARM_BLOCK_THRESHOLD_UNSPECIFIED` name.
#[derive(Debug, Serialize, Deserialize)]
#[serde(rename_all = "SCREAMING_SNAKE_CASE")]
pub enum HarmBlockThreshold {
    #[serde(rename = "HARM_BLOCK_THRESHOLD_UNSPECIFIED")]
    Unspecified,
    BlockLowAndAbove,
    BlockMediumAndAbove,
    BlockOnlyHigh,
    BlockNone,
}
333
/// Probability level reported in a `SafetyRating`.
///
/// Variants (de)serialize in SCREAMING_SNAKE_CASE (`NEGLIGIBLE`, `LOW`,
/// `MEDIUM`, `HIGH`), except `Unspecified`, which uses the explicit
/// `HARM_PROBABILITY_UNSPECIFIED` name.
#[derive(Debug, Serialize, Deserialize)]
#[serde(rename_all = "SCREAMING_SNAKE_CASE")]
pub enum HarmProbability {
    #[serde(rename = "HARM_PROBABILITY_UNSPECIFIED")]
    Unspecified,
    Negligible,
    Low,
    Medium,
    High,
}
344
/// A harm category together with its reported probability level.
///
/// Both keys are required when deserializing.
#[derive(Debug, Serialize, Deserialize)]
#[serde(rename_all = "camelCase")]
pub struct SafetyRating {
    pub category: HarmCategory,
    pub probability: HarmProbability,
}
351
/// Body sent by `count_tokens`: the contents whose tokens should be counted.
#[derive(Debug, Serialize, Deserialize)]
#[serde(rename_all = "camelCase")]
pub struct CountTokensRequest {
    pub contents: Vec<Content>,
}
357
/// Successful reply parsed by `count_tokens`.
#[derive(Debug, Serialize, Deserialize)]
#[serde(rename_all = "camelCase")]
pub struct CountTokensResponse {
    /// Token count, read from the `totalTokens` key.
    pub total_tokens: usize,
}
363
/// A function invocation carried by a `FunctionCallPart`.
#[derive(Debug, Serialize, Deserialize)]
pub struct FunctionCall {
    /// Name of the function being called.
    pub name: String,
    /// Call arguments as arbitrary JSON. Required when deserializing.
    pub args: serde_json::Value,
}
369
/// A function result carried by a `FunctionResponsePart`.
#[derive(Debug, Serialize, Deserialize)]
pub struct FunctionResponse {
    /// Name of the function that produced the response.
    pub name: String,
    /// The response payload as arbitrary JSON.
    pub response: serde_json::Value,
}
375
/// A tool entry in a `GenerateContentRequest`: a list of function declarations
/// serialized under `functionDeclarations`.
#[derive(Debug, Serialize, Deserialize)]
#[serde(rename_all = "camelCase")]
pub struct Tool {
    pub function_declarations: Vec<FunctionDeclaration>,
}
381
/// Tool configuration for a `GenerateContentRequest`; wraps the
/// function-calling settings under `functionCallingConfig`.
#[derive(Debug, Serialize, Deserialize)]
#[serde(rename_all = "camelCase")]
pub struct ToolConfig {
    pub function_calling_config: FunctionCallingConfig,
}
387
/// Function-calling settings inside a `ToolConfig`, with camelCase keys.
#[derive(Debug, Serialize, Deserialize)]
#[serde(rename_all = "camelCase")]
pub struct FunctionCallingConfig {
    /// Function-calling mode.
    pub mode: FunctionCallingMode,
    /// Optional list of function names (`allowedFunctionNames`); omitted from
    /// serialized JSON when `None`.
    #[serde(skip_serializing_if = "Option::is_none")]
    pub allowed_function_names: Option<Vec<String>>,
}
395
/// Mode value for `FunctionCallingConfig`.
///
/// With `rename_all = "lowercase"` the variants (de)serialize as `"auto"`,
/// `"any"` and `"none"`.
#[derive(Debug, Serialize, Deserialize)]
#[serde(rename_all = "lowercase")]
pub enum FunctionCallingMode {
    Auto,
    Any,
    None,
}
403
/// Declaration of one callable function, listed inside a `Tool`.
#[derive(Debug, Serialize, Deserialize)]
pub struct FunctionDeclaration {
    /// Function name.
    pub name: String,
    /// Description of the function.
    pub description: String,
    /// Parameter description as arbitrary JSON. NOTE(review): presumably a
    /// JSON-schema-like object — confirm against the API documentation.
    pub parameters: serde_json::Value,
}
410
/// Known Gemini models plus a user-defined `Custom` entry.
///
/// Built-in variants (de)serialize as the model id string in their `rename`
/// attribute; `Custom` is serialized under the `custom` key with its fields.
/// `Gemini20Flash` is the `Default`. A `schemars::JsonSchema` impl is derived
/// only when the `schemars` feature is enabled.
#[cfg_attr(feature = "schemars", derive(schemars::JsonSchema))]
#[derive(Clone, Default, Debug, Deserialize, Serialize, PartialEq, Eq, strum::EnumIter)]
pub enum Model {
    #[serde(rename = "gemini-1.5-pro")]
    Gemini15Pro,
    #[serde(rename = "gemini-1.5-flash")]
    Gemini15Flash,
    #[serde(rename = "gemini-2.0-pro-exp")]
    Gemini20Pro,
    #[serde(rename = "gemini-2.0-flash")]
    #[default]
    Gemini20Flash,
    #[serde(rename = "gemini-2.0-flash-thinking-exp")]
    Gemini20FlashThinking,
    #[serde(rename = "gemini-2.0-flash-lite-preview")]
    Gemini20FlashLite,
    #[serde(rename = "gemini-2.5-pro-exp-03-25")]
    Gemini25ProExp0325,
    #[serde(rename = "gemini-2.5-pro-preview-03-25")]
    Gemini25ProPreview0325,
    #[serde(rename = "gemini-2.5-flash-preview-04-17")]
    Gemini25FlashPreview0417,
    /// A model that is not in the built-in list.
    #[serde(rename = "custom")]
    Custom {
        /// Model id; this is what `Model::id` returns for a custom model.
        name: String,
        /// The name displayed in the UI, such as in the assistant panel model dropdown menu.
        display_name: Option<String>,
        /// Value returned by `Model::max_token_count` for this model.
        max_tokens: usize,
    },
}
441
442impl Model {
443 pub fn default_fast() -> Model {
444 Model::Gemini15Flash
445 }
446
447 pub fn id(&self) -> &str {
448 match self {
449 Model::Gemini15Pro => "gemini-1.5-pro",
450 Model::Gemini15Flash => "gemini-1.5-flash",
451 Model::Gemini20Pro => "gemini-2.0-pro-exp",
452 Model::Gemini20Flash => "gemini-2.0-flash",
453 Model::Gemini20FlashThinking => "gemini-2.0-flash-thinking-exp",
454 Model::Gemini20FlashLite => "gemini-2.0-flash-lite-preview",
455 Model::Gemini25ProExp0325 => "gemini-2.5-pro-exp-03-25",
456 Model::Gemini25ProPreview0325 => "gemini-2.5-pro-preview-03-25",
457 Model::Gemini25FlashPreview0417 => "gemini-2.5-flash-preview-04-17",
458 Model::Custom { name, .. } => name,
459 }
460 }
461
462 pub fn display_name(&self) -> &str {
463 match self {
464 Model::Gemini15Pro => "Gemini 1.5 Pro",
465 Model::Gemini15Flash => "Gemini 1.5 Flash",
466 Model::Gemini20Pro => "Gemini 2.0 Pro",
467 Model::Gemini20Flash => "Gemini 2.0 Flash",
468 Model::Gemini20FlashThinking => "Gemini 2.0 Flash Thinking",
469 Model::Gemini20FlashLite => "Gemini 2.0 Flash Lite",
470 Model::Gemini25ProExp0325 => "Gemini 2.5 Pro Exp",
471 Model::Gemini25ProPreview0325 => "Gemini 2.5 Pro Preview",
472 Model::Gemini25FlashPreview0417 => "Gemini 2.5 Flash Preview",
473 Self::Custom {
474 name, display_name, ..
475 } => display_name.as_ref().unwrap_or(name),
476 }
477 }
478
479 pub fn max_token_count(&self) -> usize {
480 const ONE_MILLION: usize = 1_048_576;
481 const TWO_MILLION: usize = 2_097_152;
482 match self {
483 Model::Gemini15Pro => TWO_MILLION,
484 Model::Gemini15Flash => ONE_MILLION,
485 Model::Gemini20Pro => TWO_MILLION,
486 Model::Gemini20Flash => ONE_MILLION,
487 Model::Gemini20FlashThinking => ONE_MILLION,
488 Model::Gemini20FlashLite => ONE_MILLION,
489 Model::Gemini25ProExp0325 => ONE_MILLION,
490 Model::Gemini25ProPreview0325 => ONE_MILLION,
491 Model::Gemini25FlashPreview0417 => ONE_MILLION,
492 Model::Custom { max_tokens, .. } => *max_tokens,
493 }
494 }
495}
496
497impl std::fmt::Display for Model {
498 fn fmt(&self, f: &mut std::fmt::Formatter<'_>) -> std::fmt::Result {
499 write!(f, "{}", self.id())
500 }
501}