1use anyhow::{Result, anyhow, bail};
2use futures::{AsyncBufReadExt, AsyncReadExt, StreamExt, io::BufReader, stream::BoxStream};
3use http_client::{AsyncBody, HttpClient, Method, Request as HttpRequest};
4use serde::{Deserialize, Serialize};
5
/// Base URL (scheme and host, no trailing slash) of Google's Generative Language API.
///
/// NOTE(review): presumably what callers pass as the `api_url` argument of the
/// request functions in this file — confirm against call sites.
pub const API_URL: &str = "https://generativelanguage.googleapis.com";
7
8pub async fn stream_generate_content(
9 client: &dyn HttpClient,
10 api_url: &str,
11 api_key: &str,
12 mut request: GenerateContentRequest,
13) -> Result<BoxStream<'static, Result<GenerateContentResponse>>> {
14 if request.contents.is_empty() {
15 bail!("Request must contain at least one content item");
16 }
17
18 if let Some(user_content) = request
19 .contents
20 .iter()
21 .find(|content| content.role == Role::User)
22 {
23 if user_content.parts.is_empty() {
24 bail!("User content must contain at least one part");
25 }
26 }
27
28 let uri = format!(
29 "{api_url}/v1beta/models/{model}:streamGenerateContent?alt=sse&key={api_key}",
30 model = request.model
31 );
32 request.model.clear();
33
34 let request_builder = HttpRequest::builder()
35 .method(Method::POST)
36 .uri(uri)
37 .header("Content-Type", "application/json");
38
39 let request = request_builder.body(AsyncBody::from(serde_json::to_string(&request)?))?;
40 let mut response = client.send(request).await?;
41 if response.status().is_success() {
42 let reader = BufReader::new(response.into_body());
43 Ok(reader
44 .lines()
45 .filter_map(|line| async move {
46 match line {
47 Ok(line) => {
48 if let Some(line) = line.strip_prefix("data: ") {
49 match serde_json::from_str(line) {
50 Ok(response) => Some(Ok(response)),
51 Err(error) => Some(Err(anyhow!(format!(
52 "Error parsing JSON: {:?}\n{:?}",
53 error, line
54 )))),
55 }
56 } else {
57 None
58 }
59 }
60 Err(error) => Some(Err(anyhow!(error))),
61 }
62 })
63 .boxed())
64 } else {
65 let mut text = String::new();
66 response.body_mut().read_to_string(&mut text).await?;
67 Err(anyhow!(
68 "error during streamGenerateContent, status code: {:?}, body: {}",
69 response.status(),
70 text
71 ))
72 }
73}
74
75pub async fn count_tokens(
76 client: &dyn HttpClient,
77 api_url: &str,
78 api_key: &str,
79 request: CountTokensRequest,
80) -> Result<CountTokensResponse> {
81 let uri = format!(
82 "{}/v1beta/models/gemini-pro:countTokens?key={}",
83 api_url, api_key
84 );
85 let request = serde_json::to_string(&request)?;
86
87 let request_builder = HttpRequest::builder()
88 .method(Method::POST)
89 .uri(&uri)
90 .header("Content-Type", "application/json");
91
92 let http_request = request_builder.body(AsyncBody::from(request))?;
93 let mut response = client.send(http_request).await?;
94 let mut text = String::new();
95 response.body_mut().read_to_string(&mut text).await?;
96 if response.status().is_success() {
97 Ok(serde_json::from_str::<CountTokensResponse>(&text)?)
98 } else {
99 Err(anyhow!(
100 "error during countTokens, status code: {:?}, body: {}",
101 response.status(),
102 text
103 ))
104 }
105}
106
107#[derive(Debug, Serialize, Deserialize)]
108pub enum Task {
109 #[serde(rename = "generateContent")]
110 GenerateContent,
111 #[serde(rename = "streamGenerateContent")]
112 StreamGenerateContent,
113 #[serde(rename = "countTokens")]
114 CountTokens,
115 #[serde(rename = "embedContent")]
116 EmbedContent,
117 #[serde(rename = "batchEmbedContents")]
118 BatchEmbedContents,
119}
120
121#[derive(Debug, Serialize, Deserialize)]
122#[serde(rename_all = "camelCase")]
123pub struct GenerateContentRequest {
124 #[serde(default, skip_serializing_if = "String::is_empty")]
125 pub model: String,
126 pub contents: Vec<Content>,
127 pub system_instruction: Option<SystemInstruction>,
128 pub generation_config: Option<GenerationConfig>,
129 pub safety_settings: Option<Vec<SafetySetting>>,
130 #[serde(skip_serializing_if = "Option::is_none")]
131 pub tools: Option<Vec<Tool>>,
132 #[serde(skip_serializing_if = "Option::is_none")]
133 pub tool_config: Option<ToolConfig>,
134}
135
136#[derive(Debug, Serialize, Deserialize)]
137#[serde(rename_all = "camelCase")]
138pub struct GenerateContentResponse {
139 pub candidates: Option<Vec<GenerateContentCandidate>>,
140 pub prompt_feedback: Option<PromptFeedback>,
141 pub usage_metadata: Option<UsageMetadata>,
142}
143
144#[derive(Debug, Serialize, Deserialize)]
145#[serde(rename_all = "camelCase")]
146pub struct GenerateContentCandidate {
147 pub index: Option<usize>,
148 pub content: Content,
149 pub finish_reason: Option<String>,
150 pub finish_message: Option<String>,
151 pub safety_ratings: Option<Vec<SafetyRating>>,
152 pub citation_metadata: Option<CitationMetadata>,
153}
154
155#[derive(Debug, Serialize, Deserialize)]
156#[serde(rename_all = "camelCase")]
157pub struct Content {
158 #[serde(default)]
159 pub parts: Vec<Part>,
160 pub role: Role,
161}
162
163#[derive(Debug, Serialize, Deserialize)]
164#[serde(rename_all = "camelCase")]
165pub struct SystemInstruction {
166 pub parts: Vec<Part>,
167}
168
169#[derive(Debug, PartialEq, Deserialize, Serialize)]
170#[serde(rename_all = "camelCase")]
171pub enum Role {
172 User,
173 Model,
174}
175
176#[derive(Debug, Serialize, Deserialize)]
177#[serde(untagged)]
178pub enum Part {
179 TextPart(TextPart),
180 InlineDataPart(InlineDataPart),
181 FunctionCallPart(FunctionCallPart),
182 FunctionResponsePart(FunctionResponsePart),
183}
184
185#[derive(Debug, Serialize, Deserialize)]
186#[serde(rename_all = "camelCase")]
187pub struct TextPart {
188 pub text: String,
189}
190
191#[derive(Debug, Serialize, Deserialize)]
192#[serde(rename_all = "camelCase")]
193pub struct InlineDataPart {
194 pub inline_data: GenerativeContentBlob,
195}
196
197#[derive(Debug, Serialize, Deserialize)]
198#[serde(rename_all = "camelCase")]
199pub struct GenerativeContentBlob {
200 pub mime_type: String,
201 pub data: String,
202}
203
204#[derive(Debug, Serialize, Deserialize)]
205#[serde(rename_all = "camelCase")]
206pub struct FunctionCallPart {
207 pub function_call: FunctionCall,
208}
209
210#[derive(Debug, Serialize, Deserialize)]
211#[serde(rename_all = "camelCase")]
212pub struct FunctionResponsePart {
213 pub function_response: FunctionResponse,
214}
215
216#[derive(Debug, Serialize, Deserialize)]
217#[serde(rename_all = "camelCase")]
218pub struct CitationSource {
219 pub start_index: Option<usize>,
220 pub end_index: Option<usize>,
221 pub uri: Option<String>,
222 pub license: Option<String>,
223}
224
225#[derive(Debug, Serialize, Deserialize)]
226#[serde(rename_all = "camelCase")]
227pub struct CitationMetadata {
228 pub citation_sources: Vec<CitationSource>,
229}
230
231#[derive(Debug, Serialize, Deserialize)]
232#[serde(rename_all = "camelCase")]
233pub struct PromptFeedback {
234 pub block_reason: Option<String>,
235 pub safety_ratings: Vec<SafetyRating>,
236 pub block_reason_message: Option<String>,
237}
238
239#[derive(Debug, Serialize, Deserialize, Default)]
240#[serde(rename_all = "camelCase")]
241pub struct UsageMetadata {
242 pub prompt_token_count: Option<usize>,
243 pub cached_content_token_count: Option<usize>,
244 pub candidates_token_count: Option<usize>,
245 pub tool_use_prompt_token_count: Option<usize>,
246 pub thoughts_token_count: Option<usize>,
247 pub total_token_count: Option<usize>,
248}
249
250#[derive(Debug, Deserialize, Serialize)]
251#[serde(rename_all = "camelCase")]
252pub struct GenerationConfig {
253 pub candidate_count: Option<usize>,
254 pub stop_sequences: Option<Vec<String>>,
255 pub max_output_tokens: Option<usize>,
256 pub temperature: Option<f64>,
257 pub top_p: Option<f64>,
258 pub top_k: Option<usize>,
259}
260
261#[derive(Debug, Serialize, Deserialize)]
262#[serde(rename_all = "camelCase")]
263pub struct SafetySetting {
264 pub category: HarmCategory,
265 pub threshold: HarmBlockThreshold,
266}
267
268#[derive(Debug, Serialize, Deserialize)]
269pub enum HarmCategory {
270 #[serde(rename = "HARM_CATEGORY_UNSPECIFIED")]
271 Unspecified,
272 #[serde(rename = "HARM_CATEGORY_DEROGATORY")]
273 Derogatory,
274 #[serde(rename = "HARM_CATEGORY_TOXICITY")]
275 Toxicity,
276 #[serde(rename = "HARM_CATEGORY_VIOLENCE")]
277 Violence,
278 #[serde(rename = "HARM_CATEGORY_SEXUAL")]
279 Sexual,
280 #[serde(rename = "HARM_CATEGORY_MEDICAL")]
281 Medical,
282 #[serde(rename = "HARM_CATEGORY_DANGEROUS")]
283 Dangerous,
284 #[serde(rename = "HARM_CATEGORY_HARASSMENT")]
285 Harassment,
286 #[serde(rename = "HARM_CATEGORY_HATE_SPEECH")]
287 HateSpeech,
288 #[serde(rename = "HARM_CATEGORY_SEXUALLY_EXPLICIT")]
289 SexuallyExplicit,
290 #[serde(rename = "HARM_CATEGORY_DANGEROUS_CONTENT")]
291 DangerousContent,
292}
293
294#[derive(Debug, Serialize, Deserialize)]
295pub enum HarmBlockThreshold {
296 #[serde(rename = "HARM_BLOCK_THRESHOLD_UNSPECIFIED")]
297 Unspecified,
298 #[serde(rename = "BLOCK_LOW_AND_ABOVE")]
299 BlockLowAndAbove,
300 #[serde(rename = "BLOCK_MEDIUM_AND_ABOVE")]
301 BlockMediumAndAbove,
302 #[serde(rename = "BLOCK_ONLY_HIGH")]
303 BlockOnlyHigh,
304 #[serde(rename = "BLOCK_NONE")]
305 BlockNone,
306}
307
308#[derive(Debug, Serialize, Deserialize)]
309#[serde(rename_all = "SCREAMING_SNAKE_CASE")]
310pub enum HarmProbability {
311 #[serde(rename = "HARM_PROBABILITY_UNSPECIFIED")]
312 Unspecified,
313 Negligible,
314 Low,
315 Medium,
316 High,
317}
318
319#[derive(Debug, Serialize, Deserialize)]
320#[serde(rename_all = "camelCase")]
321pub struct SafetyRating {
322 pub category: HarmCategory,
323 pub probability: HarmProbability,
324}
325
326#[derive(Debug, Serialize, Deserialize)]
327#[serde(rename_all = "camelCase")]
328pub struct CountTokensRequest {
329 pub contents: Vec<Content>,
330}
331
332#[derive(Debug, Serialize, Deserialize)]
333#[serde(rename_all = "camelCase")]
334pub struct CountTokensResponse {
335 pub total_tokens: usize,
336}
337
338#[derive(Debug, Serialize, Deserialize)]
339pub struct FunctionCall {
340 pub name: String,
341 pub args: serde_json::Value,
342}
343
344#[derive(Debug, Serialize, Deserialize)]
345pub struct FunctionResponse {
346 pub name: String,
347 pub response: serde_json::Value,
348}
349
350#[derive(Debug, Serialize, Deserialize)]
351#[serde(rename_all = "camelCase")]
352pub struct Tool {
353 pub function_declarations: Vec<FunctionDeclaration>,
354}
355
356#[derive(Debug, Serialize, Deserialize)]
357#[serde(rename_all = "camelCase")]
358pub struct ToolConfig {
359 pub function_calling_config: FunctionCallingConfig,
360}
361
362#[derive(Debug, Serialize, Deserialize)]
363#[serde(rename_all = "camelCase")]
364pub struct FunctionCallingConfig {
365 pub mode: FunctionCallingMode,
366 #[serde(skip_serializing_if = "Option::is_none")]
367 pub allowed_function_names: Option<Vec<String>>,
368}
369
370#[derive(Debug, Serialize, Deserialize)]
371#[serde(rename_all = "lowercase")]
372pub enum FunctionCallingMode {
373 Auto,
374 Any,
375 None,
376}
377
378#[derive(Debug, Serialize, Deserialize)]
379pub struct FunctionDeclaration {
380 pub name: String,
381 pub description: String,
382 pub parameters: serde_json::Value,
383}
384
385#[cfg_attr(feature = "schemars", derive(schemars::JsonSchema))]
386#[derive(Clone, Default, Debug, Deserialize, Serialize, PartialEq, Eq, strum::EnumIter)]
387pub enum Model {
388 #[serde(rename = "gemini-1.5-pro")]
389 Gemini15Pro,
390 #[serde(rename = "gemini-1.5-flash")]
391 Gemini15Flash,
392 #[serde(rename = "gemini-2.0-pro-exp")]
393 Gemini20Pro,
394 #[serde(rename = "gemini-2.0-flash")]
395 #[default]
396 Gemini20Flash,
397 #[serde(rename = "gemini-2.0-flash-thinking-exp")]
398 Gemini20FlashThinking,
399 #[serde(rename = "gemini-2.0-flash-lite-preview")]
400 Gemini20FlashLite,
401 #[serde(rename = "gemini-2.5-pro-exp-03-25")]
402 Gemini25ProExp0325,
403 #[serde(rename = "gemini-2.5-pro-preview-03-25")]
404 Gemini25ProPreview0325,
405 #[serde(rename = "gemini-2.5-flash-preview-04-17")]
406 Gemini25FlashPreview0417,
407 #[serde(rename = "custom")]
408 Custom {
409 name: String,
410 /// The name displayed in the UI, such as in the assistant panel model dropdown menu.
411 display_name: Option<String>,
412 max_tokens: usize,
413 },
414}
415
416impl Model {
417 pub fn default_fast() -> Model {
418 Model::Gemini15Flash
419 }
420
421 pub fn id(&self) -> &str {
422 match self {
423 Model::Gemini15Pro => "gemini-1.5-pro",
424 Model::Gemini15Flash => "gemini-1.5-flash",
425 Model::Gemini20Pro => "gemini-2.0-pro-exp",
426 Model::Gemini20Flash => "gemini-2.0-flash",
427 Model::Gemini20FlashThinking => "gemini-2.0-flash-thinking-exp",
428 Model::Gemini20FlashLite => "gemini-2.0-flash-lite-preview",
429 Model::Gemini25ProExp0325 => "gemini-2.5-pro-exp-03-25",
430 Model::Gemini25ProPreview0325 => "gemini-2.5-pro-preview-03-25",
431 Model::Gemini25FlashPreview0417 => "gemini-2.5-flash-preview-04-17",
432 Model::Custom { name, .. } => name,
433 }
434 }
435
436 pub fn display_name(&self) -> &str {
437 match self {
438 Model::Gemini15Pro => "Gemini 1.5 Pro",
439 Model::Gemini15Flash => "Gemini 1.5 Flash",
440 Model::Gemini20Pro => "Gemini 2.0 Pro",
441 Model::Gemini20Flash => "Gemini 2.0 Flash",
442 Model::Gemini20FlashThinking => "Gemini 2.0 Flash Thinking",
443 Model::Gemini20FlashLite => "Gemini 2.0 Flash Lite",
444 Model::Gemini25ProExp0325 => "Gemini 2.5 Pro Exp",
445 Model::Gemini25ProPreview0325 => "Gemini 2.5 Pro Preview",
446 Model::Gemini25FlashPreview0417 => "Gemini 2.5 Flash Preview",
447 Self::Custom {
448 name, display_name, ..
449 } => display_name.as_ref().unwrap_or(name),
450 }
451 }
452
453 pub fn max_token_count(&self) -> usize {
454 const ONE_MILLION: usize = 1_048_576;
455 const TWO_MILLION: usize = 2_097_152;
456 match self {
457 Model::Gemini15Pro => TWO_MILLION,
458 Model::Gemini15Flash => ONE_MILLION,
459 Model::Gemini20Pro => TWO_MILLION,
460 Model::Gemini20Flash => ONE_MILLION,
461 Model::Gemini20FlashThinking => ONE_MILLION,
462 Model::Gemini20FlashLite => ONE_MILLION,
463 Model::Gemini25ProExp0325 => ONE_MILLION,
464 Model::Gemini25ProPreview0325 => ONE_MILLION,
465 Model::Gemini25FlashPreview0417 => ONE_MILLION,
466 Model::Custom { max_tokens, .. } => *max_tokens,
467 }
468 }
469}
470
471impl std::fmt::Display for Model {
472 fn fmt(&self, f: &mut std::fmt::Formatter<'_>) -> std::fmt::Result {
473 write!(f, "{}", self.id())
474 }
475}