1use anyhow::{Result, anyhow, bail};
2use futures::{AsyncBufReadExt, AsyncReadExt, StreamExt, io::BufReader, stream::BoxStream};
3use http_client::{AsyncBody, HttpClient, Method, Request as HttpRequest};
4use serde::{Deserialize, Serialize};
5
6pub const API_URL: &str = "https://generativelanguage.googleapis.com";
7
8pub async fn stream_generate_content(
9 client: &dyn HttpClient,
10 api_url: &str,
11 api_key: &str,
12 mut request: GenerateContentRequest,
13) -> Result<BoxStream<'static, Result<GenerateContentResponse>>> {
14 if request.contents.is_empty() {
15 bail!("Request must contain at least one content item");
16 }
17
18 if let Some(user_content) = request
19 .contents
20 .iter()
21 .find(|content| content.role == Role::User)
22 {
23 if user_content.parts.is_empty() {
24 bail!("User content must contain at least one part");
25 }
26 }
27
28 let uri = format!(
29 "{api_url}/v1beta/models/{model}:streamGenerateContent?alt=sse&key={api_key}",
30 model = request.model
31 );
32 request.model.clear();
33
34 let request_builder = HttpRequest::builder()
35 .method(Method::POST)
36 .uri(uri)
37 .header("Content-Type", "application/json");
38
39 let request = request_builder.body(AsyncBody::from(serde_json::to_string(&request)?))?;
40 let mut response = client.send(request).await?;
41 if response.status().is_success() {
42 let reader = BufReader::new(response.into_body());
43 Ok(reader
44 .lines()
45 .filter_map(|line| async move {
46 match line {
47 Ok(line) => {
48 if let Some(line) = line.strip_prefix("data: ") {
49 match serde_json::from_str(line) {
50 Ok(response) => Some(Ok(response)),
51 Err(error) => Some(Err(anyhow!(error))),
52 }
53 } else {
54 None
55 }
56 }
57 Err(error) => Some(Err(anyhow!(error))),
58 }
59 })
60 .boxed())
61 } else {
62 let mut text = String::new();
63 response.body_mut().read_to_string(&mut text).await?;
64 Err(anyhow!(
65 "error during streamGenerateContent, status code: {:?}, body: {}",
66 response.status(),
67 text
68 ))
69 }
70}
71
72pub async fn count_tokens(
73 client: &dyn HttpClient,
74 api_url: &str,
75 api_key: &str,
76 request: CountTokensRequest,
77) -> Result<CountTokensResponse> {
78 let uri = format!(
79 "{}/v1beta/models/gemini-pro:countTokens?key={}",
80 api_url, api_key
81 );
82 let request = serde_json::to_string(&request)?;
83
84 let request_builder = HttpRequest::builder()
85 .method(Method::POST)
86 .uri(&uri)
87 .header("Content-Type", "application/json");
88
89 let http_request = request_builder.body(AsyncBody::from(request))?;
90 let mut response = client.send(http_request).await?;
91 let mut text = String::new();
92 response.body_mut().read_to_string(&mut text).await?;
93 if response.status().is_success() {
94 Ok(serde_json::from_str::<CountTokensResponse>(&text)?)
95 } else {
96 Err(anyhow!(
97 "error during countTokens, status code: {:?}, body: {}",
98 response.status(),
99 text
100 ))
101 }
102}
103
104#[derive(Debug, Serialize, Deserialize)]
105pub enum Task {
106 #[serde(rename = "generateContent")]
107 GenerateContent,
108 #[serde(rename = "streamGenerateContent")]
109 StreamGenerateContent,
110 #[serde(rename = "countTokens")]
111 CountTokens,
112 #[serde(rename = "embedContent")]
113 EmbedContent,
114 #[serde(rename = "batchEmbedContents")]
115 BatchEmbedContents,
116}
117
118#[derive(Debug, Serialize, Deserialize)]
119#[serde(rename_all = "camelCase")]
120pub struct GenerateContentRequest {
121 #[serde(default, skip_serializing_if = "String::is_empty")]
122 pub model: String,
123 pub contents: Vec<Content>,
124 pub system_instruction: Option<SystemInstruction>,
125 pub generation_config: Option<GenerationConfig>,
126 pub safety_settings: Option<Vec<SafetySetting>>,
127 #[serde(skip_serializing_if = "Option::is_none")]
128 pub tools: Option<Vec<Tool>>,
129 #[serde(skip_serializing_if = "Option::is_none")]
130 pub tool_config: Option<ToolConfig>,
131}
132
/// A decoded content-generation response message.
///
/// Field names use camelCase in JSON. All fields are optional.
#[derive(Debug, Serialize, Deserialize)]
#[serde(rename_all = "camelCase")]
pub struct GenerateContentResponse {
    /// Generated candidates, when present.
    pub candidates: Option<Vec<GenerateContentCandidate>>,
    /// Feedback about the prompt, when present.
    pub prompt_feedback: Option<PromptFeedback>,
    /// Token usage figures, when present.
    pub usage_metadata: Option<UsageMetadata>,
}
140
/// A single candidate inside a [`GenerateContentResponse`].
///
/// Field names use camelCase in JSON. `content` is the only field that must be present for
/// deserialization to succeed.
#[derive(Debug, Serialize, Deserialize)]
#[serde(rename_all = "camelCase")]
pub struct GenerateContentCandidate {
    /// Candidate index, when present.
    pub index: Option<usize>,
    /// The candidate's content.
    pub content: Content,
    /// Finish reason as an uninterpreted string, when present.
    pub finish_reason: Option<String>,
    /// Finish message, when present.
    pub finish_message: Option<String>,
    /// Safety ratings, when present.
    pub safety_ratings: Option<Vec<SafetyRating>>,
    /// Citation metadata, when present.
    pub citation_metadata: Option<CitationMetadata>,
}
151
152#[derive(Debug, Serialize, Deserialize)]
153#[serde(rename_all = "camelCase")]
154pub struct Content {
155 pub parts: Vec<Part>,
156 pub role: Role,
157}
158
/// System instruction attached to a [`GenerateContentRequest`]: a list of parts with no role.
#[derive(Debug, Serialize, Deserialize)]
#[serde(rename_all = "camelCase")]
pub struct SystemInstruction {
    /// The parts making up the instruction.
    pub parts: Vec<Part>,
}
164
165#[derive(Debug, PartialEq, Deserialize, Serialize)]
166#[serde(rename_all = "camelCase")]
167pub enum Role {
168 User,
169 Model,
170}
171
/// One part of a [`Content`] message.
///
/// The enum is untagged: no discriminator is written to JSON, and on deserialization serde tries
/// the variants in declaration order and keeps the first one whose shape matches.
#[derive(Debug, Serialize, Deserialize)]
#[serde(untagged)]
pub enum Part {
    /// A text part (`text` key).
    TextPart(TextPart),
    /// An inline data part (`inlineData` key).
    InlineDataPart(InlineDataPart),
    /// A function call part (`functionCall` key).
    FunctionCallPart(FunctionCallPart),
    /// A function response part (`functionResponse` key).
    FunctionResponsePart(FunctionResponsePart),
}
180
/// Payload of [`Part::TextPart`]: a single `text` string.
#[derive(Debug, Serialize, Deserialize)]
#[serde(rename_all = "camelCase")]
pub struct TextPart {
    /// The text.
    pub text: String,
}
186
/// Payload of [`Part::InlineDataPart`], serialized under the `inlineData` key.
#[derive(Debug, Serialize, Deserialize)]
#[serde(rename_all = "camelCase")]
pub struct InlineDataPart {
    /// The embedded blob.
    pub inline_data: GenerativeContentBlob,
}
192
/// A blob of data together with its MIME type, carried by [`InlineDataPart`].
#[derive(Debug, Serialize, Deserialize)]
#[serde(rename_all = "camelCase")]
pub struct GenerativeContentBlob {
    /// MIME type of `data` (serialized as `mimeType`).
    pub mime_type: String,
    /// The data as a string. NOTE(review): presumably base64-encoded — confirm against callers.
    pub data: String,
}
199
/// Payload of [`Part::FunctionCallPart`], serialized under the `functionCall` key.
#[derive(Debug, Serialize, Deserialize)]
#[serde(rename_all = "camelCase")]
pub struct FunctionCallPart {
    /// The function call.
    pub function_call: FunctionCall,
}
205
/// Payload of [`Part::FunctionResponsePart`], serialized under the `functionResponse` key.
#[derive(Debug, Serialize, Deserialize)]
#[serde(rename_all = "camelCase")]
pub struct FunctionResponsePart {
    /// The function response.
    pub function_response: FunctionResponse,
}
211
/// A single citation entry inside [`CitationMetadata`]. All fields are optional.
#[derive(Debug, Serialize, Deserialize)]
#[serde(rename_all = "camelCase")]
pub struct CitationSource {
    /// Start index of the cited span, when present.
    pub start_index: Option<usize>,
    /// End index of the cited span, when present.
    pub end_index: Option<usize>,
    /// URI of the source, when present.
    pub uri: Option<String>,
    /// License of the source, when present.
    pub license: Option<String>,
}
220
221#[derive(Debug, Serialize, Deserialize)]
222#[serde(rename_all = "camelCase")]
223pub struct CitationMetadata {
224 pub citation_sources: Vec<CitationSource>,
225}
226
227#[derive(Debug, Serialize, Deserialize)]
228#[serde(rename_all = "camelCase")]
229pub struct PromptFeedback {
230 pub block_reason: Option<String>,
231 pub safety_ratings: Vec<SafetyRating>,
232 pub block_reason_message: Option<String>,
233}
234
/// Token usage counters reported in a [`GenerateContentResponse`].
///
/// Every counter is optional; `Default` yields all `None`.
#[derive(Debug, Serialize, Deserialize, Default)]
#[serde(rename_all = "camelCase")]
pub struct UsageMetadata {
    /// `promptTokenCount`, when present.
    pub prompt_token_count: Option<usize>,
    /// `cachedContentTokenCount`, when present.
    pub cached_content_token_count: Option<usize>,
    /// `candidatesTokenCount`, when present.
    pub candidates_token_count: Option<usize>,
    /// `toolUsePromptTokenCount`, when present.
    pub tool_use_prompt_token_count: Option<usize>,
    /// `thoughtsTokenCount`, when present.
    pub thoughts_token_count: Option<usize>,
    /// `totalTokenCount`, when present.
    pub total_token_count: Option<usize>,
}
245
246#[derive(Debug, Deserialize, Serialize)]
247#[serde(rename_all = "camelCase")]
248pub struct GenerationConfig {
249 pub candidate_count: Option<usize>,
250 pub stop_sequences: Option<Vec<String>>,
251 pub max_output_tokens: Option<usize>,
252 pub temperature: Option<f64>,
253 pub top_p: Option<f64>,
254 pub top_k: Option<usize>,
255}
256
/// Pairs a harm category with the blocking threshold to apply to it.
#[derive(Debug, Serialize, Deserialize)]
#[serde(rename_all = "camelCase")]
pub struct SafetySetting {
    /// The category this setting applies to.
    pub category: HarmCategory,
    /// The blocking threshold for that category.
    pub threshold: HarmBlockThreshold,
}
263
/// Harm categories used in [`SafetySetting`] and [`SafetyRating`].
///
/// Each variant is (de)serialized as the `HARM_CATEGORY_*` string given in its `rename`
/// attribute. A string that matches none of them fails deserialization.
#[derive(Debug, Serialize, Deserialize)]
pub enum HarmCategory {
    #[serde(rename = "HARM_CATEGORY_UNSPECIFIED")]
    Unspecified,
    #[serde(rename = "HARM_CATEGORY_DEROGATORY")]
    Derogatory,
    #[serde(rename = "HARM_CATEGORY_TOXICITY")]
    Toxicity,
    #[serde(rename = "HARM_CATEGORY_VIOLENCE")]
    Violence,
    #[serde(rename = "HARM_CATEGORY_SEXUAL")]
    Sexual,
    #[serde(rename = "HARM_CATEGORY_MEDICAL")]
    Medical,
    #[serde(rename = "HARM_CATEGORY_DANGEROUS")]
    Dangerous,
    #[serde(rename = "HARM_CATEGORY_HARASSMENT")]
    Harassment,
    #[serde(rename = "HARM_CATEGORY_HATE_SPEECH")]
    HateSpeech,
    #[serde(rename = "HARM_CATEGORY_SEXUALLY_EXPLICIT")]
    SexuallyExplicit,
    #[serde(rename = "HARM_CATEGORY_DANGEROUS_CONTENT")]
    DangerousContent,
}
289
290#[derive(Debug, Serialize, Deserialize)]
291pub enum HarmBlockThreshold {
292 #[serde(rename = "HARM_BLOCK_THRESHOLD_UNSPECIFIED")]
293 Unspecified,
294 #[serde(rename = "BLOCK_LOW_AND_ABOVE")]
295 BlockLowAndAbove,
296 #[serde(rename = "BLOCK_MEDIUM_AND_ABOVE")]
297 BlockMediumAndAbove,
298 #[serde(rename = "BLOCK_ONLY_HIGH")]
299 BlockOnlyHigh,
300 #[serde(rename = "BLOCK_NONE")]
301 BlockNone,
302}
303
/// Probability level reported in a [`SafetyRating`].
///
/// Variants are (de)serialized in SCREAMING_SNAKE_CASE (`NEGLIGIBLE`, `LOW`, `MEDIUM`, `HIGH`),
/// except `Unspecified`, which is overridden to `HARM_PROBABILITY_UNSPECIFIED`.
#[derive(Debug, Serialize, Deserialize)]
#[serde(rename_all = "SCREAMING_SNAKE_CASE")]
pub enum HarmProbability {
    #[serde(rename = "HARM_PROBABILITY_UNSPECIFIED")]
    Unspecified,
    Negligible,
    Low,
    Medium,
    High,
}
314
/// A harm category together with its reported probability level.
#[derive(Debug, Serialize, Deserialize)]
#[serde(rename_all = "camelCase")]
pub struct SafetyRating {
    /// The rated category.
    pub category: HarmCategory,
    /// The probability level for that category.
    pub probability: HarmProbability,
}
321
/// Request body sent by `count_tokens`.
#[derive(Debug, Serialize, Deserialize)]
#[serde(rename_all = "camelCase")]
pub struct CountTokensRequest {
    /// The contents whose tokens are to be counted.
    pub contents: Vec<Content>,
}
327
/// Response body decoded by `count_tokens`.
#[derive(Debug, Serialize, Deserialize)]
#[serde(rename_all = "camelCase")]
pub struct CountTokensResponse {
    /// The reported token total (`totalTokens` in JSON).
    pub total_tokens: usize,
}
333
/// A function call carried by a [`FunctionCallPart`].
///
/// Both fields must be present for deserialization to succeed.
#[derive(Debug, Serialize, Deserialize)]
pub struct FunctionCall {
    /// Name of the function being called.
    pub name: String,
    /// Call arguments as arbitrary JSON.
    pub args: serde_json::Value,
}
339
/// A function result carried by a [`FunctionResponsePart`].
#[derive(Debug, Serialize, Deserialize)]
pub struct FunctionResponse {
    /// Name of the function the response belongs to.
    pub name: String,
    /// The response payload as arbitrary JSON.
    pub response: serde_json::Value,
}
345
/// A tool entry in a [`GenerateContentRequest`]: a list of function declarations.
#[derive(Debug, Serialize, Deserialize)]
#[serde(rename_all = "camelCase")]
pub struct Tool {
    /// The declared functions (`functionDeclarations` in JSON).
    pub function_declarations: Vec<FunctionDeclaration>,
}
351
/// Tool configuration in a [`GenerateContentRequest`].
#[derive(Debug, Serialize, Deserialize)]
#[serde(rename_all = "camelCase")]
pub struct ToolConfig {
    /// Function-calling configuration (`functionCallingConfig` in JSON).
    pub function_calling_config: FunctionCallingConfig,
}
357
/// Function-calling configuration held by [`ToolConfig`].
#[derive(Debug, Serialize, Deserialize)]
#[serde(rename_all = "camelCase")]
pub struct FunctionCallingConfig {
    /// The function-calling mode.
    pub mode: FunctionCallingMode,
    /// Optional list of function names; omitted from the JSON when `None`.
    #[serde(skip_serializing_if = "Option::is_none")]
    pub allowed_function_names: Option<Vec<String>>,
}
365
366#[derive(Debug, Serialize, Deserialize)]
367#[serde(rename_all = "lowercase")]
368pub enum FunctionCallingMode {
369 Auto,
370 Any,
371 None,
372}
373
/// Declaration of a callable function, listed in a [`Tool`].
#[derive(Debug, Serialize, Deserialize)]
pub struct FunctionDeclaration {
    /// Function name.
    pub name: String,
    /// Description of the function.
    pub description: String,
    /// Parameter description as arbitrary JSON.
    /// NOTE(review): presumably a JSON-schema-style object — confirm against callers.
    pub parameters: serde_json::Value,
}
380
/// The Gemini models known to this crate, plus a user-defined `Custom` entry.
///
/// Each built-in variant is (de)serialized as the model id given in its `rename` attribute.
/// The `Default` model is [`Model::Gemini20Flash`].
#[cfg_attr(feature = "schemars", derive(schemars::JsonSchema))]
#[derive(Clone, Default, Debug, Deserialize, Serialize, PartialEq, Eq, strum::EnumIter)]
pub enum Model {
    #[serde(rename = "gemini-1.5-pro")]
    Gemini15Pro,
    #[serde(rename = "gemini-1.5-flash")]
    Gemini15Flash,
    #[serde(rename = "gemini-2.0-pro-exp")]
    Gemini20Pro,
    #[serde(rename = "gemini-2.0-flash")]
    #[default]
    Gemini20Flash,
    #[serde(rename = "gemini-2.0-flash-thinking-exp")]
    Gemini20FlashThinking,
    #[serde(rename = "gemini-2.0-flash-lite-preview")]
    Gemini20FlashLite,
    #[serde(rename = "gemini-2.5-pro-exp-03-25")]
    Gemini25ProExp0325,
    #[serde(rename = "gemini-2.5-pro-preview-03-25")]
    Gemini25ProPreview0325,
    #[serde(rename = "gemini-2.5-flash-preview-04-17")]
    Gemini25FlashPreview0417,
    /// A model described by the user rather than built in.
    #[serde(rename = "custom")]
    Custom {
        /// The model id; returned by `Model::id`.
        name: String,
        /// The name displayed in the UI, such as in the assistant panel model dropdown menu.
        display_name: Option<String>,
        /// The token limit; returned by `Model::max_token_count`.
        max_tokens: usize,
    },
}
411
412impl Model {
413 pub fn default_fast() -> Model {
414 Model::Gemini15Flash
415 }
416
417 pub fn id(&self) -> &str {
418 match self {
419 Model::Gemini15Pro => "gemini-1.5-pro",
420 Model::Gemini15Flash => "gemini-1.5-flash",
421 Model::Gemini20Pro => "gemini-2.0-pro-exp",
422 Model::Gemini20Flash => "gemini-2.0-flash",
423 Model::Gemini20FlashThinking => "gemini-2.0-flash-thinking-exp",
424 Model::Gemini20FlashLite => "gemini-2.0-flash-lite-preview",
425 Model::Gemini25ProExp0325 => "gemini-2.5-pro-exp-03-25",
426 Model::Gemini25ProPreview0325 => "gemini-2.5-pro-preview-03-25",
427 Model::Gemini25FlashPreview0417 => "gemini-2.5-flash-preview-04-17",
428 Model::Custom { name, .. } => name,
429 }
430 }
431
432 pub fn display_name(&self) -> &str {
433 match self {
434 Model::Gemini15Pro => "Gemini 1.5 Pro",
435 Model::Gemini15Flash => "Gemini 1.5 Flash",
436 Model::Gemini20Pro => "Gemini 2.0 Pro",
437 Model::Gemini20Flash => "Gemini 2.0 Flash",
438 Model::Gemini20FlashThinking => "Gemini 2.0 Flash Thinking",
439 Model::Gemini20FlashLite => "Gemini 2.0 Flash Lite",
440 Model::Gemini25ProExp0325 => "Gemini 2.5 Pro Exp",
441 Model::Gemini25ProPreview0325 => "Gemini 2.5 Pro Preview",
442 Model::Gemini25FlashPreview0417 => "Gemini 2.5 Flash Preview",
443 Self::Custom {
444 name, display_name, ..
445 } => display_name.as_ref().unwrap_or(name),
446 }
447 }
448
449 pub fn max_token_count(&self) -> usize {
450 match self {
451 Model::Gemini15Pro => 2_000_000,
452 Model::Gemini15Flash => 1_000_000,
453 Model::Gemini20Pro => 2_000_000,
454 Model::Gemini20Flash => 1_000_000,
455 Model::Gemini20FlashThinking => 1_000_000,
456 Model::Gemini20FlashLite => 1_000_000,
457 Model::Gemini25ProExp0325 => 1_000_000,
458 Model::Gemini25ProPreview0325 => 1_000_000,
459 Model::Gemini25FlashPreview0417 => 1_000_000,
460 Model::Custom { max_tokens, .. } => *max_tokens,
461 }
462 }
463}
464
465impl std::fmt::Display for Model {
466 fn fmt(&self, f: &mut std::fmt::Formatter<'_>) -> std::fmt::Result {
467 write!(f, "{}", self.id())
468 }
469}