google_ai.rs

  1use anyhow::{Result, anyhow, bail};
  2use futures::{AsyncBufReadExt, AsyncReadExt, StreamExt, io::BufReader, stream::BoxStream};
  3use http_client::{AsyncBody, HttpClient, Method, Request as HttpRequest};
  4use serde::{Deserialize, Serialize};
  5
  6pub const API_URL: &str = "https://generativelanguage.googleapis.com";
  7
  8pub async fn stream_generate_content(
  9    client: &dyn HttpClient,
 10    api_url: &str,
 11    api_key: &str,
 12    mut request: GenerateContentRequest,
 13) -> Result<BoxStream<'static, Result<GenerateContentResponse>>> {
 14    if request.contents.is_empty() {
 15        bail!("Request must contain at least one content item");
 16    }
 17
 18    if let Some(user_content) = request
 19        .contents
 20        .iter()
 21        .find(|content| content.role == Role::User)
 22    {
 23        if user_content.parts.is_empty() {
 24            bail!("User content must contain at least one part");
 25        }
 26    }
 27
 28    let uri = format!(
 29        "{api_url}/v1beta/models/{model}:streamGenerateContent?alt=sse&key={api_key}",
 30        model = request.model
 31    );
 32    request.model.clear();
 33
 34    let request_builder = HttpRequest::builder()
 35        .method(Method::POST)
 36        .uri(uri)
 37        .header("Content-Type", "application/json");
 38
 39    let request = request_builder.body(AsyncBody::from(serde_json::to_string(&request)?))?;
 40    let mut response = client.send(request).await?;
 41    if response.status().is_success() {
 42        let reader = BufReader::new(response.into_body());
 43        Ok(reader
 44            .lines()
 45            .filter_map(|line| async move {
 46                match line {
 47                    Ok(line) => {
 48                        if let Some(line) = line.strip_prefix("data: ") {
 49                            match serde_json::from_str(line) {
 50                                Ok(response) => Some(Ok(response)),
 51                                Err(error) => Some(Err(anyhow!(error))),
 52                            }
 53                        } else {
 54                            None
 55                        }
 56                    }
 57                    Err(error) => Some(Err(anyhow!(error))),
 58                }
 59            })
 60            .boxed())
 61    } else {
 62        let mut text = String::new();
 63        response.body_mut().read_to_string(&mut text).await?;
 64        Err(anyhow!(
 65            "error during streamGenerateContent, status code: {:?}, body: {}",
 66            response.status(),
 67            text
 68        ))
 69    }
 70}
 71
 72pub async fn count_tokens(
 73    client: &dyn HttpClient,
 74    api_url: &str,
 75    api_key: &str,
 76    request: CountTokensRequest,
 77) -> Result<CountTokensResponse> {
 78    let uri = format!(
 79        "{}/v1beta/models/gemini-pro:countTokens?key={}",
 80        api_url, api_key
 81    );
 82    let request = serde_json::to_string(&request)?;
 83
 84    let request_builder = HttpRequest::builder()
 85        .method(Method::POST)
 86        .uri(&uri)
 87        .header("Content-Type", "application/json");
 88
 89    let http_request = request_builder.body(AsyncBody::from(request))?;
 90    let mut response = client.send(http_request).await?;
 91    let mut text = String::new();
 92    response.body_mut().read_to_string(&mut text).await?;
 93    if response.status().is_success() {
 94        Ok(serde_json::from_str::<CountTokensResponse>(&text)?)
 95    } else {
 96        Err(anyhow!(
 97            "error during countTokens, status code: {:?}, body: {}",
 98            response.status(),
 99            text
100        ))
101    }
102}
103
104#[derive(Debug, Serialize, Deserialize)]
105pub enum Task {
106    #[serde(rename = "generateContent")]
107    GenerateContent,
108    #[serde(rename = "streamGenerateContent")]
109    StreamGenerateContent,
110    #[serde(rename = "countTokens")]
111    CountTokens,
112    #[serde(rename = "embedContent")]
113    EmbedContent,
114    #[serde(rename = "batchEmbedContents")]
115    BatchEmbedContents,
116}
117
118#[derive(Debug, Serialize, Deserialize)]
119#[serde(rename_all = "camelCase")]
120pub struct GenerateContentRequest {
121    #[serde(default, skip_serializing_if = "String::is_empty")]
122    pub model: String,
123    pub contents: Vec<Content>,
124    pub system_instruction: Option<SystemInstruction>,
125    pub generation_config: Option<GenerationConfig>,
126    pub safety_settings: Option<Vec<SafetySetting>>,
127    #[serde(skip_serializing_if = "Option::is_none")]
128    pub tools: Option<Vec<Tool>>,
129    #[serde(skip_serializing_if = "Option::is_none")]
130    pub tool_config: Option<ToolConfig>,
131}
132
133#[derive(Debug, Serialize, Deserialize)]
134#[serde(rename_all = "camelCase")]
135pub struct GenerateContentResponse {
136    pub candidates: Option<Vec<GenerateContentCandidate>>,
137    pub prompt_feedback: Option<PromptFeedback>,
138    pub usage_metadata: Option<UsageMetadata>,
139}
140
141#[derive(Debug, Serialize, Deserialize)]
142#[serde(rename_all = "camelCase")]
143pub struct GenerateContentCandidate {
144    pub index: Option<usize>,
145    pub content: Content,
146    pub finish_reason: Option<String>,
147    pub finish_message: Option<String>,
148    pub safety_ratings: Option<Vec<SafetyRating>>,
149    pub citation_metadata: Option<CitationMetadata>,
150}
151
152#[derive(Debug, Serialize, Deserialize)]
153#[serde(rename_all = "camelCase")]
154pub struct Content {
155    pub parts: Vec<Part>,
156    pub role: Role,
157}
158
159#[derive(Debug, Serialize, Deserialize)]
160#[serde(rename_all = "camelCase")]
161pub struct SystemInstruction {
162    pub parts: Vec<Part>,
163}
164
165#[derive(Debug, PartialEq, Deserialize, Serialize)]
166#[serde(rename_all = "camelCase")]
167pub enum Role {
168    User,
169    Model,
170}
171
172#[derive(Debug, Serialize, Deserialize)]
173#[serde(untagged)]
174pub enum Part {
175    TextPart(TextPart),
176    InlineDataPart(InlineDataPart),
177    FunctionCallPart(FunctionCallPart),
178    FunctionResponsePart(FunctionResponsePart),
179}
180
181#[derive(Debug, Serialize, Deserialize)]
182#[serde(rename_all = "camelCase")]
183pub struct TextPart {
184    pub text: String,
185}
186
187#[derive(Debug, Serialize, Deserialize)]
188#[serde(rename_all = "camelCase")]
189pub struct InlineDataPart {
190    pub inline_data: GenerativeContentBlob,
191}
192
193#[derive(Debug, Serialize, Deserialize)]
194#[serde(rename_all = "camelCase")]
195pub struct GenerativeContentBlob {
196    pub mime_type: String,
197    pub data: String,
198}
199
200#[derive(Debug, Serialize, Deserialize)]
201#[serde(rename_all = "camelCase")]
202pub struct FunctionCallPart {
203    pub function_call: FunctionCall,
204}
205
206#[derive(Debug, Serialize, Deserialize)]
207#[serde(rename_all = "camelCase")]
208pub struct FunctionResponsePart {
209    pub function_response: FunctionResponse,
210}
211
212#[derive(Debug, Serialize, Deserialize)]
213#[serde(rename_all = "camelCase")]
214pub struct CitationSource {
215    pub start_index: Option<usize>,
216    pub end_index: Option<usize>,
217    pub uri: Option<String>,
218    pub license: Option<String>,
219}
220
221#[derive(Debug, Serialize, Deserialize)]
222#[serde(rename_all = "camelCase")]
223pub struct CitationMetadata {
224    pub citation_sources: Vec<CitationSource>,
225}
226
227#[derive(Debug, Serialize, Deserialize)]
228#[serde(rename_all = "camelCase")]
229pub struct PromptFeedback {
230    pub block_reason: Option<String>,
231    pub safety_ratings: Vec<SafetyRating>,
232    pub block_reason_message: Option<String>,
233}
234
235#[derive(Debug, Serialize, Deserialize, Default)]
236#[serde(rename_all = "camelCase")]
237pub struct UsageMetadata {
238    pub prompt_token_count: Option<usize>,
239    pub cached_content_token_count: Option<usize>,
240    pub candidates_token_count: Option<usize>,
241    pub tool_use_prompt_token_count: Option<usize>,
242    pub thoughts_token_count: Option<usize>,
243    pub total_token_count: Option<usize>,
244}
245
246#[derive(Debug, Deserialize, Serialize)]
247#[serde(rename_all = "camelCase")]
248pub struct GenerationConfig {
249    pub candidate_count: Option<usize>,
250    pub stop_sequences: Option<Vec<String>>,
251    pub max_output_tokens: Option<usize>,
252    pub temperature: Option<f64>,
253    pub top_p: Option<f64>,
254    pub top_k: Option<usize>,
255}
256
257#[derive(Debug, Serialize, Deserialize)]
258#[serde(rename_all = "camelCase")]
259pub struct SafetySetting {
260    pub category: HarmCategory,
261    pub threshold: HarmBlockThreshold,
262}
263
264#[derive(Debug, Serialize, Deserialize)]
265pub enum HarmCategory {
266    #[serde(rename = "HARM_CATEGORY_UNSPECIFIED")]
267    Unspecified,
268    #[serde(rename = "HARM_CATEGORY_DEROGATORY")]
269    Derogatory,
270    #[serde(rename = "HARM_CATEGORY_TOXICITY")]
271    Toxicity,
272    #[serde(rename = "HARM_CATEGORY_VIOLENCE")]
273    Violence,
274    #[serde(rename = "HARM_CATEGORY_SEXUAL")]
275    Sexual,
276    #[serde(rename = "HARM_CATEGORY_MEDICAL")]
277    Medical,
278    #[serde(rename = "HARM_CATEGORY_DANGEROUS")]
279    Dangerous,
280    #[serde(rename = "HARM_CATEGORY_HARASSMENT")]
281    Harassment,
282    #[serde(rename = "HARM_CATEGORY_HATE_SPEECH")]
283    HateSpeech,
284    #[serde(rename = "HARM_CATEGORY_SEXUALLY_EXPLICIT")]
285    SexuallyExplicit,
286    #[serde(rename = "HARM_CATEGORY_DANGEROUS_CONTENT")]
287    DangerousContent,
288}
289
290#[derive(Debug, Serialize, Deserialize)]
291pub enum HarmBlockThreshold {
292    #[serde(rename = "HARM_BLOCK_THRESHOLD_UNSPECIFIED")]
293    Unspecified,
294    #[serde(rename = "BLOCK_LOW_AND_ABOVE")]
295    BlockLowAndAbove,
296    #[serde(rename = "BLOCK_MEDIUM_AND_ABOVE")]
297    BlockMediumAndAbove,
298    #[serde(rename = "BLOCK_ONLY_HIGH")]
299    BlockOnlyHigh,
300    #[serde(rename = "BLOCK_NONE")]
301    BlockNone,
302}
303
304#[derive(Debug, Serialize, Deserialize)]
305#[serde(rename_all = "SCREAMING_SNAKE_CASE")]
306pub enum HarmProbability {
307    #[serde(rename = "HARM_PROBABILITY_UNSPECIFIED")]
308    Unspecified,
309    Negligible,
310    Low,
311    Medium,
312    High,
313}
314
315#[derive(Debug, Serialize, Deserialize)]
316#[serde(rename_all = "camelCase")]
317pub struct SafetyRating {
318    pub category: HarmCategory,
319    pub probability: HarmProbability,
320}
321
322#[derive(Debug, Serialize, Deserialize)]
323#[serde(rename_all = "camelCase")]
324pub struct CountTokensRequest {
325    pub contents: Vec<Content>,
326}
327
328#[derive(Debug, Serialize, Deserialize)]
329#[serde(rename_all = "camelCase")]
330pub struct CountTokensResponse {
331    pub total_tokens: usize,
332}
333
334#[derive(Debug, Serialize, Deserialize)]
335pub struct FunctionCall {
336    pub name: String,
337    pub args: serde_json::Value,
338}
339
340#[derive(Debug, Serialize, Deserialize)]
341pub struct FunctionResponse {
342    pub name: String,
343    pub response: serde_json::Value,
344}
345
346#[derive(Debug, Serialize, Deserialize)]
347#[serde(rename_all = "camelCase")]
348pub struct Tool {
349    pub function_declarations: Vec<FunctionDeclaration>,
350}
351
352#[derive(Debug, Serialize, Deserialize)]
353#[serde(rename_all = "camelCase")]
354pub struct ToolConfig {
355    pub function_calling_config: FunctionCallingConfig,
356}
357
358#[derive(Debug, Serialize, Deserialize)]
359#[serde(rename_all = "camelCase")]
360pub struct FunctionCallingConfig {
361    pub mode: FunctionCallingMode,
362    #[serde(skip_serializing_if = "Option::is_none")]
363    pub allowed_function_names: Option<Vec<String>>,
364}
365
366#[derive(Debug, Serialize, Deserialize)]
367#[serde(rename_all = "lowercase")]
368pub enum FunctionCallingMode {
369    Auto,
370    Any,
371    None,
372}
373
374#[derive(Debug, Serialize, Deserialize)]
375pub struct FunctionDeclaration {
376    pub name: String,
377    pub description: String,
378    pub parameters: serde_json::Value,
379}
380
381#[cfg_attr(feature = "schemars", derive(schemars::JsonSchema))]
382#[derive(Clone, Default, Debug, Deserialize, Serialize, PartialEq, Eq, strum::EnumIter)]
383pub enum Model {
384    #[serde(rename = "gemini-1.5-pro")]
385    Gemini15Pro,
386    #[serde(rename = "gemini-1.5-flash")]
387    Gemini15Flash,
388    #[serde(rename = "gemini-2.0-pro-exp")]
389    Gemini20Pro,
390    #[serde(rename = "gemini-2.0-flash")]
391    #[default]
392    Gemini20Flash,
393    #[serde(rename = "gemini-2.0-flash-thinking-exp")]
394    Gemini20FlashThinking,
395    #[serde(rename = "gemini-2.0-flash-lite-preview")]
396    Gemini20FlashLite,
397    #[serde(rename = "gemini-2.5-pro-exp-03-25")]
398    Gemini25ProExp0325,
399    #[serde(rename = "gemini-2.5-pro-preview-03-25")]
400    Gemini25ProPreview0325,
401    #[serde(rename = "gemini-2.5-flash-preview-04-17")]
402    Gemini25FlashPreview0417,
403    #[serde(rename = "custom")]
404    Custom {
405        name: String,
406        /// The name displayed in the UI, such as in the assistant panel model dropdown menu.
407        display_name: Option<String>,
408        max_tokens: usize,
409    },
410}
411
412impl Model {
413    pub fn default_fast() -> Model {
414        Model::Gemini15Flash
415    }
416
417    pub fn id(&self) -> &str {
418        match self {
419            Model::Gemini15Pro => "gemini-1.5-pro",
420            Model::Gemini15Flash => "gemini-1.5-flash",
421            Model::Gemini20Pro => "gemini-2.0-pro-exp",
422            Model::Gemini20Flash => "gemini-2.0-flash",
423            Model::Gemini20FlashThinking => "gemini-2.0-flash-thinking-exp",
424            Model::Gemini20FlashLite => "gemini-2.0-flash-lite-preview",
425            Model::Gemini25ProExp0325 => "gemini-2.5-pro-exp-03-25",
426            Model::Gemini25ProPreview0325 => "gemini-2.5-pro-preview-03-25",
427            Model::Gemini25FlashPreview0417 => "gemini-2.5-flash-preview-04-17",
428            Model::Custom { name, .. } => name,
429        }
430    }
431
432    pub fn display_name(&self) -> &str {
433        match self {
434            Model::Gemini15Pro => "Gemini 1.5 Pro",
435            Model::Gemini15Flash => "Gemini 1.5 Flash",
436            Model::Gemini20Pro => "Gemini 2.0 Pro",
437            Model::Gemini20Flash => "Gemini 2.0 Flash",
438            Model::Gemini20FlashThinking => "Gemini 2.0 Flash Thinking",
439            Model::Gemini20FlashLite => "Gemini 2.0 Flash Lite",
440            Model::Gemini25ProExp0325 => "Gemini 2.5 Pro Exp",
441            Model::Gemini25ProPreview0325 => "Gemini 2.5 Pro Preview",
442            Model::Gemini25FlashPreview0417 => "Gemini 2.5 Flash Preview",
443            Self::Custom {
444                name, display_name, ..
445            } => display_name.as_ref().unwrap_or(name),
446        }
447    }
448
449    pub fn max_token_count(&self) -> usize {
450        match self {
451            Model::Gemini15Pro => 2_000_000,
452            Model::Gemini15Flash => 1_000_000,
453            Model::Gemini20Pro => 2_000_000,
454            Model::Gemini20Flash => 1_000_000,
455            Model::Gemini20FlashThinking => 1_000_000,
456            Model::Gemini20FlashLite => 1_000_000,
457            Model::Gemini25ProExp0325 => 1_000_000,
458            Model::Gemini25ProPreview0325 => 1_000_000,
459            Model::Gemini25FlashPreview0417 => 1_000_000,
460            Model::Custom { max_tokens, .. } => *max_tokens,
461        }
462    }
463}
464
465impl std::fmt::Display for Model {
466    fn fmt(&self, f: &mut std::fmt::Formatter<'_>) -> std::fmt::Result {
467        write!(f, "{}", self.id())
468    }
469}