Skip to main content

multimodal/
multimodal.rs

1use gemini_client_api::gemini::ask::Gemini;
2use gemini_client_api::gemini::types::sessions::Session;
3use gemini_client_api::gemini::utils::MarkdownToParts;
4use std::env;
5
6#[tokio::test]
7async fn raw_multimodal() {
8    use gemini_client_api::gemini::types::request::InlineData;
9
10    let mut session = Session::new(6);
11    let api_key = std::env::var("GEMINI_API_KEY").expect("GEMINI_API_KEY must be set");
12    let ai = Gemini::new(api_key, "gemini-2.5-flash", None);
13
14    session.ask("What is there in this pdf")
15        .ask(InlineData::from_url("https://bitmesra.ac.in/UploadedDocuments/admingo/files/221225_List%20of%20Holiday_2026_26.pdf").await.unwrap());
16
17    let response = ai.ask(&mut session).await.unwrap();
18    println!("\nGemini: {}", response.get_chat().get_text_no_think(""));
19}
20
21#[tokio::main]
22async fn main() {
23    let mut session = Session::new(6);
24    let api_key = env::var("GEMINI_API_KEY").expect("GEMINI_API_KEY must be set");
25    let ai = Gemini::new(api_key, "gemini-2.5-flash", None);
26
27    // Use MarkdownToParts to easily parse a string with image/file markers
28    // It supports both URLs and local file paths!
29    let content = "Describe this image: ![](https://avatars.githubusercontent.com/u/140788315?v=4)";
30    println!("Processing: {}", content);
31
32    let parts = MarkdownToParts::new(content, |_| mime::IMAGE_PNG)
33        .await
34        .process();
35
36    let response = ai.ask(session.ask_parts(parts)).await.unwrap();
37
38    println!("\nGemini: {}", response.get_chat().get_text_no_think(""));
39}