1use anyhow::Result;
2use mistralrs::{IsqType, TextMessageRole, VisionMessages, VisionModelBuilder};
3
4#[tokio::main]
5async fn main() -> Result<()> {
6 let model = VisionModelBuilder::new("google/gemma-3n-E4B-it")
7 .with_isq(IsqType::Q4K)
8 .with_logging()
9 .build()
10 .await?;
11
12 let bytes = match reqwest::blocking::get(
13 "https://cdn.britannica.com/45/5645-050-B9EC0205/head-treasure-flower-disk-flowers-inflorescence-ray.jpg",
14 ) {
15 Ok(http_resp) => http_resp.bytes()?.to_vec(),
16 Err(e) => anyhow::bail!(e),
17 };
18 let image = image::load_from_memory(&bytes)?;
19
20 let messages = VisionMessages::new().add_image_message(
21 TextMessageRole::User,
22 "What is depicted here? Please describe the scene in detail.",
23 vec![image],
24 &model,
25 )?;
26
27 let response = model.send_chat_request(messages).await?;
28
29 println!("{}", response.choices[0].message.content.as_ref().unwrap());
30 dbg!(
31 response.usage.avg_prompt_tok_per_sec,
32 response.usage.avg_compl_tok_per_sec
33 );
34
35 Ok(())
36}