1 2 3 4 5 6
//! Idefics3 multimodal model implementation. //! //! Vision-language model components for multimodal embedding generation. pub mod model; pub mod tensor_processing;