llm-multimodal 1.2.0

Multimodal processing for vision and other modalities
Documentation
pub mod error;
pub mod media;
pub mod registry;
pub mod tracker;
pub mod types;
pub mod vision;

pub use error::{MediaConnectorError, MultiModalError, MultiModalResult};
pub use media::{ImageFetchConfig, MediaConnector, MediaConnectorConfig, MediaSource};
pub use registry::{ModelMetadata, ModelProcessorSpec, ModelRegistry};
pub use tracker::{AsyncMultiModalTracker, TrackerOutput};
pub use types::{
    ChatContentPart, ImageDetail, ImageFrame, ImageSize, ImageSource, Modality, MultiModalData,
    MultiModalInputs, MultiModalTensor, MultiModalUUIDs, MultiModalValue, PlaceholderRange,
    PromptReplacement, TokenId, TrackedMedia,
};
// Re-export vision processing components
pub use vision::{
    ImagePreProcessor, ImageProcessorRegistry, LlavaNextProcessor, LlavaProcessor,
    ModelSpecificValue, PreProcessorConfig, PreprocessedImages, TransformError,
};