llm-multimodal 1.7.0

Multimodal processing for vision and other modalities
Documentation
// Public modules of the crate. Each `pub mod name;` declares a module whose
// body lives in a separate file, and makes it reachable from outside the
// crate by its path (e.g. `hasher::...`).
//
// Source of selected items re-exported at the crate root.
pub mod error;
// No crate-root re-export from this module is visible in this file; its items
// are reached through the `hasher::` path.
pub mod hasher;
// No crate-root re-export from this module is visible in this file; its items
// are reached through the `hub::` path.
pub mod hub;
// Source of selected items re-exported at the crate root.
pub mod media;
// Source of selected items re-exported at the crate root.
pub mod registry;
// Source of selected items re-exported at the crate root.
pub mod tracker;
// Source of selected items re-exported at the crate root.
pub mod types;
// Source of selected items re-exported at the crate root.
pub mod vision;

// Crate-root re-exports. Each `pub use` below makes the listed items available
// directly at the crate root, so callers do not have to spell out the defining
// module. The items remain reachable through their module paths as well, since
// the modules themselves are public.
//
// From `error`. NOTE(review): judging by the names these are the crate's error
// types plus a result alias; confirm against the `error` module.
pub use error::{MediaConnectorError, MultiModalError, MultiModalResult};
// From `media`: the media connector, its configuration types, and `MediaSource`.
pub use media::{
    ImageFetchConfig, MediaConnector, MediaConnectorConfig, MediaSource, VideoFetchConfig,
};
// From `registry`.
pub use registry::{ModelMetadata, ModelProcessorSpec, ModelRegistry};
// From `tracker`.
pub use tracker::{AsyncMultiModalTracker, TrackerOutput};
// From `types`. NOTE(review): these look like the shared data types used
// across the crate; confirm against the `types` module.
pub use types::{
    FieldLayout, ImageDetail, ImageFrame, ImageSize, ImageSource, MediaContentPart, Modality,
    MultiModalData, MultiModalUUIDs, PlaceholderRange, PromptReplacement, RgbFrameRef, TokenId,
    TrackedMedia, VideoClip, VideoSource,
};
// Re-export vision processing components from `vision`.
pub use vision::{
    LlavaNextProcessor, LlavaProcessor, ModelSpecificValue, PreProcessorConfig,
    PreprocessedEncoderInputs, TransformError, VisionPreProcessor, VisionProcessorRegistry,
};