//! Input types for multimodal model forward passes.
use Runtime;
use Tensor;
/// Input for multimodal model forward pass.
///
/// Distinguishes between text-only and multimodal inputs so the model
/// can skip encoder processing when no images/audio are present.