1 2 3 4 5 6 7 8 9 10 11
//! Mixture of Experts (MoE) attention mechanisms //! //! This module provides MoE attention where different inputs route to specialized experts. pub mod expert; pub mod moe_attention; pub mod router; pub use expert::{Expert, ExpertType, HyperbolicExpert, LinearExpert, StandardExpert}; pub use moe_attention::{MoEAttention, MoEConfig}; pub use router::{LearnedRouter, Router, TopKRouting};