pub struct MoESGBT<L: Loss = SquaredLoss> { /* private fields */ }
Available on alloc only.
Streaming Mixture of Experts over SGBT ensembles.
Combines K independent SGBT<L> experts with a learned linear softmax
gating network. The gate is trained online via SGD to route samples to the
expert with the lowest loss, while all experts (or the top-k in hard gating
mode) are trained on each incoming sample.
Generic over L: Loss so the expert loss function is monomorphized. The
default is SquaredLoss for regression tasks.
Gate Architecture
The gate is a single linear layer: z_k = W_k · x + b_k followed by
softmax. Weights are lazily initialized to zeros on the first sample
(since the feature dimensionality is not known at construction time).
The gate learns via cross-entropy gradient descent against the one-hot
indicator of the best expert per sample.
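As an illustration of the gate described above (a sketch, not the crate's actual internals; the function and parameter names are assumptions), the forward pass is a per-expert linear layer followed by a numerically stable softmax:

```rust
// Sketch of the gate's forward pass: z_k = W_k . x + b_k, then softmax.
// `w` holds K weight rows, `b` holds K biases; all names are illustrative.
fn gate_probabilities(w: &[Vec<f64>], b: &[f64], x: &[f64]) -> Vec<f64> {
    // Linear logits, one per expert.
    let z: Vec<f64> = w
        .iter()
        .zip(b)
        .map(|(wk, bk)| wk.iter().zip(x).map(|(wi, xi)| wi * xi).sum::<f64>() + bk)
        .collect();
    // Softmax, shifted by max(z) for numerical stability.
    let m = z.iter().cloned().fold(f64::NEG_INFINITY, f64::max);
    let e: Vec<f64> = z.iter().map(|zk| (zk - m).exp()).collect();
    let s: f64 = e.iter().sum();
    e.iter().map(|ek| ek / s).collect()
}
```

Note that zero-initialized weights produce uniform probabilities (1/K per expert), which is why lazy initialization to zeros gives a sensible starting point.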
Implementations

impl MoESGBT<SquaredLoss>

pub fn new(config: SGBTConfig, n_experts: usize) -> Self
Create a new MoE ensemble with squared loss (regression) and soft gating.
Each expert is seeded uniquely via config.seed ^ (0x0000_0E00_0000_0000 | i).
The gating learning rate defaults to 0.01.
Panics
Panics if n_experts < 1.
impl<L: Loss + Clone> MoESGBT<L>

pub fn with_loss(config: SGBTConfig, loss: L, n_experts: usize) -> Self
pub fn with_gating(
    config: SGBTConfig,
    loss: L,
    n_experts: usize,
    gating_mode: GatingMode,
    gate_lr: f64,
) -> Self
Create a new MoE ensemble with full control over gating mode and gate learning rate.
Panics
Panics if n_experts < 1.
impl<L: Loss> MoESGBT<L>

pub fn gating_probabilities(&self, features: &[f64]) -> Vec<f64>
Compute gating probabilities for a feature vector.
Returns a K-length vector of probabilities summing to 1.0, one per expert. If the gate has not yet been initialized (no training samples seen), returns uniform probabilities (1/K per expert).
pub fn train_one(&mut self, sample: &impl Observation)
Train on a single observation.
- Lazily initializes the gate weights if this is the first sample.
- Computes gating probabilities via softmax over the linear gate.
- Routes the sample to experts according to the gating mode:
  - Soft: all experts receive the sample, each weighted by its gating probability (via SampleRef::weighted).
  - Hard(top_k): only the top-k experts by probability receive the sample (with unit weight).
- Updates gate weights via SGD on the cross-entropy gradient: find the best expert (lowest loss), compute dz_k = p_k - 1{k==best}, and apply W_k -= gate_lr * dz_k * x and b_k -= gate_lr * dz_k.
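The gate update in the final step can be sketched as follows (an illustrative standalone function, not the crate's internals; all names are assumptions):

```rust
// Sketch of the gate's cross-entropy SGD step: given gating probabilities
// `p`, the index of the best (lowest-loss) expert, the feature vector `x`,
// and the gate learning rate, nudge the gate toward routing to `best`.
fn gate_sgd_step(
    w: &mut [Vec<f64>],
    b: &mut [f64],
    p: &[f64],
    best: usize,
    x: &[f64],
    gate_lr: f64,
) {
    for k in 0..p.len() {
        // Gradient of cross-entropy w.r.t. logit k against the one-hot
        // target: dz_k = p_k - 1{k==best}.
        let dz = p[k] - if k == best { 1.0 } else { 0.0 };
        for (wi, xi) in w[k].iter_mut().zip(x) {
            *wi -= gate_lr * dz * xi; // W_k -= gate_lr * dz_k * x
        }
        b[k] -= gate_lr * dz; // b_k -= gate_lr * dz_k
    }
}
```

Because dz_k is negative only for the best expert, its logit rises while all others fall, so repeated updates concentrate probability mass on experts that tend to win in a given feature region.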
pub fn train_batch<O: Observation>(&mut self, samples: &[O])
Train on a batch of observations.
pub fn predict(&self, features: &[f64]) -> f64
Predict the output for a feature vector.
Computes the probability-weighted sum of expert predictions:
ŷ = Σ_k p_k(x) · f_k(x).
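The combination step reduces to a dot product between the gating distribution and the per-expert outputs. A minimal sketch (illustrative names, not the crate's code):

```rust
// Probability-weighted mixture prediction: ŷ = Σ_k p_k(x) · f_k(x).
// `probs` is the gating distribution, `expert_preds` the raw expert outputs.
fn mixture_predict(probs: &[f64], expert_preds: &[f64]) -> f64 {
    probs
        .iter()
        .zip(expert_preds)
        .map(|(pk, fk)| pk * fk)
        .sum()
}
```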
pub fn predict_with_gating(&self, features: &[f64]) -> (f64, Vec<f64>)
Predict with gating probabilities returned alongside the prediction.
Returns (prediction, probabilities) where probabilities is a K-length
vector summing to 1.0.
pub fn expert_predictions(&self, features: &[f64]) -> Vec<f64>
Get each expert’s individual prediction for a feature vector.
Returns a K-length vector of raw predictions, one per expert.
pub fn n_samples_seen(&self) -> u64
Total training samples seen.