Struct SaeAssignment

Source

pub struct SaeAssignment {
    pub logits: Array2<f64>,
    pub coords: Vec<LatentCoordValues>,
    pub mode: AssignmentMode,
    pub ungated: Vec<bool>,
    pub frozen_logits: Option<Array2<f64>>,
}

Expand description

Per-row latent assignment state.

The stored assignment parameter is `logits`; non-negative assignments are derived by row-wise softmax, independent IBP-MAP sigmoid active indicators, or JumpReLU gates. Softmax logits are canonicalized to the reference chart `logits[K - 1] = 0`, so the row-local Newton coordinates contain only the first `K - 1` logits (0 coordinates for `K = 1`). Gate-style modes keep all `K` logits as identifiable scalar parameters. `coords[k]` holds `t_{.,k}` for atom `k`.

Fields§

§logits: Array2<f64>

§coords: Vec<LatentCoordValues>

§mode: AssignmentMode

§ungated: Vec<bool>

#1026 — per-atom UNGATED flag (length K, default all-false). An ungated atom is the dense linear/background tier: its per-row gate is fixed at a_k ≡ 1 (it contributes γ_k(t_k) to EVERY row, unweighted), it is excluded from the other atoms’ gate (for the column-separable IBP / JumpReLU modes the remaining atoms are computed independently, so they are unaffected), and its logit is NOT a free parameter — its logit-JVP, sparsity-prior gradient/curvature, and softmax majorizer contributions are all zero, leaving its logit slot an inert (ridge-regularized) null direction in the per-row Newton block. This lets the linear tier carry FULL-RANK reconstructible variance (fitted = γ_ungated(x) + Σ_{gated} a_k·γ_k(x)) so a linear SAE can reach the rank-(K·d) PCA ceiling, while the gated curved atoms still add sparse structure on the residual (#1026 routing-bound finding).

§frozen_logits: Option<Array2<f64>>

#1033 — AMORTIZED / FROZEN routing. When `Some`, this `(n, K)` matrix is a ρ-INVARIANT predicted routing (the amortized `x → logits` map distilled from the frozen dictionary): the gates are computed from THESE logits instead of the free `self.logits`, and the logits are NOT optimized by the inner Newton (their gradient/curvature/prior contributions are zeroed, exactly as for `Self::ungated`). This is the generalization of an ungated atom from “pin the gate at 1” to “pin the gate at the predicted value”: it makes the per-row routing a fixed function of `x` + the frozen dictionary, so the outer ρ-search reuses ONE routing instead of re-solving per-row gates every outer eval — the n-independent-outer-loop lever (#1033). `None` is the historical free-logit path (bit-identical).

Struct SaeAssignment Copy item path

Fields§

Implementations§

impl SaeAssignment

pub fn new( logits: Array2<f64>, coords: Vec<LatentCoordValues>, temperature: f64, ) -> Result<Self, String>

pub fn with_mode( logits: Array2<f64>, coords: Vec<LatentCoordValues>, mode: AssignmentMode, ) -> Result<Self, String>

pub fn with_frozen_routing( self, predicted: Option<Array2<f64>>, ) -> Result<Self, String>

pub fn routing_is_frozen(&self) -> bool

pub fn freeze_routing_from_current_logits(self) -> Result<Self, String>

pub fn freeze_routing_in_place(&mut self) -> Result<(), String>

pub fn set_frozen_routing_in_place( &mut self, predicted: Array2<f64>, ) -> Result<(), String>

pub fn thaw_routing(&mut self)

pub fn with_ungated(self, flags: Vec<bool>) -> Result<Self, String>

pub fn has_ungated(&self) -> bool

pub fn n_obs(&self) -> usize

pub fn k_atoms(&self) -> usize

pub fn total_coord_dim(&self) -> usize

pub fn assignment_coord_dim(&self) -> usize

pub fn row_block_dim(&self) -> usize

pub fn coord_offsets(&self) -> Vec<usize>

pub fn assignments(&self) -> Array2<f64>

pub fn assignments_row(&self, row: usize) -> Array1<f64>

pub fn try_assignments_row(&self, row: usize) -> Result<Array1<f64>, String>

pub fn flatten_ext_coords(&self) -> Array1<f64>

pub fn from_blocks_with_mode( logits: Array2<f64>, coord_blocks: Vec<Array2<f64>>, mode: AssignmentMode, ) -> Result<Self, String>

pub fn from_blocks_with_mode_and_manifolds( logits: Array2<f64>, coord_blocks: Vec<Array2<f64>>, manifolds: Vec<LatentManifold>, mode: AssignmentMode, ) -> Result<Self, String>

Trait Implementations§

impl Clone for SaeAssignment

fn clone(&self) -> SaeAssignment

fn clone_from(&mut self, source: &Self)

impl Debug for SaeAssignment

fn fmt(&self, f: &mut Formatter<'_>) -> Result

Auto Trait Implementations§

impl Freeze for SaeAssignment

impl RefUnwindSafe for SaeAssignment

impl Send for SaeAssignment

impl Sync for SaeAssignment

impl Unpin for SaeAssignment

impl UnsafeUnpin for SaeAssignment

impl UnwindSafe for SaeAssignment

Blanket Implementations§

impl<T> Allocation for T where T: RefUnwindSafe + Send + Sync,

impl<T> Any for T where T: 'static + ?Sized,

fn type_id(&self) -> TypeId

impl<T> Borrow<T> for T where T: ?Sized,

fn borrow(&self) -> &T

impl<T> BorrowMut<T> for T where T: ?Sized,

fn borrow_mut(&mut self) -> &mut T

impl<T> ByRef<T> for T

fn by_ref(&self) -> &T

impl<ST, DT> CastableFrom<ST, Initialized, Initialized> for DT where ST: ?Sized, DT: ?Sized,

impl<ST, DT> CastableFrom<ST, Uninit, Uninit> for DT where ST: ?Sized, DT: ?Sized,

impl<T> CloneToUninit for T where T: Clone,

unsafe fn clone_to_uninit(&self, dest: *mut u8)

impl<T> DistributionExt for T where T: ?Sized,

fn rand<T>(&self, rng: &mut (impl Rng + ?Sized)) -> T where Self: Distribution<T>,

impl<T> From<T> for T

fn from(t: T) -> T

impl<T, U> Imply<T> for U where T: ?Sized, U: ?Sized,

impl<T, U> Into<U> for T where U: From<T>,

fn into(self) -> U

impl<T> IntoEither for T

fn into_either(self, into_left: bool) -> Either<Self, Self>

fn into_either_with<F>(self, into_left: F) -> Either<Self, Self> where F: FnOnce(&Self) -> bool,

impl<T> Pointable for T

const ALIGN: usize

type Init = T

unsafe fn init(init: <T as Pointable>::Init) -> usize

unsafe fn deref<'a>(ptr: usize) -> &'a T

unsafe fn deref_mut<'a>(ptr: usize) -> &'a mut T

unsafe fn drop(ptr: usize)

impl<T> Read<Exclusive, BecauseExclusive> for T where T: ?Sized,

impl<T> Same for T

type Output = T

impl<SS, SP> SupersetOf<SS> for SP where SS: SubsetOf<SP>,

fn to_subset(&self) -> Option<SS>

fn is_in_subset(&self) -> bool

fn to_subset_unchecked(&self) -> SS

fn from_subset(element: &SS) -> SP

impl<T> ToOwned for T where T: Clone,

Struct SaeAssignment

impl<T> Allocation for T
where T: RefUnwindSafe + Send + Sync,

impl<T> Any for T
where T: 'static + ?Sized,

impl<T> Borrow<T> for T
where T: ?Sized,

impl<T> BorrowMut<T> for T
where T: ?Sized,

impl<ST, DT> CastableFrom<ST, Initialized, Initialized> for DT
where ST: ?Sized, DT: ?Sized,

impl<ST, DT> CastableFrom<ST, Uninit, Uninit> for DT
where ST: ?Sized, DT: ?Sized,

impl<T> CloneToUninit for T
where T: Clone,

impl<T> DistributionExt for T
where T: ?Sized,

fn rand<T>(&self, rng: &mut (impl Rng + ?Sized)) -> T
where Self: Distribution<T>,

impl<T, U> Imply<T> for U
where T: ?Sized, U: ?Sized,

impl<T, U> Into<U> for T
where U: From<T>,

fn into_either_with<F>(self, into_left: F) -> Either<Self, Self>
where F: FnOnce(&Self) -> bool,

impl<T> Read<Exclusive, BecauseExclusive> for T
where T: ?Sized,

impl<SS, SP> SupersetOf<SS> for SP
where SS: SubsetOf<SP>,

impl<T> ToOwned for T
where T: Clone,

impl<T, U> TryFrom<U> for T
where U: Into<T>,

impl<T, U> TryInto<U> for T
where U: TryFrom<T>,

impl<V, T> VZip<V> for T
where V: MultiLane<T>,