pub struct MuonConfig {
pub learning_rate: f32,
pub momentum: f32,
pub ns_steps: usize,
pub min_dim_2d: usize,
pub fallback_lr: f32,
pub fallback_momentum: f32,
pub weight_decay: f32,
pub use_orthogonal: bool,
}
Configuration for the Muon optimizer.
Fields§
learning_rate: f32 — Learning rate (default: 0.02)
momentum: f32 — Momentum coefficient (default: 0.95)
ns_steps: usize — Number of Newton-Schulz iteration steps (default: 5)
min_dim_2d: usize — Minimum dimension for 2D optimization (default: 64)
fallback_lr: f32 — Fallback optimizer learning rate for 1D parameters (default: 1e-3)
fallback_momentum: f32 — Fallback momentum for 1D parameters (default: 0.9)
weight_decay: f32 — Weight decay coefficient (default: 0.0)
use_orthogonal: bool — Whether to use orthogonalization (default: true)
Trait Implementations§
Source§impl Clone for MuonConfig
impl Clone for MuonConfig
Source§fn clone(&self) -> MuonConfig
fn clone(&self) -> MuonConfig
Returns a duplicate of the value. Read more
1.0.0 · Source§fn clone_from(&mut self, source: &Self)
fn clone_from(&mut self, source: &Self)
Performs copy-assignment from source. Read more
Source§impl Debug for MuonConfig
impl Debug for MuonConfig
Source§impl Default for MuonConfig
impl Default for MuonConfig
Source§impl<'de> Deserialize<'de> for MuonConfig
impl<'de> Deserialize<'de> for MuonConfig
Source§fn deserialize<__D>(__deserializer: __D) -> Result<Self, __D::Error> where
__D: Deserializer<'de>,
fn deserialize<__D>(__deserializer: __D) -> Result<Self, __D::Error> where
__D: Deserializer<'de>,
Deserialize this value from the given Serde deserializer. Read more
Auto Trait Implementations§
impl Freeze for MuonConfig
impl RefUnwindSafe for MuonConfig
impl Send for MuonConfig
impl Sync for MuonConfig
impl Unpin for MuonConfig
impl UnwindSafe for MuonConfig
Blanket Implementations§
Source§impl<T> BorrowMut<T> for T where
T: ?Sized,
impl<T> BorrowMut<T> for T where
T: ?Sized,
Source§fn borrow_mut(&mut self) -> &mut T
fn borrow_mut(&mut self) -> &mut T
Mutably borrows from an owned value. Read more
Source§impl<T> CloneToUninit for T where
T: Clone,
impl<T> CloneToUninit for T where
T: Clone,
Source§impl<T> ConfigSerializable for T where
T: Serialize + for<'de> Deserialize<'de>,
impl<T> ConfigSerializable for T where
T: Serialize + for<'de> Deserialize<'de>,
Source§fn save_to_file(&self, path: &Path) -> Result<(), TrustformersError>
fn save_to_file(&self, path: &Path) -> Result<(), TrustformersError>
Save to file
Source§fn load_from_file(path: &Path) -> Result<Self, TrustformersError> where
Self: Sized,
fn load_from_file(path: &Path) -> Result<Self, TrustformersError> where
Self: Sized,
Load from file
Source§impl<T> Instrument for T
impl<T> Instrument for T
Source§fn instrument(self, span: Span) -> Instrumented<Self>
fn instrument(self, span: Span) -> Instrumented<Self>
Source§fn in_current_span(self) -> Instrumented<Self>
fn in_current_span(self) -> Instrumented<Self>
Source§impl<T> IntoEither for T
impl<T> IntoEither for T
Source§fn into_either(self, into_left: bool) -> Either<Self, Self>
fn into_either(self, into_left: bool) -> Either<Self, Self>
Converts self into a Left variant of Either<Self, Self> if into_left is true.
Converts self into a Right variant of Either<Self, Self> otherwise. Read more
Source§fn into_either_with<F>(self, into_left: F) -> Either<Self, Self>
fn into_either_with<F>(self, into_left: F) -> Either<Self, Self>
Converts self into a Left variant of Either<Self, Self> if into_left(&self) returns true.
Converts self into a Right variant of Either<Self, Self> otherwise. Read more