pub struct MultiscreenModelConfig {
pub vocab_size: usize,
pub seq_len: usize,
pub layers: usize,
pub tiles: usize,
pub d_model: usize,
pub d_key: usize,
pub d_value: usize,
pub w_th: f32,
}
Expand description
Paper-faithful neural Multiscreen model configuration.
Fields§
vocab_size: usize — Vocabulary size.
seq_len: usize — Context length T.
layers: usize — Paper N_L: number of residual Multiscreen layers.
tiles: usize — Paper N_H: number of gated screening tiles per layer.
d_model: usize — Paper d_E: token embedding/model width.
d_key: usize — Paper d_K: query/key width. Must be at least 2 for MiPE.
d_value: usize — Paper d_V: value/gate width.
w_th: f32 — Paper MiPE threshold w_th.
Implementations§
Source§impl MultiscreenModelConfig
impl MultiscreenModelConfig
pub fn tiny() -> Self
pub fn tiny_for_tests() -> Self
pub fn for_parameter_budget( budget: MultiscreenParameterBudget, vocab_size: usize, seq_len: usize, ) -> Self
pub fn preset_1m(vocab_size: usize, seq_len: usize) -> Self
pub fn preset_5m(vocab_size: usize, seq_len: usize) -> Self
pub fn preset_10m(vocab_size: usize, seq_len: usize) -> Self
pub fn preset_50m(vocab_size: usize, seq_len: usize) -> Self
pub fn preset_100m(vocab_size: usize, seq_len: usize) -> Self
pub fn paper_10m(vocab_size: usize, seq_len: usize) -> Self
pub fn estimated_parameter_count(&self) -> usize
pub fn validate(&self) -> Result<()>
Trait Implementations§
Source§impl Clone for MultiscreenModelConfig
impl Clone for MultiscreenModelConfig
Source§fn clone(&self) -> MultiscreenModelConfig
fn clone(&self) -> MultiscreenModelConfig
Returns a duplicate of the value. Read more
1.0.0 (const: unstable) · Source§fn clone_from(&mut self, source: &Self)
fn clone_from(&mut self, source: &Self)
Performs copy-assignment from source. Read more
Source§impl Debug for MultiscreenModelConfig
impl Debug for MultiscreenModelConfig
Source§impl<'de> Deserialize<'de> for MultiscreenModelConfig
impl<'de> Deserialize<'de> for MultiscreenModelConfig
Source§fn deserialize<__D>(__deserializer: __D) -> Result<Self, __D::Error> where
__D: Deserializer<'de>,
fn deserialize<__D>(__deserializer: __D) -> Result<Self, __D::Error> where
__D: Deserializer<'de>,
Deserialize this value from the given Serde deserializer. Read more
Source§impl PartialEq for MultiscreenModelConfig
impl PartialEq for MultiscreenModelConfig
Source§fn eq(&self, other: &MultiscreenModelConfig) -> bool
fn eq(&self, other: &MultiscreenModelConfig) -> bool
Tests for self and other values to be equal, and is used by ==.
Source§impl Serialize for MultiscreenModelConfig
impl Serialize for MultiscreenModelConfig
impl StructuralPartialEq for MultiscreenModelConfig
Auto Trait Implementations§
impl Freeze for MultiscreenModelConfig
impl RefUnwindSafe for MultiscreenModelConfig
impl Send for MultiscreenModelConfig
impl Sync for MultiscreenModelConfig
impl Unpin for MultiscreenModelConfig
impl UnsafeUnpin for MultiscreenModelConfig
impl UnwindSafe for MultiscreenModelConfig
Blanket Implementations§
Source§impl<T> BorrowMut<T> for T where
T: ?Sized,
impl<T> BorrowMut<T> for T where
T: ?Sized,
Source§fn borrow_mut(&mut self) -> &mut T
fn borrow_mut(&mut self) -> &mut T
Mutably borrows from an owned value. Read more