pub struct AttentionParams {
pub num_heads: usize,
pub num_kv_heads: usize,
pub head_dim: usize,
pub softmax_scale: f32,
pub causal: bool,
}
Expand description
Parameters describing a single attention call.
Fields§
§num_heads: usize
§num_kv_heads: usize
§head_dim: usize
§softmax_scale: f32
Softmax scale (typically 1 / sqrt(head_dim)).
§causal: bool
Whether to apply a causal mask.
Trait Implementations§
Source§impl Clone for AttentionParams
impl Clone for AttentionParams
Source§fn clone(&self) -> AttentionParams
fn clone(&self) -> AttentionParams
Returns a duplicate of the value. Read more
1.0.0 · Source§fn clone_from(&mut self, source: &Self)
fn clone_from(&mut self, source: &Self)
Performs copy-assignment from source. Read more
Auto Trait Implementations§
impl Freeze for AttentionParams
impl RefUnwindSafe for AttentionParams
impl Send for AttentionParams
impl Sync for AttentionParams
impl Unpin for AttentionParams
impl UnsafeUnpin for AttentionParams
impl UnwindSafe for AttentionParams
Blanket Implementations§
Source§impl<T> BorrowMut<T> for T
where
T: ?Sized,
impl<T> BorrowMut<T> for T
where
T: ?Sized,
Source§fn borrow_mut(&mut self) -> &mut T
fn borrow_mut(&mut self) -> &mut T
Mutably borrows from an owned value. Read more