pub struct TransformerEncoderLayer {
    pub self_attn: MultiheadAttention,
    pub linear1: Linear,
    pub dropout: f32,
    pub linear2: Linear,
    pub norm1: LayerNorm,
    pub norm2: LayerNorm,
    pub activation: fn(Tensor) -> Tensor,
    pub norm_first: bool,
    pub batch_first: bool,
}
A single Transformer Encoder layer, analogous to torch.nn.TransformerEncoderLayer.
This layer implements a standard Transformer encoder block with a multi-head self-attention mechanism followed by a position-wise feedforward network. Layer normalization can be applied either before (“pre-norm”) or after (“post-norm”) the attention and feedforward sub-layers.
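The difference between the two orderings can be sketched with scalar stand-ins. The functions below are toy placeholders, not the layer's actual attention or normalization; they only illustrate where the residual connection and the norm sit relative to each sub-layer in the two modes.

```rust
// Placeholders standing in for LayerNorm and for a sub-layer
// (self-attention or feedforward). Illustrative only.
fn norm(x: f32) -> f32 {
    x / 2.0
}
fn sublayer(x: f32) -> f32 {
    x + 1.0
}

/// Post-norm (norm_first = false): x -> norm(x + sublayer(x))
fn post_norm_step(x: f32) -> f32 {
    norm(x + sublayer(x))
}

/// Pre-norm (norm_first = true): x -> x + sublayer(norm(x))
fn pre_norm_step(x: f32) -> f32 {
    x + sublayer(norm(x))
}

fn main() {
    // Same input, different ordering of the residual and the norm.
    println!("{}", post_norm_step(2.0)); // norm(2 + 3) = 2.5
    println!("{}", pre_norm_step(2.0));  // 2 + sublayer(1) = 4
}
```

Note that in pre-norm mode the residual path bypasses the normalization entirely, which is why pre-norm stacks are often easier to train deep.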
Fields
self_attn: MultiheadAttention - The multi-head self-attention module.
linear1: Linear - The first linear layer of the feedforward network (expansion).
dropout: f32 - Dropout probability applied after the attention and feedforward layers.
linear2: Linear - The second linear layer of the feedforward network (projection back to d_model).
norm1: LayerNorm - LayerNorm applied after the self-attention block (or before, if norm_first is true).
norm2: LayerNorm - LayerNorm applied after the feedforward block (or before, if norm_first is true).
activation: fn(Tensor) -> Tensor - The activation function used in the feedforward network (e.g., ReLU, GELU).
norm_first: bool - If true, applies layer normalization before each sub-layer (pre-norm).
batch_first: bool - If true, expects input tensors of shape (batch_size, seq_len, d_model).
Implementations
impl TransformerEncoderLayer
pub fn new(
    d_model: u64,
    nhead: u64,
    dim_feedforward: u64,
    dropout: f32,
    activation: fn(Tensor) -> Tensor,
    layer_norm_eps: f64,
    batch_first: bool,
    norm_first: bool,
    bias: bool,
    dtype: DType,
) -> Result<Self, ZyxError>
Constructs a new TransformerEncoderLayer.
Arguments
d_model - The number of expected features in the input (embedding size).
nhead - The number of attention heads.
dim_feedforward - The dimension of the feedforward network.
dropout - Dropout probability applied after the attention and feedforward layers.
activation - Activation function used in the feedforward network.
layer_norm_eps - Epsilon value for numerical stability in layer normalization.
batch_first - If true, input/output tensors are expected in (batch, seq, feature) format.
norm_first - If true, applies layer normalization before sub-layers (pre-norm).
bias - If true, linear layers include bias terms.
dtype - The data type of the layer’s parameters and outputs.
Returns
A Result containing the initialized TransformerEncoderLayer or a ZyxError.
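To get a feel for how the arguments size the layer, the sketch below counts learnable parameters under the conventional transformer layout (fused Q/K/V in-projection plus output projection for attention, two FFN linears, two LayerNorms with scale and shift). This is an assumption about the internal layout, not something this page specifies; the exact count for this crate may differ.

```rust
/// Parameter count for one encoder layer under the conventional layout.
/// `nhead` only partitions the projections and does not change the count,
/// so it is omitted here.
fn encoder_layer_params(d_model: u64, dim_feedforward: u64, bias: bool) -> u64 {
    let b = if bias { 1 } else { 0 };
    // self_attn: Q, K, V projections plus output projection.
    let attn = 3 * d_model * d_model + 3 * b * d_model
        + d_model * d_model + b * d_model;
    // linear1 expands d_model -> dim_feedforward; linear2 projects back.
    let ffn = d_model * dim_feedforward + b * dim_feedforward
        + dim_feedforward * d_model + b * d_model;
    // norm1 and norm2: gamma and beta each, of length d_model.
    let norms = 2 * 2 * d_model;
    attn + ffn + norms
}

fn main() {
    // The classic "base" configuration: d_model = 512, dim_feedforward = 2048.
    let total = encoder_layer_params(512, 2048, true);
    println!("{total}"); // 3152384
}
```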
pub fn forward(
    &self,
    src: impl Into<Tensor>,
    src_mask: Option<Tensor>,
    src_key_padding_mask: Option<Tensor>,
) -> Result<Tensor, ZyxError>
Performs a forward pass of the Transformer encoder layer.
Arguments
src - Input tensor of shape (seq_len, batch_size, d_model), or (batch_size, seq_len, d_model) if batch_first is true.
src_mask - Optional attention mask tensor to prevent attention to certain positions.
src_key_padding_mask - Optional mask tensor for padding positions in the input.
Returns
A Result containing the output tensor after applying self-attention and feedforward blocks.
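A common use of src_mask is a causal (look-ahead) mask. The sketch below builds one as a plain boolean matrix, assuming the widespread convention that a masked-out entry marks a position that must not be attended to; this page does not state which convention (boolean vs. additive -inf) this crate's forward expects, so check before relying on it.

```rust
/// Build a causal attention mask for `seq_len` positions.
/// Convention assumed here: `true` marks a key position that the
/// query at that row must NOT attend to.
fn causal_mask(seq_len: usize) -> Vec<Vec<bool>> {
    (0..seq_len)
        .map(|q| (0..seq_len).map(|k| k > q).collect()) // block keys after the query
        .collect()
}

fn main() {
    let mask = causal_mask(3);
    for row in &mask {
        println!("{row:?}");
    }
    // Row 0 may only attend to position 0; row 2 sees all positions up to itself.
}
```

src_key_padding_mask serves a different purpose: rather than restricting positions per query, it excludes entire padded key positions for every query in a batch element.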
Trait Implementations
impl Debug for TransformerEncoderLayer
impl<'a> IntoIterator for &'a TransformerEncoderLayer
impl<'a> IntoIterator for &'a mut TransformerEncoderLayer
impl Module for TransformerEncoderLayer
fn iter_mut<'a>(&'a mut self) -> impl Iterator<Item = &'a mut Tensor>
Iterate over all tensors mutably.
fn iter_tensors<'a>(&'a self) -> impl Iterator<Item = (String, &'a Tensor)>
Iterate over tensors without consuming the module.
fn iter_tensors_mut<'a>(
    &'a mut self,
) -> impl Iterator<Item = (String, &'a mut Tensor)>
Iterate over named tensors mutably.
Auto Trait Implementations
impl Freeze for TransformerEncoderLayer
impl RefUnwindSafe for TransformerEncoderLayer
impl Send for TransformerEncoderLayer
impl Sync for TransformerEncoderLayer
impl Unpin for TransformerEncoderLayer
impl UnsafeUnpin for TransformerEncoderLayer
impl UnwindSafe for TransformerEncoderLayer
Blanket Implementations
impl<T> BorrowMut<T> for T
where
    T: ?Sized,

fn borrow_mut(&mut self) -> &mut T
Mutably borrows from an owned value.