Struct dfdx::nn::Transformer
pub struct Transformer<const MODEL_DIM: usize, const NUM_HEADS: usize, const NUM_ENCODER_LAYERS: usize, const NUM_DECODER_LAYERS: usize, const FF_DIM: usize> {
pub encoder: TransformerEncoder<MODEL_DIM, NUM_HEADS, FF_DIM, NUM_ENCODER_LAYERS>,
pub decoder: TransformerDecoder<MODEL_DIM, NUM_HEADS, FF_DIM, NUM_DECODER_LAYERS>,
}
Requires nightly. Transformer architecture as described in Attention Is All You Need.
This is comprised of a TransformerEncoder and a TransformerDecoder.
Generics:
- MODEL_DIM: Size of the input features to the encoder/decoder.
- NUM_HEADS: Number of heads for MultiHeadAttention.
- NUM_ENCODER_LAYERS: Number of TransformerEncoderBlocks to use.
- NUM_DECODER_LAYERS: Number of TransformerDecoderBlocks to use.
- FF_DIM: Feedforward hidden dimension for both encoder and decoder.
PyTorch equivalent:
torch.nn.Transformer(
    d_model=MODEL_DIM,
    nhead=NUM_HEADS,
    num_encoder_layers=NUM_ENCODER_LAYERS,
    num_decoder_layers=NUM_DECODER_LAYERS,
    dim_feedforward=FF_DIM,
    batch_first=True,
)
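To make the type-level wiring concrete, here is a minimal stand-alone sketch (plain Rust, no dfdx dependency; the struct and field names only mirror the definition above). It shows how the five const generics thread through the two halves: the encoder and decoder share MODEL_DIM, NUM_HEADS, and FF_DIM, but each takes its own layer count.

```rust
// Unit structs stand in for the real encoder/decoder stacks; unused
// const parameters are permitted on unit structs.
#[derive(Default, Debug)]
struct Encoder<const MODEL: usize, const HEADS: usize, const FF: usize, const LAYERS: usize>;

#[derive(Default, Debug)]
struct Decoder<const MODEL: usize, const HEADS: usize, const FF: usize, const LAYERS: usize>;

// Mirrors the field layout of dfdx::nn::Transformer: note the encoder
// gets NUM_ENCODER_LAYERS and the decoder gets NUM_DECODER_LAYERS,
// while the other three dimensions are shared.
#[derive(Default, Debug)]
struct Transformer<
    const MODEL_DIM: usize,
    const NUM_HEADS: usize,
    const NUM_ENCODER_LAYERS: usize,
    const NUM_DECODER_LAYERS: usize,
    const FF_DIM: usize,
> {
    encoder: Encoder<MODEL_DIM, NUM_HEADS, FF_DIM, NUM_ENCODER_LAYERS>,
    decoder: Decoder<MODEL_DIM, NUM_HEADS, FF_DIM, NUM_DECODER_LAYERS>,
}

fn main() {
    // Same dimensions as torch.nn.Transformer's defaults:
    // d_model=512, nhead=8, 6 encoder and 6 decoder layers, ff=2048.
    let t: Transformer<512, 8, 6, 6, 2048> = Default::default();
    println!("{:?}", t);
}
```

The real dfdx struct builds on this shape by deriving Clone, Debug, and Default the same way, so a fully-specified `Transformer<512, 8, 6, 6, 2048>` can be constructed with `Default::default()`.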
Fields
encoder: TransformerEncoder<MODEL_DIM, NUM_HEADS, FF_DIM, NUM_ENCODER_LAYERS>
decoder: TransformerDecoder<MODEL_DIM, NUM_HEADS, FF_DIM, NUM_DECODER_LAYERS>
Trait Implementations
impl<const M: usize, const H: usize, const E: usize, const D: usize, const F: usize> CanUpdateWithGradients for Transformer<M, H, E, D, F>
fn update<G: GradientProvider>(
    &mut self,
    grads: &mut G,
    unused: &mut UnusedTensors
)
Updates self given the GradientProvider. For any parameters that are NOT present in G, this function should add the tensor’s UniqueId to UnusedTensors. Read more

impl<const MODEL_DIM: usize, const NUM_HEADS: usize, const NUM_ENCODER_LAYERS: usize, const NUM_DECODER_LAYERS: usize, const FF_DIM: usize> Clone for Transformer<MODEL_DIM, NUM_HEADS, NUM_ENCODER_LAYERS, NUM_DECODER_LAYERS, FF_DIM>
fn clone(
    &self
) -> Transformer<MODEL_DIM, NUM_HEADS, NUM_ENCODER_LAYERS, NUM_DECODER_LAYERS, FF_DIM>
Returns a copy of the value. Read more
fn clone_from(&mut self, source: &Self)
Performs copy-assignment from source. Read more

impl<const MODEL_DIM: usize, const NUM_HEADS: usize, const NUM_ENCODER_LAYERS: usize, const NUM_DECODER_LAYERS: usize, const FF_DIM: usize> Debug for Transformer<MODEL_DIM, NUM_HEADS, NUM_ENCODER_LAYERS, NUM_DECODER_LAYERS, FF_DIM>
impl<const MODEL_DIM: usize, const NUM_HEADS: usize, const NUM_ENCODER_LAYERS: usize, const NUM_DECODER_LAYERS: usize, const FF_DIM: usize> Default for Transformer<MODEL_DIM, NUM_HEADS, NUM_ENCODER_LAYERS, NUM_DECODER_LAYERS, FF_DIM>
fn default() -> Transformer<MODEL_DIM, NUM_HEADS, NUM_ENCODER_LAYERS, NUM_DECODER_LAYERS, FF_DIM>
Returns the “default value” for a type. Read more
impl<const M: usize, const H: usize, const E: usize, const D: usize, const F: usize> LoadFromNpz for Transformer<M, H, E, D, F>
impl<const M: usize, const H: usize, const E: usize, const D: usize, const F: usize, Src, Tgt> Module<(Src, Tgt)> for Transformer<M, H, E, D, F> where
    Src: Tensor<Dtype = f32>,
    Tgt: Tensor<Dtype = f32> + PutTape<Src::Tape>,
    TransformerEncoder<M, H, F, E>: Module<Src, Output = Src>,
    TransformerDecoder<M, H, F, D>: Module<(<Tgt as PutTape<Src::Tape>>::Output, Src::NoTape), Output = <Tgt as PutTape<Src::Tape>>::Output>,
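The where-clauses above encode a two-stage data flow: the encoder maps the source sequence to an output of the same shape (the "memory"), and the decoder consumes the target paired with that memory. A simplified stand-alone sketch of that flow (plain Rust; these are not the dfdx traits, and Vec<f32> stands in for dfdx Tensors with tapes):

```rust
// Simplified version of dfdx's Module trait: a pure forward pass.
trait Module<Input> {
    type Output;
    fn forward(&self, input: Input) -> Self::Output;
}

struct Encoder;
struct Decoder;

impl Module<Vec<f32>> for Encoder {
    type Output = Vec<f32>;
    fn forward(&self, src: Vec<f32>) -> Vec<f32> {
        src // identity stand-in for self-attention + feedforward layers
    }
}

// The decoder's input pairs the target sequence with the encoder memory,
// mirroring the (PutTape output, Src::NoTape) tuple in the real bound.
impl Module<(Vec<f32>, Vec<f32>)> for Decoder {
    type Output = Vec<f32>;
    fn forward(&self, (tgt, _memory): (Vec<f32>, Vec<f32>)) -> Vec<f32> {
        tgt // identity stand-in for masked self-attention + cross-attention
    }
}

struct Transformer {
    encoder: Encoder,
    decoder: Decoder,
}

// Mirrors Module<(Src, Tgt)> above: encode src, then decode (tgt, memory).
impl Module<(Vec<f32>, Vec<f32>)> for Transformer {
    type Output = Vec<f32>;
    fn forward(&self, (src, tgt): (Vec<f32>, Vec<f32>)) -> Vec<f32> {
        let memory = self.encoder.forward(src);
        self.decoder.forward((tgt, memory))
    }
}

fn main() {
    let model = Transformer { encoder: Encoder, decoder: Decoder };
    let out = model.forward((vec![0.1, 0.2], vec![0.3]));
    println!("{:?}", out);
}
```

In the real impl the tape-movement machinery (PutTape, NoTape) additionally threads the gradient tape from the source input through to the decoder output; the sketch omits that entirely.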
impl<const M: usize, const H: usize, const E: usize, const D: usize, const F: usize, T> ModuleMut<T> for Transformer<M, H, E, D, F> where
    Self: Module<T>,
type Output = <Transformer<M, H, E, D, F> as Module<T>>::Output
The type that this unit produces given Input.

fn forward_mut(&mut self, t: T) -> Self::Output
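This ModuleMut impl simply delegates to the immutable Module impl whenever one exists, which is why its Output is defined as the Module Output. A stand-alone sketch of the delegation pattern (plain Rust, not the dfdx traits):

```rust
// Simplified stand-ins for dfdx's Module / ModuleMut pair.
trait Module<T> {
    type Output;
    fn forward(&self, t: T) -> Self::Output;
}

trait ModuleMut<T> {
    type Output;
    fn forward_mut(&mut self, t: T) -> Self::Output;
}

struct Net;

impl Module<f32> for Net {
    type Output = f32;
    fn forward(&self, t: f32) -> f32 {
        t * 2.0
    }
}

// Mirrors `impl ModuleMut<T> for Transformer where Self: Module<T>`:
// forward_mut just reuses forward, since the forward pass here needs
// no mutable state.
impl<T, M: Module<T>> ModuleMut<T> for M {
    type Output = M::Output;
    fn forward_mut(&mut self, t: T) -> Self::Output {
        self.forward(t)
    }
}

fn main() {
    let mut net = Net;
    println!("{}", net.forward_mut(3.0));
}
```

Layers that do behave differently in training (e.g. dropout) implement ModuleMut directly instead of delegating like this.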
impl<const M: usize, const H: usize, const E: usize, const D: usize, const F: usize> ResetParams for Transformer<M, H, E, D, F>
Auto Trait Implementations
impl<const MODEL_DIM: usize, const NUM_HEADS: usize, const NUM_ENCODER_LAYERS: usize, const NUM_DECODER_LAYERS: usize, const FF_DIM: usize> RefUnwindSafe for Transformer<MODEL_DIM, NUM_HEADS, NUM_ENCODER_LAYERS, NUM_DECODER_LAYERS, FF_DIM>
impl<const MODEL_DIM: usize, const NUM_HEADS: usize, const NUM_ENCODER_LAYERS: usize, const NUM_DECODER_LAYERS: usize, const FF_DIM: usize> Send for Transformer<MODEL_DIM, NUM_HEADS, NUM_ENCODER_LAYERS, NUM_DECODER_LAYERS, FF_DIM>
impl<const MODEL_DIM: usize, const NUM_HEADS: usize, const NUM_ENCODER_LAYERS: usize, const NUM_DECODER_LAYERS: usize, const FF_DIM: usize> Sync for Transformer<MODEL_DIM, NUM_HEADS, NUM_ENCODER_LAYERS, NUM_DECODER_LAYERS, FF_DIM>
impl<const MODEL_DIM: usize, const NUM_HEADS: usize, const NUM_ENCODER_LAYERS: usize, const NUM_DECODER_LAYERS: usize, const FF_DIM: usize> Unpin for Transformer<MODEL_DIM, NUM_HEADS, NUM_ENCODER_LAYERS, NUM_DECODER_LAYERS, FF_DIM>
impl<const MODEL_DIM: usize, const NUM_HEADS: usize, const NUM_ENCODER_LAYERS: usize, const NUM_DECODER_LAYERS: usize, const FF_DIM: usize> UnwindSafe for Transformer<MODEL_DIM, NUM_HEADS, NUM_ENCODER_LAYERS, NUM_DECODER_LAYERS, FF_DIM>
Blanket Implementations
impl<T> BorrowMut<T> for T where
    T: ?Sized,
fn borrow_mut(&mut self) -> &mut T
Mutably borrows from an owned value. Read more