pub struct RotaryEncoding<B>where
B: Backend,{
pub freq_complex: Tensor<B, 3>,
pub max_sequence_length: usize,
pub theta: f32,
}
Expand description
A module that applies rotary positional encoding to a tensor. Rotary Position Encoding or Embedding (RoPE) is a type of position embedding that encodes absolute positional information with a rotation matrix and naturally incorporates explicit relative position dependency in the self-attention formulation.
Introduced in the paper: RoFormer: Enhanced Transformer with Rotary Position Embedding
Should be created using RotaryEncodingConfig.
Fields§
§freq_complex: Tensor<B, 3>
Frequency Tensor of shape (max_sequence_length, d_model, 2) with real and imaginary components
max_sequence_length: usize
Maximum sequence length of input
theta: f32
Scaling factor for frequency computation.
Implementations§
Source§impl<B> RotaryEncoding<B>where
B: Backend,
impl<B> RotaryEncoding<B>where
B: Backend,
Sourcepub fn forward<const D: usize>(&self, x: Tensor<B, D>) -> Tensor<B, D>
pub fn forward<const D: usize>(&self, x: Tensor<B, D>) -> Tensor<B, D>
Applies rotary positional encoding to a tensor of dimensions (…, seq_len, d_model)
Arguments:
- x: Input tensor of shape (…, seq_len, d_model). Accommodates both 3D and 4D tensors, for (batch size, seq_len, hidden_dim) or (batch size, num_heads, seq_len, hidden_dim) respectively.
Returns:
- Output tensor with the same shape as input tensor after applying rotary encoding.
Panics if the input tensor does not have at least 2 dimensions for sequence length and hidden dimension.
Sourcepub fn apply<const D: usize>(
&self,
x: Tensor<B, D>,
start: usize,
) -> Tensor<B, D>
pub fn apply<const D: usize>( &self, x: Tensor<B, D>, start: usize, ) -> Tensor<B, D>
Applies rotary positional encoding to a tensor of dimensions (…, seq_len, d_model)
Arguments:
- x: Input tensor of shape (…, seq_len, d_model). Accommodates both 3D and 4D tensors, for (batch size, seq_len, hidden_dim) or (batch size, num_heads, seq_len, hidden_dim) respectively.
- start: Sequence start position index.
Returns:
- Output tensor with the same shape as input tensor after applying rotary encoding.
Panics if the input tensor does not have at least 2 dimensions for sequence length and hidden dimension.
Trait Implementations§
Source§impl<B> AutodiffModule<B> for RotaryEncoding<B>
impl<B> AutodiffModule<B> for RotaryEncoding<B>
Source§type InnerModule = RotaryEncoding<<B as AutodiffBackend>::InnerBackend>
type InnerModule = RotaryEncoding<<B as AutodiffBackend>::InnerBackend>
Source§fn valid(&self) -> <RotaryEncoding<B> as AutodiffModule<B>>::InnerModule
fn valid(&self) -> <RotaryEncoding<B> as AutodiffModule<B>>::InnerModule
Source§impl<B> Clone for RotaryEncoding<B>where
B: Backend,
impl<B> Clone for RotaryEncoding<B>where
B: Backend,
Source§fn clone(&self) -> RotaryEncoding<B>
fn clone(&self) -> RotaryEncoding<B>
1.0.0 · Source§fn clone_from(&mut self, source: &Self)
fn clone_from(&mut self, source: &Self)
Performs copy-assignment from source. Read more
Source§impl<B> Debug for RotaryEncoding<B>
impl<B> Debug for RotaryEncoding<B>
Source§impl<B> Display for RotaryEncoding<B>where
B: Backend,
impl<B> Display for RotaryEncoding<B>where
B: Backend,
Source§impl<B> Module<B> for RotaryEncoding<B>where
B: Backend,
impl<B> Module<B> for RotaryEncoding<B>where
B: Backend,
Source§type Record = RotaryEncodingRecord<B>
type Record = RotaryEncodingRecord<B>
Source§fn load_record(
self,
record: <RotaryEncoding<B> as Module<B>>::Record,
) -> RotaryEncoding<B>
fn load_record( self, record: <RotaryEncoding<B> as Module<B>>::Record, ) -> RotaryEncoding<B>
Source§fn into_record(self) -> <RotaryEncoding<B> as Module<B>>::Record
fn into_record(self) -> <RotaryEncoding<B> as Module<B>>::Record
Source§fn num_params(&self) -> usize
fn num_params(&self) -> usize
Source§fn visit<Visitor>(&self, visitor: &mut Visitor)where
Visitor: ModuleVisitor<B>,
fn visit<Visitor>(&self, visitor: &mut Visitor)where
Visitor: ModuleVisitor<B>,
Source§fn map<Mapper>(self, mapper: &mut Mapper) -> RotaryEncoding<B>where
Mapper: ModuleMapper<B>,
fn map<Mapper>(self, mapper: &mut Mapper) -> RotaryEncoding<B>where
Mapper: ModuleMapper<B>,
Source§fn collect_devices(
&self,
devices: Vec<<B as Backend>::Device>,
) -> Vec<<B as Backend>::Device>
fn collect_devices( &self, devices: Vec<<B as Backend>::Device>, ) -> Vec<<B as Backend>::Device>
Source§fn to_device(self, device: &<B as Backend>::Device) -> RotaryEncoding<B>
fn to_device(self, device: &<B as Backend>::Device) -> RotaryEncoding<B>
Source§fn fork(self, device: &<B as Backend>::Device) -> RotaryEncoding<B>
fn fork(self, device: &<B as Backend>::Device) -> RotaryEncoding<B>
Source§fn devices(&self) -> Vec<<B as Backend>::Device>
fn devices(&self) -> Vec<<B as Backend>::Device>
Source§fn save_file<FR, PB>(
self,
file_path: PB,
recorder: &FR,
) -> Result<(), RecorderError>
fn save_file<FR, PB>( self, file_path: PB, recorder: &FR, ) -> Result<(), RecorderError>
Source§fn load_file<FR, PB>(
self,
file_path: PB,
recorder: &FR,
device: &<B as Backend>::Device,
) -> Result<Self, RecorderError>
fn load_file<FR, PB>( self, file_path: PB, recorder: &FR, device: &<B as Backend>::Device, ) -> Result<Self, RecorderError>
Source§fn quantize_weights(self, quantizer: &mut Quantizer) -> Self
fn quantize_weights(self, quantizer: &mut Quantizer) -> Self
Source§impl<B> ModuleDisplay for RotaryEncoding<B>where
B: Backend,
impl<B> ModuleDisplay for RotaryEncoding<B>where
B: Backend,
Source§fn custom_settings(&self) -> Option<DisplaySettings>
fn custom_settings(&self) -> Option<DisplaySettings>
Auto Trait Implementations§
impl<B> Freeze for RotaryEncoding<B>where
<B as Backend>::FloatTensorPrimitive: Freeze,
<B as Backend>::QuantizedTensorPrimitive: Freeze,
impl<B> RefUnwindSafe for RotaryEncoding<B>where
<B as Backend>::FloatTensorPrimitive: RefUnwindSafe,
<B as Backend>::QuantizedTensorPrimitive: RefUnwindSafe,
impl<B> Send for RotaryEncoding<B>
impl<B> Sync for RotaryEncoding<B>
impl<B> Unpin for RotaryEncoding<B>
impl<B> UnwindSafe for RotaryEncoding<B>where
<B as Backend>::FloatTensorPrimitive: UnwindSafe,
<B as Backend>::QuantizedTensorPrimitive: UnwindSafe,
Blanket Implementations§
Source§impl<T> BorrowMut<T> for Twhere
T: ?Sized,
impl<T> BorrowMut<T> for Twhere
T: ?Sized,
Source§fn borrow_mut(&mut self) -> &mut T
fn borrow_mut(&mut self) -> &mut T
Source§impl<T> CloneToUninit for Twhere
T: Clone,
impl<T> CloneToUninit for Twhere
T: Clone,
Source§impl<T> IntoEither for T
impl<T> IntoEither for T
Source§fn into_either(self, into_left: bool) -> Either<Self, Self>
fn into_either(self, into_left: bool) -> Either<Self, Self>
Converts self into a Left variant of Either<Self, Self> if into_left is true. Converts self into a Right variant of Either<Self, Self> otherwise. Read more
Source§fn into_either_with<F>(self, into_left: F) -> Either<Self, Self>
fn into_either_with<F>(self, into_left: F) -> Either<Self, Self>
Converts self into a Left variant of Either<Self, Self> if into_left(&self) returns true. Converts self into a Right variant of Either<Self, Self> otherwise. Read more