Struct rust_bert::t5::T5Model[−][src]

pub struct T5Model { /* fields omitted */ }

Expand description

T5 Base model

Base architecture for T5 model. Usually complemented with a task-specific head, such as a language model head. It is made of the following blocks:

encoder: T5Stack (transformer) made of a vector of encoding layers
decoder: T5Stack (transformer) made of a vector of decoding layers with self-attention and encoder cross-attention. Caching is implemented for the decoder to avoid recalculating static states (encoder key/values and previously calculated decoder key/values)
embeddings: nn::Embedding Shared embeddings for the encoder and decoder.

Implementations

`impl T5Model`[src]

`pub fn new<'p, P>( p: P, config: &T5Config, output_attentions: bool, output_hidden_states: bool ) -> T5Model where P: Borrow<Path<'p>>,` [src]

Build a new T5Model

Arguments

p - Variable store path for the root of the T5 model
config - T5Config object defining the model architecture
output_attentions - flag indicating if the model should output the attention weights of intermediate layers
output_hidden_states - flag indicating if the model should output the hidden states of intermediate layers

Example

use rust_bert::t5::{T5Config, T5Model};
use rust_bert::Config;
use std::path::Path;
use tch::{nn, Device};

let config_path = Path::new("path/to/config.json");
let device = Device::Cpu;
let p = nn::VarStore::new(device);
let config = T5Config::from_file(config_path);
let output_attentions = true;
let output_hidden_states = true;
let t5: T5Model = T5Model::new(
    &p.root() / "t5",
    &config,
    output_attentions,
    output_hidden_states,
);

`pub fn forward_t( &self, input_ids: Option<&Tensor>, attention_mask: Option<&Tensor>, encoder_outputs: Option<&Tensor>, decoder_input_ids: Option<&Tensor>, decoder_attention_mask: Option<&Tensor>, input_embeds: Option<Tensor>, decoder_input_embeds: Option<Tensor>, old_layer_states: Option<Vec<(Option<LayerState>, Option<LayerState>)>>, train: bool ) -> T5ModelOutput`[src]

Forward pass through the model

Arguments

input_ids - Optional input tensor of shape (batch size, source_sequence_length). This or input_embeds must be provided.
attention_mask - Optional attention mask of shape (batch size, source_sequence_length) for the encoder positions. Positions with a mask with value 0 will be masked.
decoder_input_ids - Optional input tensor of shape (batch size, target_sequence_length). This or decoder_input_embeds must be provided.
encoder_outputs - Optional tuple made of a tensor of shape (batch size, source_sequence_length, encoder_hidden_dim) and optional vectors of tensors of length num_encoder_layers with shape (batch size, source_sequence_length, hidden_size). These correspond to the encoder last hidden state and optional hidden states/attention weights for encoder layers. When provided, the encoder hidden state will not be recalculated. Useful for generation tasks.
decoder_attention_mask - Optional attention mask of shape (batch size, target_sequence_length) for the decoder positions. Positions with a mask with value 0 will be masked.
input_embeds - Optional input tensor of shape (batch size, source_sequence_length, embeddings dimension). This or input_ids must be provided.
decoder_input_embeds - Optional input tensor of shape (batch size, target_sequence_length, embeddings dimension). This or decoder_input_ids must be provided.
old_layer_states - Optional vector of length num_layers containing tuples of optional LayerStates containing the last calculated key and value pairs for the decoder. This avoids recomputing attention weights at past positions and speeds up decoding.
train - boolean flag to turn on/off the dropout layers in the model. Should be set to false for inference.

Returns

T5ModelOutput containing:
- decoder_output - Tensor of shape (batch size, target_sequence_length, hidden_size) representing the activations of the last decoder hidden state
- encoder_hidden_states - Tensor of shape (batch size, source_sequence_length, hidden_size) representing the activations of the last encoder hidden state
- cache - Option<Vec<(Option<LayerState>, Option<LayerState>)>> of length n_layer containing the encoder padding mask and past keys and values for both the self attention and the encoder cross attention of each layer of the decoder.
- all_encoder_hidden_states - Option<Vec<Tensor>> of length num_encoder_layers with shape (batch size, source_sequence_length, hidden_size)
- all_encoder_attentions - Option<Vec<Tensor>> of length num_encoder_layers with shape (batch size, source_sequence_length, hidden_size)
- all_decoder_hidden_states - Option<Vec<Tensor>> of length num_decoder_layers with shape (batch size, target_sequence_length, hidden_size)
- all_decoder_attentions - Option<Vec<Tensor>> of length num_decoder_layers with shape (batch size, target_sequence_length, hidden_size)

Example

use rust_bert::t5::{T5Config, T5Model};
let (batch_size, source_sequence_length, target_sequence_length) = (64, 128, 56);
let input_tensor = Tensor::rand(&[batch_size, source_sequence_length], (Int64, device));
let target_tensor = Tensor::rand(&[batch_size, target_sequence_length], (Int64, device));
let encoder_attention_mask =
    Tensor::ones(&[batch_size, source_sequence_length], (Int64, device));
let decoder_attention_mask =
    Tensor::ones(&[batch_size, target_sequence_length], (Int64, device));

let model_output = no_grad(|| {
    t5_model.forward_t(
        Some(&input_tensor),
        Some(&encoder_attention_mask),
        None,
        Some(&target_tensor),
        Some(&decoder_attention_mask),
        None,
        None,
        None,
        false,
    )
});

Auto Trait Implementations

`impl RefUnwindSafe for T5Model`

`impl Send for T5Model`

`impl !Sync for T5Model`

`impl Unpin for T5Model`

`impl UnwindSafe for T5Model`

Blanket Implementations

`impl<T> Any for T where T: 'static + ?Sized,` [src]

`pub fn type_id(&self) -> TypeId`[src]

Gets the TypeId of self. Read more

`impl<T> Borrow<T> for T where T: ?Sized,` [src]

`pub fn borrow(&self) -> &T`[src]

Immutably borrows from an owned value. Read more

`impl<T> BorrowMut<T> for T where T: ?Sized,` [src]

`pub fn borrow_mut(&mut self) -> &mut T`[src]

Mutably borrows from an owned value. Read more

`impl<T> From<T> for T`[src]

`pub fn from(t: T) -> T`[src]

Performs the conversion.

`impl<T> Instrument for T`[src]

`fn instrument(self, span: Span) -> Instrumented<Self>`[src]

Instruments this type with the provided Span, returning an Instrumented wrapper. Read more

`fn in_current_span(self) -> Instrumented<Self>`[src]

Instruments this type with the current Span, returning an Instrumented wrapper. Read more

`impl<T, U> Into<U> for T where U: From<T>,` [src]

`pub fn into(self) -> U`[src]

Performs the conversion.

`impl<T> Pointable for T`

`pub const ALIGN: usize`

The alignment of pointer.

`type Init = T`

The type for initializers.

`pub unsafe fn init(init: <T as Pointable>::Init) -> usize`

Initializes an object with the given initializer. Read more

`pub unsafe fn deref<'a>(ptr: usize) -> &'a T`

Dereferences the given pointer. Read more

`pub unsafe fn deref_mut<'a>(ptr: usize) -> &'a mut T`

Mutably dereferences the given pointer. Read more

`pub unsafe fn drop(ptr: usize)`

Drops the object pointed to by the given pointer. Read more

`impl<T> Same<T> for T`

`type Output = T`

Should always be Self

`impl<T, U> TryFrom<U> for T where U: Into<T>,` [src]

`type Error = Infallible`

The type returned in the event of a conversion error.

`pub fn try_from(value: U) -> Result<T, <T as TryFrom<U>>::Error>`[src]

Performs the conversion.

`impl<T, U> TryInto<U> for T where U: TryFrom<T>,` [src]

`type Error = <U as TryFrom<T>>::Error`

The type returned in the event of a conversion error.

`pub fn try_into(self) -> Result<U, <U as TryFrom<T>>::Error>`[src]

Performs the conversion.

Struct rust_bert::t5::T5Model[−][src]

T5 Base model

Implementations

impl T5Model[src]

pub fn new<'p, P>( p: P, config: &T5Config, output_attentions: bool, output_hidden_states: bool) -> T5Model where P: Borrow<Path<'p>>, [src]

Arguments

Example

Arguments

Returns

Example

Auto Trait Implementations

impl RefUnwindSafe for T5Model

impl Send for T5Model

impl !Sync for T5Model

impl Unpin for T5Model

impl UnwindSafe for T5Model

Blanket Implementations

impl<T> Any for T where T: 'static + ?Sized, [src]

pub fn type_id(&self) -> TypeId[src]

impl<T> Borrow<T> for T where T: ?Sized, [src]

pub fn borrow(&self) -> &T[src]

impl<T> BorrowMut<T> for T where T: ?Sized, [src]

pub fn borrow_mut(&mut self) -> &mut T[src]

impl<T> From<T> for T[src]

pub fn from(t: T) -> T[src]

impl<T> Instrument for T[src]

fn instrument(self, span: Span) -> Instrumented<Self>[src]

fn in_current_span(self) -> Instrumented<Self>[src]

impl<T, U> Into<U> for T where U: From<T>, [src]

pub fn into(self) -> U[src]

impl<T> Pointable for T

pub const ALIGN: usize

type Init = T

pub unsafe fn init(init: <T as Pointable>::Init) -> usize

pub unsafe fn deref<'a>(ptr: usize) -> &'a T

pub unsafe fn deref_mut<'a>(ptr: usize) -> &'a mut T

pub unsafe fn drop(ptr: usize)

impl<T> Same<T> for T

type Output = T

impl<T, U> TryFrom<U> for T where U: Into<T>, [src]

type Error = Infallible

pub fn try_from(value: U) -> Result<T, <T as TryFrom<U>>::Error>[src]

impl<T, U> TryInto<U> for T where U: TryFrom<T>, [src]

type Error = <U as TryFrom<T>>::Error

pub fn try_into(self) -> Result<U, <U as TryFrom<T>>::Error>[src]

impl<V, T> VZip<V> for T where V: MultiLane<T>,

pub fn vzip(self) -> V

`impl T5Model`[src]

`pub fn new<'p, P>( p: P, config: &T5Config, output_attentions: bool, output_hidden_states: bool ) -> T5Model where P: Borrow<Path<'p>>,` [src]

`impl RefUnwindSafe for T5Model`

`impl Send for T5Model`

`impl !Sync for T5Model`

`impl Unpin for T5Model`

`impl UnwindSafe for T5Model`

`impl<T> Any for T where T: 'static + ?Sized,` [src]

`pub fn type_id(&self) -> TypeId`[src]

`impl<T> Borrow<T> for T where T: ?Sized,` [src]

`pub fn borrow(&self) -> &T`[src]

`impl<T> BorrowMut<T> for T where T: ?Sized,` [src]

`pub fn borrow_mut(&mut self) -> &mut T`[src]

`impl<T> From<T> for T`[src]

`pub fn from(t: T) -> T`[src]

`impl<T> Instrument for T`[src]

`fn instrument(self, span: Span) -> Instrumented<Self>`[src]

`fn in_current_span(self) -> Instrumented<Self>`[src]

`impl<T, U> Into<U> for T where U: From<T>,` [src]

`pub fn into(self) -> U`[src]

`impl<T> Pointable for T`

`pub const ALIGN: usize`

`type Init = T`

`pub unsafe fn init(init: <T as Pointable>::Init) -> usize`

`pub unsafe fn deref<'a>(ptr: usize) -> &'a T`

`pub unsafe fn deref_mut<'a>(ptr: usize) -> &'a mut T`

`pub unsafe fn drop(ptr: usize)`

`impl<T> Same<T> for T`

`type Output = T`

`impl<T, U> TryFrom<U> for T where U: Into<T>,` [src]

`type Error = Infallible`

`pub fn try_from(value: U) -> Result<T, <T as TryFrom<U>>::Error>`[src]

`impl<T, U> TryInto<U> for T where U: TryFrom<T>,` [src]

`type Error = <U as TryFrom<T>>::Error`

`pub fn try_into(self) -> Result<U, <U as TryFrom<T>>::Error>`[src]

`impl<V, T> VZip<V> for T where V: MultiLane<T>,`

`pub fn vzip(self) -> V`