Struct TextGenerationConfig

Source

pub struct TextGenerationConfig {Show 21 fields
    pub model_type: ModelType,
    pub model_resource: ModelResource,
    pub config_resource: Box<dyn ResourceProvider + Send>,
    pub vocab_resource: Box<dyn ResourceProvider + Send>,
    pub merges_resource: Option<Box<dyn ResourceProvider + Send>>,
    pub min_length: i64,
    pub max_length: Option<i64>,
    pub do_sample: bool,
    pub early_stopping: bool,
    pub num_beams: i64,
    pub temperature: f64,
    pub top_k: i64,
    pub top_p: f64,
    pub repetition_penalty: f64,
    pub length_penalty: f64,
    pub no_repeat_ngram_size: i64,
    pub num_return_sequences: i64,
    pub num_beam_groups: Option<i64>,
    pub diversity_penalty: Option<f64>,
    pub device: Device,
    pub kind: Option<Kind>,
}

Expand description

§Configuration for text generation

Contains information regarding the model to load, mirrors the GenerateConfig, with a different set of default parameters and sets the device to place the model on.

Fields§

§model_type: ModelType

Model type

§model_resource: ModelResource

Model weights resource (default: pretrained BART model on CNN-DM)

§config_resource: Box<dyn ResourceProvider + Send>

Config resource (default: pretrained BART model on CNN-DM)

§vocab_resource: Box<dyn ResourceProvider + Send>

Vocab resource (default: pretrained BART model on CNN-DM)

§merges_resource: Option<Box<dyn ResourceProvider + Send>>

Merges resource (default: pretrained BART model on CNN-DM)

§min_length: i64

Minimum sequence length (default: 0)

§max_length: Option<i64>

Maximum sequence length (default: 56)

§do_sample: bool

Sampling flag. If true, will perform top-k and/or nucleus sampling on generated tokens, otherwise greedy (deterministic) decoding (default: true)

§early_stopping: bool

Early stopping flag indicating if the beam search should stop as soon as num_beam hypotheses have been generated (default: false)

§num_beams: i64

Number of beams for beam search (default: 5)

§temperature: f64

Temperature setting. Values higher than 1 will improve originality at the risk of reducing relevance (default: 1.0)

§top_k: i64

Top_k values for sampling tokens. Value higher than 0 will enable the feature (default: 0)

§top_p: f64

Top_p value for Nucleus sampling, Holtzman et al.. Keep top tokens until cumulative probability reaches top_p (default: 0.9)

§repetition_penalty: f64

Repetition penalty (mostly useful for CTRL decoders). Values higher than 1 will penalize tokens that have been already generated. (default: 1.0)

§length_penalty: f64

Exponential penalty based on the length of the hypotheses generated (default: 1.0)

§no_repeat_ngram_size: i64

Number of allowed repetitions of n-grams. Values higher than 0 turn on this feature and will prevent repeats of n-grams with a length equal or greater to this value (default: 0)

§num_return_sequences: i64

Number of sequences to return for each prompt text (default: 1)

§num_beam_groups: Option<i64>

Number of beam groups for diverse beam generation. If provided and higher than 1, will split the beams into beam subgroups leading to more diverse generation.

§diversity_penalty: Option<f64>

Diversity penalty for diverse beam search. High values will enforce more difference between beam groups (default: 5.5)

§device: Device

Device to place the model on (default: CUDA/GPU when available)

§kind: Option<Kind>

Model weights precision. If not provided, will default to full precision on CPU, or the loaded weights precision otherwise

Struct TextGenerationConfigCopy item path

§Configuration for text generation

Fields§

Implementations§

impl TextGenerationConfig

pub fn new<RC, RV>( model_type: ModelType, model_resource: ModelResource, config_resource: RC, vocab_resource: RV, merges_resource: Option<RV>, ) -> TextGenerationConfigwhere RC: ResourceProvider + Send + 'static, RV: ResourceProvider + Send + 'static,

§Arguments

Trait Implementations§

impl Default for TextGenerationConfig

fn default() -> TextGenerationConfig

impl From<TextGenerationConfig> for GenerateConfig

fn from(config: TextGenerationConfig) -> GenerateConfig

Auto Trait Implementations§

impl Freeze for TextGenerationConfig

impl !RefUnwindSafe for TextGenerationConfig

impl Send for TextGenerationConfig

impl Sync for TextGenerationConfig

impl Unpin for TextGenerationConfig

impl !UnwindSafe for TextGenerationConfig

Blanket Implementations§

impl<T> Any for Twhere T: 'static + ?Sized,

fn type_id(&self) -> TypeId

impl<T> Borrow<T> for Twhere T: ?Sized,

fn borrow(&self) -> &T

impl<T> BorrowMut<T> for Twhere T: ?Sized,

fn borrow_mut(&mut self) -> &mut T

impl<T> From<T> for T

fn from(t: T) -> T

impl<T> Instrument for T

fn instrument(self, span: Span) -> Instrumented<Self>

fn in_current_span(self) -> Instrumented<Self>

impl<T, U> Into<U> for Twhere U: From<T>,

fn into(self) -> U

impl<T> IntoEither for T

fn into_either(self, into_left: bool) -> Either<Self, Self>

fn into_either_with<F>(self, into_left: F) -> Either<Self, Self>where F: FnOnce(&Self) -> bool,

impl<T> Pointable for T

const ALIGN: usize

type Init = T

unsafe fn init(init: <T as Pointable>::Init) -> usize

unsafe fn deref<'a>(ptr: usize) -> &'a T

unsafe fn deref_mut<'a>(ptr: usize) -> &'a mut T

unsafe fn drop(ptr: usize)

impl<T> Same for T

type Output = T

impl<T, U> TryFrom<U> for Twhere U: Into<T>,

type Error = Infallible

fn try_from(value: U) -> Result<T, <T as TryFrom<U>>::Error>

impl<T, U> TryInto<U> for Twhere U: TryFrom<T>,

type Error = <U as TryFrom<T>>::Error

fn try_into(self) -> Result<U, <U as TryFrom<T>>::Error>

impl<V, T> VZip<V> for Twhere V: MultiLane<T>,

fn vzip(self) -> V

impl<T> WithSubscriber for T

fn with_subscriber<S>(self, subscriber: S) -> WithDispatch<Self>where S: Into<Dispatch>,

fn with_current_subscriber(self) -> WithDispatch<Self>

impl<T> ErasedDestructor for Twhere T: 'static,

impl<T> MaybeSendSync for T

Struct TextGenerationConfig

pub fn new<RC, RV>( model_type: ModelType, model_resource: ModelResource, config_resource: RC, vocab_resource: RV, merges_resource: Option<RV>, ) -> TextGenerationConfig
where RC: ResourceProvider + Send + 'static, RV: ResourceProvider + Send + 'static,

impl<T> Any for T
where T: 'static + ?Sized,

impl<T> Borrow<T> for T
where T: ?Sized,

impl<T> BorrowMut<T> for T
where T: ?Sized,

impl<T, U> Into<U> for T
where U: From<T>,

fn into_either_with<F>(self, into_left: F) -> Either<Self, Self>
where F: FnOnce(&Self) -> bool,

impl<T, U> TryFrom<U> for T
where U: Into<T>,

impl<T, U> TryInto<U> for T
where U: TryFrom<T>,

impl<V, T> VZip<V> for T
where V: MultiLane<T>,

fn with_subscriber<S>(self, subscriber: S) -> WithDispatch<Self>
where S: Into<Dispatch>,

impl<T> ErasedDestructor for T
where T: 'static,