Enum rust_bert::pipelines::common::TokenizerOption [−][src]
pub enum TokenizerOption {
Show 15 variants
Bert(BertTokenizer),
Roberta(RobertaTokenizer),
XLMRoberta(XLMRobertaTokenizer),
Marian(MarianTokenizer),
T5(T5Tokenizer),
Albert(AlbertTokenizer),
XLNet(XLNetTokenizer),
GPT2(Gpt2Tokenizer),
OpenAiGpt(OpenAiGptTokenizer),
Reformer(ReformerTokenizer),
ProphetNet(ProphetNetTokenizer),
Pegasus(PegasusTokenizer),
MBart50(MBart50Tokenizer),
M2M100(M2M100Tokenizer),
FNet(FNetTokenizer),
}
Expand description
Variants
Bert(BertTokenizer)
Tuple Fields
Bert Tokenizer
Roberta(RobertaTokenizer)
Tuple Fields
Roberta Tokenizer
XLMRoberta(XLMRobertaTokenizer)
Tuple Fields
XLMRoberta Tokenizer
Marian(MarianTokenizer)
Tuple Fields
Marian Tokenizer
T5(T5Tokenizer)
Tuple Fields
0: T5Tokenizer
T5 Tokenizer
Albert(AlbertTokenizer)
Tuple Fields
Albert Tokenizer
XLNet(XLNetTokenizer)
Tuple Fields
XLNet Tokenizer
GPT2(Gpt2Tokenizer)
Tuple Fields
GPT2 Tokenizer
OpenAiGpt(OpenAiGptTokenizer)
Tuple Fields
GPT Tokenizer
Reformer(ReformerTokenizer)
Tuple Fields
Reformer Tokenizer
ProphetNet(ProphetNetTokenizer)
Tuple Fields
ProphetNet Tokenizer
Pegasus(PegasusTokenizer)
Tuple Fields
Pegasus Tokenizer
MBart50(MBart50Tokenizer)
Tuple Fields
MBart50 Tokenizer
M2M100(M2M100Tokenizer)
Tuple Fields
M2M100 Tokenizer
FNet(FNetTokenizer)
Tuple Fields
FNet Tokenizer
Implementations
Interface method to load a tokenizer from file
Returns the model type
Interface method
Interface method for pair encoding
pub fn encode_pair(
&self,
text_1: &str,
text_2: Option<&str>,
max_len: usize,
truncation_strategy: &TruncationStrategy,
stride: usize
) -> TokenizedInput
Interface method for pair encoding (single input)
Interface method for tokenization
Interface method for tokenization
Interface method for tokenization
Interface method for decoding
pub fn build_input_with_special_tokens(
&self,
token_ids_with_offsets_1: TokenIdsWithOffsets,
token_ids_with_offsets_2: Option<TokenIdsWithOffsets>
) -> TokenizedInput
Interface method to build input with special tokens
Interface method to convert tokens to ids
Interface method
Interface method
Interface method
Auto Trait Implementations
impl RefUnwindSafe for TokenizerOption
impl Send for TokenizerOption
impl Sync for TokenizerOption
impl Unpin for TokenizerOption
impl UnwindSafe for TokenizerOption
Blanket Implementations
Mutably borrows from an owned value. Read more
Instruments this type with the provided Span, returning an
Instrumented wrapper. Read more
type Output = T
type Output = T
Should always be Self
