pub struct BinaryTokenizer {
pub vocab: HashMap<String, u32>,
pub id_to_token: HashMap<u32, String>,
pub special_tokens: HashMap<String, u32>,
pub scores: Option<HashMap<u32, f32>>,
pub merges: Option<Vec<(String, String)>>,
pub config: HashMap<String, Value>,
pub normalization_rules: Option<Vec<NormalizationRule>>,
pub pre_tokenization_rules: Option<Vec<PreTokenizationRule>>,
}
Binary tokenizer representation
Fields§
vocab: HashMap<String, u32> — Vocabulary mapping from tokens to IDs
id_to_token: HashMap<u32, String> — Reverse mapping from IDs to tokens
special_tokens: HashMap<String, u32> — Special tokens with their IDs
scores: Option<HashMap<u32, f32>> — Token scores for ranking (if applicable)
merges: Option<Vec<(String, String)>> — Merges for BPE tokenizers (if applicable)
config: HashMap<String, Value> — Additional tokenizer-specific configuration
normalization_rules: Option<Vec<NormalizationRule>> — Normalization rules
pre_tokenization_rules: Option<Vec<PreTokenizationRule>> — Pre-tokenization rules
Trait Implementations§
Source§impl Clone for BinaryTokenizer
impl Clone for BinaryTokenizer
Source§fn clone(&self) -> BinaryTokenizer
fn clone(&self) -> BinaryTokenizer
Returns a duplicate of the value. Read more
1.0.0 · Source§fn clone_from(&mut self, source: &Self)
fn clone_from(&mut self, source: &Self)
Performs copy-assignment from source. Read more
Source§impl Debug for BinaryTokenizer
impl Debug for BinaryTokenizer
Source§impl<'de> Deserialize<'de> for BinaryTokenizer
impl<'de> Deserialize<'de> for BinaryTokenizer
Source§fn deserialize<__D>(__deserializer: __D) -> Result<Self, __D::Error> where
__D: Deserializer<'de>,
fn deserialize<__D>(__deserializer: __D) -> Result<Self, __D::Error> where
__D: Deserializer<'de>,
Deserialize this value from the given Serde deserializer. Read more
Auto Trait Implementations§
impl Freeze for BinaryTokenizer
impl RefUnwindSafe for BinaryTokenizer
impl Send for BinaryTokenizer
impl Sync for BinaryTokenizer
impl Unpin for BinaryTokenizer
impl UnsafeUnpin for BinaryTokenizer
impl UnwindSafe for BinaryTokenizer
Blanket Implementations§
Source§impl<T> BorrowMut<T> for T where
T: ?Sized,
impl<T> BorrowMut<T> for T where
T: ?Sized,
Source§fn borrow_mut(&mut self) -> &mut T
fn borrow_mut(&mut self) -> &mut T
Mutably borrows from an owned value. Read more
Source§impl<T> CloneToUninit for T where
T: Clone,
impl<T> CloneToUninit for T where
T: Clone,
Source§impl<T> ConfigSerializable for T where
T: Serialize + for<'de> Deserialize<'de>,
impl<T> ConfigSerializable for T where
T: Serialize + for<'de> Deserialize<'de>,
Source§fn save_to_file(&self, path: &Path) -> Result<(), TrustformersError>
fn save_to_file(&self, path: &Path) -> Result<(), TrustformersError>
Save to file
Source§fn load_from_file(path: &Path) -> Result<Self, TrustformersError> where
Self: Sized,
fn load_from_file(path: &Path) -> Result<Self, TrustformersError> where
Self: Sized,
Load from file
Source§impl<T> Instrument for T
impl<T> Instrument for T
Source§fn instrument(self, span: Span) -> Instrumented<Self>
fn instrument(self, span: Span) -> Instrumented<Self>
Source§fn in_current_span(self) -> Instrumented<Self>
fn in_current_span(self) -> Instrumented<Self>
Source§impl<T> IntoEither for T
impl<T> IntoEither for T
Source§fn into_either(self, into_left: bool) -> Either<Self, Self>
fn into_either(self, into_left: bool) -> Either<Self, Self>
Converts self into a Left variant of Either<Self, Self> if into_left is true.
Converts self into a Right variant of Either<Self, Self> otherwise. Read more
Source§fn into_either_with<F>(self, into_left: F) -> Either<Self, Self>
fn into_either_with<F>(self, into_left: F) -> Either<Self, Self>
Converts self into a Left variant of Either<Self, Self> if into_left(&self) returns true.
Converts self into a Right variant of Either<Self, Self> otherwise. Read more