pub struct TokenizationStats {
pub total_tokens: usize,
pub unique_tokens: usize,
pub special_tokens_count: usize,
pub average_token_length: f64,
pub compression_ratio: f64,
pub oov_count: usize,
pub token_type_distribution: HashMap<String, usize>,
pub longest_token: Option<String>,
pub shortest_token: Option<String>,
}
Expand description
Statistics about tokenization
Fields§
§total_tokens: usize
§unique_tokens: usize
§special_tokens_count: usize
§average_token_length: f64
§compression_ratio: f64
§oov_count: usize
§token_type_distribution: HashMap<String, usize>
§longest_token: Option<String>
§shortest_token: Option<String>
Trait Implementations§
Source§impl Clone for TokenizationStats
impl Clone for TokenizationStats
Source§fn clone(&self) -> TokenizationStats
fn clone(&self) -> TokenizationStats
Returns a duplicate of the value. Read more
1.0.0 · Source§fn clone_from(&mut self, source: &Self)
fn clone_from(&mut self, source: &Self)
Performs copy-assignment from source. Read more
Source§impl Debug for TokenizationStats
impl Debug for TokenizationStats
Source§impl<'de> Deserialize<'de> for TokenizationStats
impl<'de> Deserialize<'de> for TokenizationStats
Source§fn deserialize<__D>(__deserializer: __D) -> Result<Self, __D::Error>
where
    __D: Deserializer<'de>,
fn deserialize<__D>(__deserializer: __D) -> Result<Self, __D::Error>
where
    __D: Deserializer<'de>,
Deserialize this value from the given Serde deserializer. Read more
Auto Trait Implementations§
impl Freeze for TokenizationStats
impl RefUnwindSafe for TokenizationStats
impl Send for TokenizationStats
impl Sync for TokenizationStats
impl Unpin for TokenizationStats
impl UnsafeUnpin for TokenizationStats
impl UnwindSafe for TokenizationStats
Blanket Implementations§
Source§impl<T> BorrowMut<T> for T
where
    T: ?Sized,
impl<T> BorrowMut<T> for T
where
    T: ?Sized,
Source§fn borrow_mut(&mut self) -> &mut T
fn borrow_mut(&mut self) -> &mut T
Mutably borrows from an owned value. Read more
Source§impl<T> CloneToUninit for T
where
    T: Clone,
impl<T> CloneToUninit for T
where
    T: Clone,
Source§impl<T> ConfigSerializable for T
where
    T: Serialize + for<'de> Deserialize<'de>,
impl<T> ConfigSerializable for T
where
    T: Serialize + for<'de> Deserialize<'de>,
Source§fn save_to_file(&self, path: &Path) -> Result<(), TrustformersError>
fn save_to_file(&self, path: &Path) -> Result<(), TrustformersError>
Save to file
Source§fn load_from_file(path: &Path) -> Result<Self, TrustformersError>
where
    Self: Sized,
fn load_from_file(path: &Path) -> Result<Self, TrustformersError>
where
    Self: Sized,
Load from file
Source§impl<T> Instrument for T
impl<T> Instrument for T
Source§fn instrument(self, span: Span) -> Instrumented<Self>
fn instrument(self, span: Span) -> Instrumented<Self>
Source§fn in_current_span(self) -> Instrumented<Self>
fn in_current_span(self) -> Instrumented<Self>
Source§impl<T> IntoEither for T
impl<T> IntoEither for T
Source§fn into_either(self, into_left: bool) -> Either<Self, Self>
fn into_either(self, into_left: bool) -> Either<Self, Self>
Converts `self` into a `Left` variant of `Either<Self, Self>` if `into_left` is `true`. Converts `self` into a `Right` variant of `Either<Self, Self>` otherwise. Read more
Source§fn into_either_with<F>(self, into_left: F) -> Either<Self, Self>
fn into_either_with<F>(self, into_left: F) -> Either<Self, Self>
Converts `self` into a `Left` variant of `Either<Self, Self>` if `into_left(&self)` returns `true`. Converts `self` into a `Right` variant of `Either<Self, Self>` otherwise. Read more