pub struct CountVectorizer { /* private fields */ }
Expand description
Count vectorizer that uses a bag-of-words representation
Implementations§
Source§impl CountVectorizer
impl CountVectorizer
Source§pub fn with_tokenizer(
tokenizer: Box<dyn Tokenizer + Send + Sync>,
binary: bool,
) -> Self
pub fn with_tokenizer( tokenizer: Box<dyn Tokenizer + Send + Sync>, binary: bool, ) -> Self
Create a count vectorizer with a custom tokenizer
Source§pub fn vocabulary(&self) -> &Vocabulary
pub fn vocabulary(&self) -> &Vocabulary
Get a reference to the vocabulary
Source§pub fn vocabulary_size(&self) -> usize
pub fn vocabulary_size(&self) -> usize
Get the vocabulary size
Source§pub fn get_feature_count(
&self,
matrix: &Array2<f64>,
document_index: usize,
feature_index: usize,
) -> Option<f64>
pub fn get_feature_count( &self, matrix: &Array2<f64>, document_index: usize, feature_index: usize, ) -> Option<f64>
Get feature count for a specific document and feature index from a matrix
Source§pub fn vocabulary_map(&self) -> HashMap<String, usize>
pub fn vocabulary_map(&self) -> HashMap<String, usize>
Get vocabulary as HashMap for compatibility with visualization
Trait Implementations§
Source§impl Clone for CountVectorizer
impl Clone for CountVectorizer
Source§impl Default for CountVectorizer
impl Default for CountVectorizer
Source§impl Vectorizer for CountVectorizer
impl Vectorizer for CountVectorizer
Auto Trait Implementations§
impl Freeze for CountVectorizer
impl !RefUnwindSafe for CountVectorizer
impl Send for CountVectorizer
impl Sync for CountVectorizer
impl Unpin for CountVectorizer
impl UnsafeUnpin for CountVectorizer
impl !UnwindSafe for CountVectorizer
Blanket Implementations§
Source§impl<T> BorrowMut<T> for T where
T: ?Sized,
impl<T> BorrowMut<T> for T where
T: ?Sized,
Source§fn borrow_mut(&mut self) -> &mut T
fn borrow_mut(&mut self) -> &mut T
Mutably borrows from an owned value. Read more
Source§impl<T> CloneToUninit for T where
T: Clone,
impl<T> CloneToUninit for T where
T: Clone,
Source§impl<T> IntoEither for T
impl<T> IntoEither for T
Source§fn into_either(self, into_left: bool) -> Either<Self, Self>
fn into_either(self, into_left: bool) -> Either<Self, Self>
Converts self into a Left variant of Either<Self, Self> if into_left is true.
Converts self into a Right variant of Either<Self, Self> otherwise. Read more
Source§fn into_either_with<F>(self, into_left: F) -> Either<Self, Self>
fn into_either_with<F>(self, into_left: F) -> Either<Self, Self>
Converts self into a Left variant of Either<Self, Self> if into_left(&self) returns true.
Converts self into a Right variant of Either<Self, Self> otherwise. Read more
Source§impl<T> Pointable for T
impl<T> Pointable for T
Source§impl<SS, SP> SupersetOf<SS> for SP where
SS: SubsetOf<SP>,
impl<SS, SP> SupersetOf<SS> for SP where
SS: SubsetOf<SP>,
Source§fn to_subset(&self) -> Option<SS>
fn to_subset(&self) -> Option<SS>
The inverse inclusion map: attempts to construct self from the equivalent element of its superset. Read more
Source§fn is_in_subset(&self) -> bool
fn is_in_subset(&self) -> bool
Checks if self is actually part of its subset T (and can be converted to it).
Source§fn to_subset_unchecked(&self) -> SS
fn to_subset_unchecked(&self) -> SS
Use with care! Same as self.to_subset but without any property checks. Always succeeds.
Source§fn from_subset(element: &SS) -> SP
fn from_subset(element: &SS) -> SP
The inclusion map: converts self to the equivalent element of its superset.