pub struct CountVectorizer { /* private fields */ }
Expand description
Count vectorizer for converting text documents to term frequency vectors
Implementations§
Source§impl CountVectorizer
impl CountVectorizer
Source§pub fn with_max_features(self, maxfeatures: usize) -> Self
pub fn with_max_features(self, maxfeatures: usize) -> Self
Set maximum number of features
Source§pub fn with_min_df(self, mindf: f64) -> Self
pub fn with_min_df(self, mindf: f64) -> Self
Set minimum document frequency
Source§pub fn with_max_df(self, maxdf: f64) -> Self
pub fn with_max_df(self, maxdf: f64) -> Self
Set maximum document frequency
Source§pub fn with_lowercase(self, lowercase: bool) -> Self
pub fn with_lowercase(self, lowercase: bool) -> Self
Set whether to convert to lowercase
Source§pub fn with_token_pattern(self, pattern: &str) -> Result<Self>
pub fn with_token_pattern(self, pattern: &str) -> Result<Self>
Set custom token pattern
Source§pub fn with_stop_words(self, stopwords: Vec<String>) -> Self
pub fn with_stop_words(self, stopwords: Vec<String>) -> Self
Set stop words
Source§pub fn fit(&mut self, documents: &[String]) -> Result<()>
pub fn fit(&mut self, documents: &[String]) -> Result<()>
Fit the vectorizer on a collection of documents
Source§pub fn transform(&self, documents: &[String]) -> Result<Array2<f64>>
pub fn transform(&self, documents: &[String]) -> Result<Array2<f64>>
Transform documents to count vectors
Source§pub fn fit_transform(&mut self, documents: &[String]) -> Result<Array2<f64>>
pub fn fit_transform(&mut self, documents: &[String]) -> Result<Array2<f64>>
Fit and transform in one step
Source§pub fn get_feature_names(&self) -> &[String]
pub fn get_feature_names(&self) -> &[String]
Get feature names
Trait Implementations§
Auto Trait Implementations§
impl Freeze for CountVectorizer
impl RefUnwindSafe for CountVectorizer
impl Send for CountVectorizer
impl Sync for CountVectorizer
impl Unpin for CountVectorizer
impl UnwindSafe for CountVectorizer
Blanket Implementations§
Source§impl<T> BorrowMut<T> for T
where
    T: ?Sized,
impl<T> BorrowMut<T> for T
where
    T: ?Sized,
Source§fn borrow_mut(&mut self) -> &mut T
fn borrow_mut(&mut self) -> &mut T
Mutably borrows from an owned value. Read more
Source§impl<T> IntoEither for T
impl<T> IntoEither for T
Source§fn into_either(self, into_left: bool) -> Either<Self, Self>
fn into_either(self, into_left: bool) -> Either<Self, Self>
Converts `self` into a `Left` variant of `Either<Self, Self>` if `into_left` is `true`. Converts `self` into a `Right` variant of `Either<Self, Self>` otherwise. Read more
Source§fn into_either_with<F>(self, into_left: F) -> Either<Self, Self>
fn into_either_with<F>(self, into_left: F) -> Either<Self, Self>
Converts `self` into a `Left` variant of `Either<Self, Self>` if `into_left(&self)` returns `true`. Converts `self` into a `Right` variant of `Either<Self, Self>` otherwise. Read more
Source§impl<T> Pointable for T
impl<T> Pointable for T
Source§impl<SS, SP> SupersetOf<SS> for SP
where
    SS: SubsetOf<SP>,
impl<SS, SP> SupersetOf<SS> for SP
where
    SS: SubsetOf<SP>,
Source§fn to_subset(&self) -> Option<SS>
fn to_subset(&self) -> Option<SS>
The inverse inclusion map: attempts to construct `self` from the equivalent element of its superset. Read more
Source§fn is_in_subset(&self) -> bool
fn is_in_subset(&self) -> bool
Checks if `self` is actually part of its subset `T` (and can be converted to it).
Source§fn to_subset_unchecked(&self) -> SS
fn to_subset_unchecked(&self) -> SS
Use with care! Same as `self.to_subset` but without any property checks. Always succeeds.
Source§fn from_subset(element: &SS) -> SP
fn from_subset(element: &SS) -> SP
The inclusion map: converts `self` to the equivalent element of its superset.