pub struct TfidfVectorizer { /* private fields */ }
Expand description
TF-IDF vectorizer that computes term frequency-inverse document frequency
Implementations§
Source§impl TfidfVectorizer
impl TfidfVectorizer
Source pub fn new(binary: bool, smoothidf: bool, norm: Option<String>) -> Self
pub fn new(binary: bool, smoothidf: bool, norm: Option<String>) -> Self
Create a new TF-IDF vectorizer
Source pub fn with_tokenizer(
tokenizer: Box<dyn Tokenizer + Send + Sync>,
binary: bool,
smoothidf: bool,
norm: Option<String>,
) -> Self
pub fn with_tokenizer( tokenizer: Box<dyn Tokenizer + Send + Sync>, binary: bool, smoothidf: bool, norm: Option<String>, ) -> Self
Create a TF-IDF vectorizer with a custom tokenizer
Source pub fn vocabulary(&self) -> &Vocabulary
pub fn vocabulary(&self) -> &Vocabulary
Get a reference to the vocabulary
Source pub fn vocabulary_size(&self) -> usize
pub fn vocabulary_size(&self) -> usize
Get the vocabulary size
Source pub fn get_feature_score(
&self,
matrix: &Array2<f64>,
document_index: usize,
feature_index: usize,
) -> Option<f64>
pub fn get_feature_score( &self, matrix: &Array2<f64>, document_index: usize, feature_index: usize, ) -> Option<f64>
Get TF-IDF score for a specific document and feature index from a matrix
Source pub fn vocabulary_map(&self) -> HashMap<String, usize>
pub fn vocabulary_map(&self) -> HashMap<String, usize>
Get vocabulary as HashMap for compatibility with visualization
Trait Implementations§
Source§impl Clone for TfidfVectorizer
impl Clone for TfidfVectorizer
Source§fn clone(&self) -> TfidfVectorizer
fn clone(&self) -> TfidfVectorizer
Returns a duplicate of the value. Read more
1.0.0 · Source§fn clone_from(&mut self, source: &Self)
fn clone_from(&mut self, source: &Self)
Performs copy-assignment from source. Read more
Source§impl Default for TfidfVectorizer
impl Default for TfidfVectorizer
Source§impl Vectorizer for TfidfVectorizer
impl Vectorizer for TfidfVectorizer
Auto Trait Implementations§
impl Freeze for TfidfVectorizer
impl !RefUnwindSafe for TfidfVectorizer
impl Send for TfidfVectorizer
impl Sync for TfidfVectorizer
impl Unpin for TfidfVectorizer
impl UnsafeUnpin for TfidfVectorizer
impl !UnwindSafe for TfidfVectorizer
Blanket Implementations§
Source§impl<T> BorrowMut<T> for T
where
    T: ?Sized,
impl<T> BorrowMut<T> for T
where
    T: ?Sized,
Source§fn borrow_mut(&mut self) -> &mut T
fn borrow_mut(&mut self) -> &mut T
Mutably borrows from an owned value. Read more
Source§impl<T> CloneToUninit for T
where
    T: Clone,
impl<T> CloneToUninit for T
where
    T: Clone,
Source§impl<T> IntoEither for T
impl<T> IntoEither for T
Source§fn into_either(self, into_left: bool) -> Either<Self, Self>
fn into_either(self, into_left: bool) -> Either<Self, Self>
Converts self into a Left variant of Either<Self, Self> if into_left is true.
Converts self into a Right variant of Either<Self, Self> otherwise. Read more
Source§fn into_either_with<F>(self, into_left: F) -> Either<Self, Self>
fn into_either_with<F>(self, into_left: F) -> Either<Self, Self>
Converts self into a Left variant of Either<Self, Self> if into_left(&self) returns true.
Converts self into a Right variant of Either<Self, Self> otherwise. Read more
Source§impl<T> Pointable for T
impl<T> Pointable for T
Source§impl<SS, SP> SupersetOf<SS> for SP
where
    SS: SubsetOf<SP>,
impl<SS, SP> SupersetOf<SS> for SP
where
    SS: SubsetOf<SP>,
Source§fn to_subset(&self) -> Option<SS>
fn to_subset(&self) -> Option<SS>
The inverse inclusion map: attempts to construct self from the equivalent element of its superset. Read more
Source§fn is_in_subset(&self) -> bool
fn is_in_subset(&self) -> bool
Checks if self is actually part of its subset T (and can be converted to it).
Source§fn to_subset_unchecked(&self) -> SS
fn to_subset_unchecked(&self) -> SS
Use with care! Same as self.to_subset but without any property checks. Always succeeds.
Source§fn from_subset(element: &SS) -> SP
fn from_subset(element: &SS) -> SP
The inclusion map: converts self to the equivalent element of its superset.