Struct linfa_preprocessing::tf_idf_vectorization::FittedTfIdfVectorizer[][src]

pub struct FittedTfIdfVectorizer { /* fields omitted */ }

Counts the occurrences of each vocabulary entry, learned during fitting, in a sequence of texts and scales them by the inverse document document frequency defined by the method. Each vocabulary entry is mapped to an integer value that is used to index the count in the result.

Implementations

impl FittedTfIdfVectorizer[src]

pub fn nentries(&self) -> usize[src]

Number of vocabulary entries learned during fitting

pub fn vocabulary(&self) -> &Vec<String>[src]

Constains all vocabulary entries, in the same order used by the transform method.

pub fn method(&self) -> &TfIdfMethod[src]

Returns the inverse document frequency method used in the tansform method

pub fn transform<T: ToString, D: Data<Elem = T>>(
    &self,
    x: &ArrayBase<D, Ix1>
) -> CsMat<f64>
[src]

Given a sequence of n documents, produces an array of size (n, vocabulary_entries) where column j of row i is the number of occurrences of vocabulary entry j in the text of index i, scaled by the inverse document frequency. Vocabulary entry j is the string at the j-th position in the vocabulary.

pub fn transform_files<P: AsRef<Path>>(
    &self,
    input: &[P],
    encoding: EncodingRef,
    trap: DecoderTrap
) -> CsMat<f64>
[src]

Auto Trait Implementations

Blanket Implementations

impl<T> Any for T where
    T: 'static + ?Sized
[src]

impl<T> Borrow<T> for T where
    T: ?Sized
[src]

impl<T> BorrowMut<T> for T where
    T: ?Sized
[src]

impl<T> From<T> for T[src]

impl<T, U> Into<U> for T where
    U: From<T>, 
[src]

impl<T, U> TryFrom<U> for T where
    U: Into<T>, 
[src]

type Error = Infallible

The type returned in the event of a conversion error.

impl<T, U> TryInto<U> for T where
    U: TryFrom<T>, 
[src]

type Error = <U as TryFrom<T>>::Error

The type returned in the event of a conversion error.

impl<V, T> VZip<V> for T where
    V: MultiLane<T>,