use std::borrow::Borrow;
use prelude::{NaiveDocument, NormalizationFactor, ProcessedDocument, Tf};
/// Binary term-frequency weighting.
///
/// The weight is `1.0` when the document reports that the term exists and
/// `0.0` otherwise; how often the term occurs is not consulted.
#[derive(Copy, Clone)]
pub struct BinaryTf;

impl<T: NaiveDocument> Tf<T> for BinaryTf {
    /// Returns `1.0` if `doc.term_exists(term)` is true, else `0.0`.
    #[inline]
    fn tf<K: Borrow<T::Term>>(term: K, doc: &T) -> f64 {
        let present = doc.term_exists(term);
        if present {
            1.0
        } else {
            0.0
        }
    }
}
/// Raw-frequency term weighting: the weight is the term's occurrence count
/// in the document, converted to `f64`.
///
/// NOTE(review): the wrapped `f64` is never read by the `Tf` impl below and
/// the sibling schemes are unit structs; confirm whether the field is needed.
#[derive(Copy, Clone)]
pub struct RawFrequencyTf(f64);

impl<T: ProcessedDocument> Tf<T> for RawFrequencyTf {
    /// Returns `doc.term_frequency(term)` cast to `f64`.
    #[inline]
    fn tf<K: Borrow<T::Term>>(term: K, doc: &T) -> f64 {
        let occurrences = doc.term_frequency(term);
        occurrences as f64
    }
}
/// Log-normalized term-frequency weighting.
///
/// For a term that occurs `f > 0` times in the document the weight is
/// `1 + ln(f)`. A term that does not occur gets weight `0`.
#[derive(Copy, Clone)]
pub struct LogNormalizationTf;

impl<T> Tf<T> for LogNormalizationTf
where
    T: ProcessedDocument,
{
    /// Returns `1 + ln(f)` where `f` is `doc.term_frequency(term)`, or `0.0`
    /// when `f` is zero.
    #[inline]
    fn tf<K>(term: K, doc: &T) -> f64
    where
        K: Borrow<T::Term>,
    {
        let count = doc.term_frequency(term) as f64;
        if count > 0f64 {
            1f64 + count.ln()
        } else {
            // ln(0) is -inf; an absent term must not yield an infinite
            // (or, once multiplied by a zero IDF, NaN) weight.
            0f64
        }
    }
}
/// Marker trait for double-normalization-K weighting schemes.
///
/// Any type implementing it receives the blanket `Tf` impl below, with `K`
/// taken from its `NormalizationFactor::factor()`.
pub trait DoubleKNormalizationTf: NormalizationFactor {}

impl<T: ProcessedDocument, S: DoubleKNormalizationTf> Tf<T> for S {
    /// Computes `K + (1 - K) * f / f_max`, where `K` is `S::factor()`, `f` is
    /// the frequency of `term`, and `f_max` is the frequency of the term
    /// returned by `doc.max()` (or `1` when `doc.max()` is `None`).
    ///
    /// NOTE(review): if `doc.max()` ever yields a term whose frequency is
    /// zero, the division produces NaN or infinity; confirm implementors
    /// never do that.
    #[inline]
    fn tf<K: Borrow<T::Term>>(term: K, doc: &T) -> f64 {
        // Frequency of the document's top term; fall back to 1 so the ratio
        // below stays well-defined when there is no top term.
        let peak = doc
            .max()
            .map(|top| doc.term_frequency(top) as f64)
            .unwrap_or(1f64);

        let floor = S::factor();
        let span = 1f64 - S::factor();
        let share = doc.term_frequency(term) as f64 / peak;

        floor + span * share
    }
}
/// Double-normalization weighting with the factor fixed at one half.
///
/// Implements `DoubleKNormalizationTf`, with `factor()` returning `0.5`.
#[derive(Copy, Clone)]
pub struct DoubleHalfNormalizationTf;

impl NormalizationFactor for DoubleHalfNormalizationTf {
    /// The constant normalization factor, `0.5`.
    #[inline]
    fn factor() -> f64 {
        0.5
    }
}

// Marker impl: opts this type into the double-K weighting scheme.
impl DoubleKNormalizationTf for DoubleHalfNormalizationTf {}