Struct punkt::TrainingData
Stores data that was obtained during training.
Examples
Precompiled data can be loaded via a language specific constructor.
let eng_data = TrainingData::english();
let ger_data = TrainingData::german();
assert!(eng_data.contains_abbrev("va"));
assert!(ger_data.contains_abbrev("crz"));
Methods
impl TrainingData
[src]
pub fn new() -> TrainingData
[src]
Creates a new, empty data object.
pub fn contains_abbrev(&self, tok: &str) -> bool
[src]
Checks if a token is considered to be an abbreviation.
pub fn contains_sentence_starter(&self, tok: &str) -> bool
[src]
Checks if a token is considered to be one that commonly starts a sentence.
pub fn contains_collocation(&self, left: &str, right: &str) -> bool
[src]
Checks if a pair of words is commonly known to appear together.
pub fn get_orthographic_context(&self, tok: &str) -> u8
[src]
Gets the orthographic context for a token. Returns 0 if the token was not yet encountered.
impl TrainingData
[src]
pub fn czech() -> TrainingData
[src]
impl TrainingData
[src]
pub fn danish() -> TrainingData
[src]
impl TrainingData
[src]
pub fn dutch() -> TrainingData
[src]
impl TrainingData
[src]
pub fn english() -> TrainingData
[src]
impl TrainingData
[src]
pub fn estonian() -> TrainingData
[src]
impl TrainingData
[src]
pub fn finnish() -> TrainingData
[src]
impl TrainingData
[src]
pub fn french() -> TrainingData
[src]
impl TrainingData
[src]
pub fn german() -> TrainingData
[src]
impl TrainingData
[src]
pub fn greek() -> TrainingData
[src]
impl TrainingData
[src]
pub fn italian() -> TrainingData
[src]
impl TrainingData
[src]
pub fn norwegian() -> TrainingData
[src]
impl TrainingData
[src]
pub fn polish() -> TrainingData
[src]
impl TrainingData
[src]
pub fn portuguese() -> TrainingData
[src]
impl TrainingData
[src]
pub fn slovene() -> TrainingData
[src]
impl TrainingData
[src]
pub fn spanish() -> TrainingData
[src]
impl TrainingData
[src]
pub fn swedish() -> TrainingData
[src]
impl TrainingData
[src]
pub fn turkish() -> TrainingData
[src]
Trait Implementations
impl Default for TrainingData
[src]
fn default() -> TrainingData
[src]
impl Debug for TrainingData
[src]
impl FromStr for TrainingData
[src]
Auto Trait Implementations
impl Send for TrainingData
impl Sync for TrainingData
Blanket Implementations
impl<T> From<T> for T
[src]
impl<T, U> Into<U> for T where
U: From<T>,
[src]
U: From<T>,
impl<T, U> TryFrom<U> for T where
U: Into<T>,
[src]
U: Into<T>,
type Error = !
🔬 This is a nightly-only experimental API. (try_from)
The type returned in the event of a conversion error.
fn try_from(value: U) -> Result<T, <T as TryFrom<U>>::Error>
[src]
impl<T> Borrow<T> for T where
T: ?Sized,
[src]
T: ?Sized,
impl<T> Any for T where
T: 'static + ?Sized,
[src]
T: 'static + ?Sized,
impl<T> BorrowMut<T> for T where
T: ?Sized,
[src]
T: ?Sized,
fn borrow_mut(&mut self) -> &mut T
[src]
impl<T, U> TryInto<U> for T where
U: TryFrom<T>,
[src]
U: TryFrom<T>,