Struct Detector

Source
pub struct Detector<'m, H: RealHasher> {
    pub languages: HashSet<ScriptLanguage, H>,
    pub long_text_minlen: usize,
    /* private fields */
}

Fields§

§languages: HashSet<ScriptLanguage, H>

§long_text_minlen: usize

Implementations§

Source§

impl<'m, H: RealHasher> Detector<'m, H>

Source

pub fn clone_with_languages<H2: RealHasher>( &self, languages: HashSet<ScriptLanguage, H2>, ) -> Detector<'m, H2>

Clone detector with new languages selected

Source

pub fn preload_models(&self)

Preloads models for the languages selected in this detector

Source

pub fn unload_models(&self)

Drops all models loaded

Source

pub fn probabilities(&self, text: &str) -> Vec<(ScriptLanguage, f64)>

Returns probabilities for the provided text. Each value is a logarithmic probability between negative infinity and 0.0.

The result is sorted by probability in descending order.

If only a single language is identified by alphabet_detector, the value 0.0 will be returned.

Source

pub fn probabilities_relative(&self, text: &str) -> Vec<(ScriptLanguage, f64)>

Returns probabilities for the provided text relative to other languages. Each value is a number between 0.0 and 1.0.

If only a single language is identified by alphabet_detector, the value 1.0 will be returned.

Source

pub fn detect_top_one_or_none( &self, text: &str, minimum_distance: f64, ) -> Option<ScriptLanguage>

Detects a top one language of the provided text.

minimum_distance is the distance between the first and second logarithmic probabilities, which can help filter out languages with close probabilities.

If a single language cannot be returned, None is returned.

Source

pub fn detect_top_one_reordered_custom<F>( &self, text: &str, reorder_distance_compute: F, ) -> Option<ScriptLanguage>
where F: FnOnce(Vec<Word<Vec<char>>>) -> f64,

Detects a top one language of the provided text. If multiple languages are covered by reorder distance (result of reorder_distance_compute), reorders by total speakers of these languages.

Reorder distance is a distance between logarithmic probabilities, must be >= 0.0.

None is returned only when probabilities is empty.

Source

pub fn detect_top_one_reordered(&self, text: &str) -> Option<ScriptLanguage>

Detects a top one language of the provided text. If multiple languages are covered by the reorder formula, reorders by total speakers of these languages. More suitable if you need better detection of common (more popular) languages.

None is returned only when probabilities is empty.

Source

pub fn detect_top_one_raw(&self, text: &str) -> Option<ScriptLanguage>

Detects a top one language of the provided text. More suitable if you need better detection of rare (less popular) languages.

None is returned only when probabilities is empty.

Source

pub fn detect_top_one( &self, text: &str, reorder: bool, ) -> Option<ScriptLanguage>

Trait Implementations§

Source§

impl<'m, H: Clone + RealHasher> Clone for Detector<'m, H>

Source§

fn clone(&self) -> Detector<'m, H>

Returns a duplicate of the value. Read more
1.0.0 · Source§

fn clone_from(&mut self, source: &Self)

Performs copy-assignment from source. Read more
Source§

impl<'m, H: Debug + RealHasher> Debug for Detector<'m, H>

Source§

fn fmt(&self, f: &mut Formatter<'_>) -> Result

Formats the value using the given formatter. Read more

Auto Trait Implementations§

§

impl<'m, H> Freeze for Detector<'m, H>
where H: Freeze,

§

impl<'m, H> !RefUnwindSafe for Detector<'m, H>

§

impl<'m, H> Send for Detector<'m, H>
where H: Send,

§

impl<'m, H> Sync for Detector<'m, H>
where H: Sync,

§

impl<'m, H> Unpin for Detector<'m, H>
where H: Unpin,

§

impl<'m, H> !UnwindSafe for Detector<'m, H>

Blanket Implementations§

Source§

impl<T> Any for T
where T: 'static + ?Sized,

Source§

fn type_id(&self) -> TypeId

Gets the TypeId of self. Read more
Source§

impl<T> Borrow<T> for T
where T: ?Sized,

Source§

fn borrow(&self) -> &T

Immutably borrows from an owned value. Read more
Source§

impl<T> BorrowMut<T> for T
where T: ?Sized,

Source§

fn borrow_mut(&mut self) -> &mut T

Mutably borrows from an owned value. Read more
Source§

impl<T> CloneToUninit for T
where T: Clone,

Source§

unsafe fn clone_to_uninit(&self, dest: *mut u8)

🔬This is a nightly-only experimental API. (clone_to_uninit)
Performs copy-assignment from self to dest. Read more
Source§

impl<T> From<T> for T

Source§

fn from(t: T) -> T

Returns the argument unchanged.

Source§

impl<T> Instrument for T

Source§

fn instrument(self, span: Span) -> Instrumented<Self>

Instruments this type with the provided Span, returning an Instrumented wrapper. Read more
Source§

fn in_current_span(self) -> Instrumented<Self>

Instruments this type with the current Span, returning an Instrumented wrapper. Read more
Source§

impl<T, U> Into<U> for T
where U: From<T>,

Source§

fn into(self) -> U

Calls U::from(self).

That is, this conversion is whatever the implementation of From<T> for U chooses to do.

Source§

impl<T> IntoEither for T

Source§

fn into_either(self, into_left: bool) -> Either<Self, Self>

Converts self into a Left variant of Either<Self, Self> if into_left is true. Converts self into a Right variant of Either<Self, Self> otherwise. Read more
Source§

fn into_either_with<F>(self, into_left: F) -> Either<Self, Self>
where F: FnOnce(&Self) -> bool,

Converts self into a Left variant of Either<Self, Self> if into_left(&self) returns true. Converts self into a Right variant of Either<Self, Self> otherwise. Read more
Source§

impl<T> Pointable for T

Source§

const ALIGN: usize

The alignment of pointer.
Source§

type Init = T

The type for initializers.
Source§

unsafe fn init(init: <T as Pointable>::Init) -> usize

Initializes an object with the given initializer. Read more
Source§

unsafe fn deref<'a>(ptr: usize) -> &'a T

Dereferences the given pointer. Read more
Source§

unsafe fn deref_mut<'a>(ptr: usize) -> &'a mut T

Mutably dereferences the given pointer. Read more
Source§

unsafe fn drop(ptr: usize)

Drops the object pointed to by the given pointer. Read more
Source§

impl<T> Same for T

Source§

type Output = T

Should always be Self
Source§

impl<T> ToOwned for T
where T: Clone,

Source§

type Owned = T

The resulting type after obtaining ownership.
Source§

fn to_owned(&self) -> T

Creates owned data from borrowed data, usually by cloning. Read more
Source§

fn clone_into(&self, target: &mut T)

Uses borrowed data to replace owned data, usually by cloning. Read more
Source§

impl<T, U> TryFrom<U> for T
where U: Into<T>,

Source§

type Error = Infallible

The type returned in the event of a conversion error.
Source§

fn try_from(value: U) -> Result<T, <T as TryFrom<U>>::Error>

Performs the conversion.
Source§

impl<T, U> TryInto<U> for T
where U: TryFrom<T>,

Source§

type Error = <U as TryFrom<T>>::Error

The type returned in the event of a conversion error.
Source§

fn try_into(self) -> Result<U, <U as TryFrom<T>>::Error>

Performs the conversion.
Source§

impl<T> WithSubscriber for T

Source§

fn with_subscriber<S>(self, subscriber: S) -> WithDispatch<Self>
where S: Into<Dispatch>,

Attaches the provided Subscriber to this type, returning a WithDispatch wrapper. Read more
Source§

fn with_current_subscriber(self) -> WithDispatch<Self>

Attaches the current default Subscriber to this type, returning a WithDispatch wrapper. Read more
Source§

impl<T> ErasedDestructor for T
where T: 'static,