Struct Segmenter 

pub struct Segmenter {
    pub mode: Mode,
    pub dictionary: Dictionary,
    pub user_dictionary: Option<UserDictionary>,
    pub keep_whitespace: bool,
    /* private fields */
}
A segmenter for tokenizing text. The Segmenter splits input text into tokens using a dictionary, an optional user dictionary, and a segmentation mode.

Fields§

§mode: Mode

The segmentation mode to be used by the segmenter. This determines how the text will be split into segments.

§dictionary: Dictionary

The dictionary used for segmenting text. This dictionary contains the necessary data structures and algorithms to perform morphological analysis and tokenization.

§user_dictionary: Option<UserDictionary>

An optional user-defined dictionary that can be used to customize the segmentation process. If provided, this dictionary will be used in addition to the default dictionary to improve the accuracy of segmentation for specific words or phrases.

§keep_whitespace: bool

Keep whitespace tokens in output.

When false (default), whitespace is ignored for MeCab compatibility. When true, whitespace tokens are included in the output.

Implementations§

impl Segmenter

pub fn new(mode: Mode, dictionary: Dictionary, user_dictionary: Option<UserDictionary>) -> Self

Creates a new Segmenter with the specified mode, dictionary, and optional user dictionary.

§Arguments
  • mode - The Mode in which the segmenter operates. This typically defines how aggressively the text is segmented or processed.
  • dictionary - The main Dictionary providing the core data and rules for tokenization.
  • user_dictionary - An optional UserDictionary whose user-defined tokens and rules extend or override those of the main dictionary.
§Returns

A new Segmenter configured with the provided mode, dictionary, and user dictionary (if any).

pub fn keep_whitespace(self, keep_whitespace: bool) -> Self

Builder method to set whether to keep whitespace tokens in output.

When keep_whitespace is false (default), whitespace is ignored for MeCab compatibility. When true, whitespace tokens are included in the output.

§Arguments
  • keep_whitespace - If true, whitespace tokens will be included in the output.
§Example
use lindera::mode::Mode;
use lindera::dictionary::load_dictionary;
use lindera::segmenter::Segmenter;

fn main() -> Result<(), Box<dyn std::error::Error>> {
    let dictionary = load_dictionary("embedded://ipadic")?;
    let segmenter = Segmenter::new(Mode::Normal, dictionary, None)
        .keep_whitespace(true);
    // `segmenter` is now ready to segment text.
    Ok(())
}

pub fn from_config(config: &SegmenterConfig) -> LinderaResult<Self>

Creates a Segmenter from the given SegmenterConfig.

§Errors

Returns an error if the dictionary or user dictionary specified in the configuration fails to load.


pub fn segment<'a>(&'a self, text: Cow<'a, str>) -> LinderaResult<Vec<Token<'a>>>

Segments the input text into tokens based on the dictionary and user-defined rules.

§Arguments
  • text - A Cow<'a, str> representing the input text. This can either be borrowed or owned, allowing for efficient text handling depending on the use case.
§Returns

Returns a LinderaResult<Vec<Token<'a>>> which contains a vector of tokens segmented from the input text. Each token represents a portion of the original text, along with metadata such as byte offsets and dictionary information.

§Process
  1. Sentence Splitting:

    • The input text is split into sentences using Japanese punctuation (。, 、), as well as \n and \t. Each sentence is processed individually.
  2. Lattice Processing:

    • For each sentence, a lattice structure is set up using the main dictionary and, if available, the user dictionary. The lattice helps identify possible token boundaries within the sentence.
    • The cost matrix is used to calculate the best path (i.e., the optimal sequence of tokens) through the lattice based on the mode.
  3. Token Generation:

    • For each segment (determined by the lattice), a token is generated using the byte offsets. The tokens contain the original text (in Cow::Owned form to ensure safe return), byte start/end positions, token positions, and dictionary references.
§Notes
  • The function ensures that each token is safely returned by converting substrings into Cow::Owned strings.
  • Byte offsets are carefully calculated to ensure that token boundaries are correct even across multiple sentences.
§Example Flow
  • Text is split into sentences based on punctuation.
  • A lattice is created and processed for each sentence.
  • Tokens are extracted from the lattice and returned in a vector.
§Errors
  • If the lattice fails to be processed or if there is an issue with the segmentation process, the function returns an error.
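The lattice search described above is a classic Viterbi-style shortest-path problem. The following self-contained sketch illustrates the idea with a toy dictionary of per-word costs; it is not lindera's implementation (which also applies connection costs from the cost matrix between adjacent tokens):

```rust
use std::collections::HashMap;

/// Minimal Viterbi search over a word lattice: from each byte position,
/// try every dictionary word that matches, and keep the cheapest path.
/// `word_cost` stands in for dictionary entries with their costs.
fn best_path(text: &str, word_cost: &HashMap<&str, i64>) -> Option<(Vec<String>, i64)> {
    let n = text.len();
    // best[i] = (cost of cheapest segmentation of text[..i], predecessor, word)
    let mut best: Vec<Option<(i64, usize, String)>> = vec![None; n + 1];
    best[0] = Some((0, 0, String::new()));
    for i in 0..n {
        let Some((cost_i, _, _)) = best[i].clone() else { continue };
        for (word, &c) in word_cost {
            if text[i..].starts_with(word) {
                let j = i + word.len();
                let cand = cost_i + c;
                if best[j].as_ref().map_or(true, |(c2, _, _)| cand < *c2) {
                    best[j] = Some((cand, i, word.to_string()));
                }
            }
        }
    }
    // Walk the predecessor chain back from the end of the text.
    let total = best[n].as_ref()?.0;
    let mut tokens = Vec::new();
    let mut pos = n;
    while pos > 0 {
        let (_, prev, word) = best[pos].clone().unwrap();
        tokens.push(word);
        pos = prev;
    }
    tokens.reverse();
    Some((tokens, total))
}

fn main() {
    let dict = HashMap::from([("ab", 10), ("a", 7), ("b", 7), ("c", 5), ("abc", 20)]);
    let (tokens, cost) = best_path("abc", &dict).unwrap();
    println!("{tokens:?} cost={cost}"); // ["ab", "c"] cost=15
}
```

The real segmenter builds the lattice per sentence and scores transitions between adjacent tokens as well, but the dynamic program over token boundaries is the same shape.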

pub fn segment_with_lattice<'a>(&'a self, text: Cow<'a, str>, lattice: &mut Lattice) -> LinderaResult<Vec<Token<'a>>>

Segments the input text into tokens based on the dictionary and user-defined rules.

§Arguments
  • text - A Cow<'a, str> representing the input text. This can either be borrowed or owned, allowing for efficient text handling depending on the use case.
  • lattice - A mutable reference to a Lattice structure. This allows reusing the lattice across multiple calls to avoid memory allocation.
§Returns

Returns a LinderaResult<Vec<Token<'a>>> which contains a vector of tokens segmented from the input text. Each token represents a portion of the original text, along with metadata such as byte offsets and dictionary information.

§Process
  1. Sentence Splitting:

    • The input text is split into sentences using Japanese punctuation (。, 、), as well as \n and \t. Each sentence is processed individually.
  2. Lattice Processing:

    • For each sentence, a lattice structure is set up using the main dictionary and, if available, the user dictionary. The lattice helps identify possible token boundaries within the sentence.
    • The cost matrix is used to calculate the best path (i.e., the optimal sequence of tokens) through the lattice based on the mode.
  3. Token Generation:

    • For each segment (determined by the lattice), a token is generated using the byte offsets. The tokens contain the original text (in Cow::Owned form to ensure safe return), byte start/end positions, token positions, and dictionary references.
§Notes
  • The function ensures that each token is safely returned by converting substrings into Cow::Owned strings.
  • Byte offsets are carefully calculated to ensure that token boundaries are correct even across multiple sentences.
§Example Flow
  • Text is split into sentences based on punctuation.
  • A lattice is created and processed for each sentence.
  • Tokens are extracted from the lattice and returned in a vector.
§Errors
  • If the lattice fails to be processed or if there is an issue with the segmentation process, the function returns an error.
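The lattice parameter exists so that a caller segmenting many texts can reuse one allocation instead of building a fresh lattice per call. The sketch below shows the general buffer-reuse pattern with a hypothetical Scratch type standing in for Lattice (not lindera's actual type):

```rust
/// Illustration of the reuse pattern behind `segment_with_lattice`:
/// the caller owns a scratch structure and clears it between calls,
/// so repeated processing does not reallocate.
#[derive(Default)]
struct Scratch {
    nodes: Vec<usize>,
}

fn process_with(text: &str, scratch: &mut Scratch) -> usize {
    scratch.nodes.clear(); // reuse the existing allocation
    scratch.nodes.extend(text.char_indices().map(|(i, _)| i));
    scratch.nodes.len()
}

fn main() {
    let mut scratch = Scratch::default();
    for text in ["東京", "大阪市"] {
        let n = process_with(text, &mut scratch);
        println!("{text}: {n} chars");
    }
}
```

With `segment_with_lattice`, the analogous pattern is to construct one Lattice, then pass `&mut lattice` on every call in a hot loop.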

pub fn segment_nbest<'a>(&'a self, text: Cow<'a, str>, n: usize, unique: bool, cost_threshold: Option<i64>) -> LinderaResult<Vec<(Vec<Token<'a>>, i64)>>

Segments the input text and returns the top-N segmentation results.

Each result is a Vec<Token> representing one possible segmentation. Results are ordered by cost (best first). If unique is true, results with the same word boundaries but different POS tags are deduplicated (only the lowest-cost variant is kept).


pub fn segment_nbest_with_lattice<'a>(&'a self, text: Cow<'a, str>, lattice: &mut Lattice, n: usize, unique: bool, cost_threshold: Option<i64>) -> LinderaResult<Vec<(Vec<Token<'a>>, i64)>>

Segments the input text and returns the top-N segmentation results with costs. Each result is a (tokens, cost) pair. If unique is true, results with the same word boundaries but different POS tags are deduplicated (only the lowest-cost variant is kept). If cost_threshold is Some(t), paths whose cost exceeds best_cost + t are discarded.
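The unique and cost_threshold filters can be pictured as a post-processing pass over cost-sorted candidates. A self-contained sketch of that logic, with byte spans standing in for real Token values:

```rust
use std::collections::HashSet;

/// Sketch of the filtering described for `segment_nbest`:
/// given candidate segmentations and their costs, sort best-first,
/// drop paths costlier than `best_cost + threshold`, and (if `unique`)
/// keep only the lowest-cost result per distinct set of word boundaries.
fn filter_nbest(
    mut results: Vec<(Vec<(usize, usize)>, i64)>, // (byte spans, cost)
    unique: bool,
    cost_threshold: Option<i64>,
) -> Vec<(Vec<(usize, usize)>, i64)> {
    results.sort_by_key(|(_, cost)| *cost);
    let best = results.first().map(|(_, c)| *c);
    let mut seen = HashSet::new();
    results
        .into_iter()
        .filter(|(spans, cost)| {
            if let (Some(b), Some(t)) = (best, cost_threshold) {
                if *cost > b + t {
                    return false; // over best_cost + threshold: discard
                }
            }
            // With `unique`, only the first (lowest-cost) result for each
            // distinct boundary set survives.
            !unique || seen.insert(spans.clone())
        })
        .collect()
}

fn main() {
    let candidates = vec![
        (vec![(0, 3), (3, 6)], 100),
        (vec![(0, 3), (3, 6)], 120), // same boundaries, higher cost: dropped
        (vec![(0, 6)], 150),
        (vec![(0, 2), (2, 6)], 400), // exceeds best + 200: dropped
    ];
    let kept = filter_nbest(candidates, true, Some(200));
    println!("{} results kept", kept.len()); // 2
}
```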

Trait Implementations§

impl Clone for Segmenter

fn clone(&self) -> Segmenter

Returns a duplicate of the value.

fn clone_from(&mut self, source: &Self)

Performs copy-assignment from source.

Auto Trait Implementations§

Blanket Implementations§

impl<T> Any for T
where T: 'static + ?Sized

fn type_id(&self) -> TypeId

Gets the TypeId of self.

impl<T> ArchivePointee for T

type ArchivedMetadata = ()

The archived version of the pointer metadata for this type.

fn pointer_metadata(_: &<T as ArchivePointee>::ArchivedMetadata) -> <T as Pointee>::Metadata

Converts some archived metadata to the pointer metadata for itself.

impl<T> Borrow<T> for T
where T: ?Sized

fn borrow(&self) -> &T

Immutably borrows from an owned value.

impl<T> BorrowMut<T> for T
where T: ?Sized

fn borrow_mut(&mut self) -> &mut T

Mutably borrows from an owned value.

impl<T> CloneToUninit for T
where T: Clone

unsafe fn clone_to_uninit(&self, dest: *mut u8)

Performs copy-assignment from self to dest. (Nightly-only experimental API: clone_to_uninit.)

impl<T> From<T> for T

fn from(t: T) -> T

Returns the argument unchanged.

impl<T, U> Into<U> for T
where U: From<T>

fn into(self) -> U

Calls U::from(self). That is, this conversion is whatever the implementation of From<T> for U chooses to do.

impl<T> LayoutRaw for T

fn layout_raw(_: <T as Pointee>::Metadata) -> Result<Layout, LayoutError>

Returns the layout of the type.

impl<T, N1, N2> Niching<NichedOption<T, N1>> for N2
where T: SharedNiching<N1, N2>, N1: Niching<T>, N2: Niching<T>

unsafe fn is_niched(niched: *const NichedOption<T, N1>) -> bool

Returns whether the given value has been niched.

fn resolve_niched(out: Place<NichedOption<T, N1>>)

Writes data to out indicating that a T is niched.

impl<T> Pointee for T

type Metadata = ()

The metadata type for pointers and references to this type.

impl<T> ToOwned for T
where T: Clone

type Owned = T

The resulting type after obtaining ownership.

fn to_owned(&self) -> T

Creates owned data from borrowed data, usually by cloning.

fn clone_into(&self, target: &mut T)

Uses borrowed data to replace owned data, usually by cloning.

impl<T, U> TryFrom<U> for T
where U: Into<T>

type Error = Infallible

The type returned in the event of a conversion error.

fn try_from(value: U) -> Result<T, <T as TryFrom<U>>::Error>

Performs the conversion.

impl<T, U> TryInto<U> for T
where U: TryFrom<T>

type Error = <U as TryFrom<T>>::Error

The type returned in the event of a conversion error.

fn try_into(self) -> Result<U, <U as TryFrom<T>>::Error>

Performs the conversion.