Skip to main content

JsTokenizerBuilder

Struct JsTokenizerBuilder 

Source
pub struct JsTokenizerBuilder { /* private fields */ }
Expand description

Builder for creating a Tokenizer with custom configuration.

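The builder collects tokenizer parameters (dictionary, user dictionary, mode, whitespace handling, and the character/token filter pipelines) through individual setter calls, and then produces a tokenizer via build. The setters modify the builder in place and return either nothing or a Result<()>, so they are called one statement at a time rather than chained.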

Implementations§

Source§

impl JsTokenizerBuilder

Source

pub fn new() -> Result<Self>

Creates a new TokenizerBuilder with default configuration.

Source

pub fn from_file(&self, file_path: String) -> Result<JsTokenizerBuilder>

Loads configuration from a JSON file.

§Arguments
  • file_path - Path to the configuration file.
§Returns

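A new TokenizerBuilder with the loaded configuration. The method takes &self and returns a separate builder, so continue with the returned value rather than the builder the method was called on.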

Source

pub fn set_mode(&mut self, mode: String) -> Result<()>

Sets the tokenization mode.

§Arguments
  • mode - Mode string (“normal” or “decompose”).
Source

pub fn set_dictionary(&mut self, path: String)

Sets the dictionary path or URI.

§Arguments
  • path - Path to the dictionary directory or embedded URI (e.g. “embedded://ipadic”).
Source

pub fn set_user_dictionary(&mut self, uri: String)

Sets the user dictionary URI.

§Arguments
  • uri - URI to the user dictionary.
Source

pub fn set_keep_whitespace(&mut self, keep_whitespace: bool)

Sets whether to keep whitespace in tokenization results.

§Arguments
  • keep_whitespace - If true, whitespace tokens will be included in results.
Source

pub fn append_character_filter( &mut self, kind: String, args: Option<Value>, ) -> Result<()>

Appends a character filter to the preprocessing pipeline.

§Arguments
  • kind - Type of character filter to add (e.g. “unicode_normalize”, “mapping”).
  • args - Optional filter arguments as a JSON-compatible object.
Source

pub fn append_token_filter( &mut self, kind: String, args: Option<Value>, ) -> Result<()>

Appends a token filter to the postprocessing pipeline.

§Arguments
  • kind - Type of token filter to add (e.g. “lowercase”, “japanese_stop_tags”).
  • args - Optional filter arguments as a JSON-compatible object.
Source

pub fn build(&self) -> Result<JsTokenizer>

Builds the tokenizer with the configured settings.

§Returns

A configured Tokenizer instance ready for use.

Trait Implementations§

Source§

impl FromNapiMutRef for JsTokenizerBuilder

Source§

unsafe fn from_napi_mut_ref( env: napi_env, napi_val: napi_value, ) -> Result<&'static mut Self>

Safety Read more
Source§

impl FromNapiRef for JsTokenizerBuilder

Source§

unsafe fn from_napi_ref( env: napi_env, napi_val: napi_value, ) -> Result<&'static Self>

Safety Read more
Source§

impl JavaScriptClassExt for JsTokenizerBuilder

Source§

fn into_instance<'scope>( self, env: &'scope Env, ) -> Result<ClassInstance<'scope, Self>>

Source§

fn into_reference(self, env: Env) -> Result<Reference<Self>>

Source§

fn instance_of<'env, V: JsValue<'env>>(env: &Env, value: &V) -> Result<bool>

Source§

impl ObjectFinalize for JsTokenizerBuilder

Source§

fn finalize(self, env: Env) -> Result<(), Error>

Source§

impl ToNapiValue for JsTokenizerBuilder

Source§

impl TypeName for &JsTokenizerBuilder

Source§

impl TypeName for &mut JsTokenizerBuilder

Source§

impl TypeName for JsTokenizerBuilder

Source§

impl ValidateNapiValue for &JsTokenizerBuilder

Source§

unsafe fn validate(env: napi_env, napi_val: napi_value) -> Result<napi_value>

Safety Read more
Source§

impl ValidateNapiValue for &mut JsTokenizerBuilder

Source§

unsafe fn validate(env: napi_env, napi_val: napi_value) -> Result<napi_value>

Safety Read more

Auto Trait Implementations§

Blanket Implementations§

Source§

impl<T> Any for T
where T: 'static + ?Sized,

Source§

fn type_id(&self) -> TypeId

Gets the TypeId of self. Read more
Source§

impl<T> ArchivePointee for T

Source§

type ArchivedMetadata = ()

The archived version of the pointer metadata for this type.
Source§

fn pointer_metadata( _: &<T as ArchivePointee>::ArchivedMetadata, ) -> <T as Pointee>::Metadata

Converts some archived metadata to the pointer metadata for itself.
Source§

impl<T> Borrow<T> for T
where T: ?Sized,

Source§

fn borrow(&self) -> &T

Immutably borrows from an owned value. Read more
Source§

impl<T> BorrowMut<T> for T
where T: ?Sized,

Source§

fn borrow_mut(&mut self) -> &mut T

Mutably borrows from an owned value. Read more
Source§

impl<T> From<T> for T

Source§

fn from(t: T) -> T

Returns the argument unchanged.

Source§

impl<T, U> Into<U> for T
where U: From<T>,

Source§

fn into(self) -> U

Calls U::from(self).

That is, this conversion is whatever the implementation of From<T> for U chooses to do.

Source§

impl<T> JsValuesTupleIntoVec for T
where T: ToNapiValue,

Source§

impl<T> LayoutRaw for T

Source§

fn layout_raw(_: <T as Pointee>::Metadata) -> Result<Layout, LayoutError>

Returns the layout of the type.
Source§

impl<T, N1, N2> Niching<NichedOption<T, N1>> for N2
where T: SharedNiching<N1, N2>, N1: Niching<T>, N2: Niching<T>,

Source§

unsafe fn is_niched(niched: *const NichedOption<T, N1>) -> bool

Returns whether the given value has been niched. Read more
Source§

fn resolve_niched(out: Place<NichedOption<T, N1>>)

Writes data to out indicating that a T is niched.
Source§

impl<T> Pointee for T

Source§

type Metadata = ()

The metadata type for pointers and references to this type.
Source§

impl<T, U> TryFrom<U> for T
where U: Into<T>,

Source§

type Error = Infallible

The type returned in the event of a conversion error.
Source§

fn try_from(value: U) -> Result<T, <T as TryFrom<U>>::Error>

Performs the conversion.
Source§

impl<T, U> TryInto<U> for T
where U: TryFrom<T>,

Source§

type Error = <U as TryFrom<T>>::Error

The type returned in the event of a conversion error.
Source§

fn try_into(self) -> Result<U, <U as TryFrom<T>>::Error>

Performs the conversion.
Source§

impl<V, T> VZip<V> for T
where V: MultiLane<T>,

Source§

fn vzip(self) -> V

Source§

impl<T> SendAlias for T

Source§

impl<T> SendSyncUnwindSafe for T
where T: Send + Sync + UnwindSafe + ?Sized,

Source§

impl<T> SyncAlias for T