pub struct HuggingFaceTokenizer { /* private fields */ }
A wrapper around a HuggingFace tokenizer.
Implementations§
Source§impl HuggingFaceTokenizer
impl HuggingFaceTokenizer
pub fn from_file(file_path: &str) -> Result<Self>
Creates a tokenizer from a HuggingFace tokenizer JSON file.
pub fn from_file_with_chat_template(
    file_path: &str,
    chat_template_path: Option<&str>,
) -> Result<Self>
Creates a tokenizer from a HuggingFace tokenizer JSON file, with an optional chat template.
pub fn from_tokenizer(tokenizer: HfTokenizer) -> Self
Creates a wrapper from an existing HuggingFace tokenizer.
pub fn set_chat_template(&mut self, template: String)
Sets or overrides the chat template.
pub fn chat_template_content_format(&self) -> ChatTemplateContentFormat
Returns the content format expected by the chat template.
pub fn apply_chat_template(
    &self,
    messages: &[Value],
    params: ChatTemplateParams<'_>,
) -> Result<String>
Applies the chat template, if one is available.
Takes JSON Values that have already been transformed based on the content format.
Trait Implementations§
Source§impl Decoder for HuggingFaceTokenizer
impl Decoder for HuggingFaceTokenizer
Source§impl Encoder for HuggingFaceTokenizer
impl Encoder for HuggingFaceTokenizer
Source§impl Tokenizer for HuggingFaceTokenizer
impl Tokenizer for HuggingFaceTokenizer
fn vocab_size(&self) -> usize
fn get_special_tokens(&self) -> &SpecialTokens
fn token_to_id(&self, token: &str) -> Option<TokenIdType>
fn id_to_token(&self, id: TokenIdType) -> Option<String>
Auto Trait Implementations§
impl !Freeze for HuggingFaceTokenizer
impl RefUnwindSafe for HuggingFaceTokenizer
impl Send for HuggingFaceTokenizer
impl Sync for HuggingFaceTokenizer
impl Unpin for HuggingFaceTokenizer
impl UnwindSafe for HuggingFaceTokenizer
Blanket Implementations§
impl<T> BorrowMut<T> for T
where
    T: ?Sized,
fn borrow_mut(&mut self) -> &mut T
Mutably borrows from an owned value. Read more
Source§impl<T> Instrument for T
impl<T> Instrument for T
Source§fn instrument(self, span: Span) -> Instrumented<Self>
fn instrument(self, span: Span) -> Instrumented<Self>
Source§fn in_current_span(self) -> Instrumented<Self>
fn in_current_span(self) -> Instrumented<Self>
impl<T> IntoEither for T
fn into_either(self, into_left: bool) -> Either<Self, Self>
Converts self into a Left variant of Either<Self, Self> if into_left is true. Converts self into a Right variant of Either<Self, Self> otherwise. Read more
fn into_either_with<F>(self, into_left: F) -> Either<Self, Self>
Converts self into a Left variant of Either<Self, Self> if into_left(&self) returns true. Converts self into a Right variant of Either<Self, Self> otherwise. Read more