pub struct TokenCounter { /* private fields */ }
Token counter using the GPT-4 tokenizer for accurate token counting.
Provides methods for counting tokens in text and truncating content to fit within specified token limits while maintaining text coherence.
§Examples
use ai_context_gen::token_counter::TokenCounter;
let counter = TokenCounter::new().unwrap();
let text = "Hello, world!";
let token_count = counter.count_tokens(text);
println!("Text has {} tokens", token_count);

§Implementations
impl TokenCounter

pub fn new() -> Result<Self>
Creates a new token counter using the GPT-4 tokenizer.
§Returns
A new TokenCounter instance configured with the GPT-4 BPE tokenizer.
§Errors
Returns an error if the GPT-4 tokenizer model cannot be loaded.
§Examples
use ai_context_gen::token_counter::TokenCounter;
let counter = TokenCounter::new().unwrap();

pub fn count_tokens(&self, text: &str) -> usize
Counts the number of tokens in the given text.
Uses the GPT-4 tokenizer to provide accurate token counts that match what would be used by OpenAI’s models and similar systems.
§Arguments
text - The text to count tokens for
§Returns
The number of tokens in the text.
§Examples
use ai_context_gen::token_counter::TokenCounter;
let counter = TokenCounter::new().unwrap();
let count = counter.count_tokens("Hello, world!");
assert!(count > 0);

pub fn truncate_to_token_limit(&self, text: &str, max_tokens: usize) -> String
Truncates text to fit within a specified token limit.
Attempts to preserve text coherence by truncating at token boundaries rather than character boundaries. Falls back to character truncation if token decoding fails.
§Arguments
text - The text to truncate
max_tokens - Maximum number of tokens to include
§Returns
The truncated text that fits within the token limit.
§Examples
use ai_context_gen::token_counter::TokenCounter;
let counter = TokenCounter::new().unwrap();
let long_text = "This is a very long text that exceeds the token limit...";
let truncated = counter.truncate_to_token_limit(long_text, 10);
assert!(counter.count_tokens(&truncated) <= 10);