Struct HeuristicTokenCounter

Source

pub struct HeuristicTokenCounter { /* private fields */ }

Expand description

A provider-agnostic TokenCounter that approximates token counts from UTF-8 byte lengths.

This is intended as a zero-dependency default. It is not a substitute for a tokenizer and will under- or over-count by up to ~30% on real content, but it is monotonic in message size and stable across runs, which is enough for TokenWindowMemory to enforce a budget that trends with provider billing.

§Strategy

For every text-bearing block (Text, reasoning text, tool-result text) the counter sums UTF-8 byte lengths (str::len, an O(1) call) and divides by bytes_per_token, rounded up. Bytes are used instead of Unicode scalar values because the cost is O(1), modern BPE tokenizers operate on byte sequences, and per-message budgeting only needs the rough order of magnitude. For ASCII text, bytes and characters coincide; for non-ASCII text, the counter slightly overestimates, which is the safe direction for a hard budget.

Tool calls are charged the JSON-serialised length of their ToolFunction payload. Each message is charged a flat per_message_overhead to model the per-turn role/separator tokens that providers add internally. Non-text blocks (images, audio, video, documents) are charged per_attachment_tokens each because their real cost is provider-specific and rarely text-derived.

§Presets

The defaults match OpenAI’s published rule of thumb (~4 bytes per token, ~4 tokens of per-message overhead). HeuristicTokenCounter::anthropic uses a slightly denser ratio that better fits Claude’s tokenizer.

§Example

use rig_memory::{HeuristicTokenCounter, TokenWindowMemory};

let policy = TokenWindowMemory::new(2_000, HeuristicTokenCounter::default());

Struct HeuristicTokenCounter Copy item path

§Strategy

§Presets

§Example

Implementations§

impl HeuristicTokenCounter

pub fn new( bytes_per_token: f32, per_message_overhead: usize, per_attachment_tokens: usize, ) -> Self

pub fn openai() -> Self

pub fn anthropic() -> Self

pub fn gemini() -> Self

Trait Implementations§

impl Clone for HeuristicTokenCounter

fn clone(&self) -> HeuristicTokenCounter

fn clone_from(&mut self, source: &Self)

impl Debug for HeuristicTokenCounter

fn fmt(&self, f: &mut Formatter<'_>) -> Result

impl Default for HeuristicTokenCounter

fn default() -> Self

impl TokenCounter for HeuristicTokenCounter

fn count(&self, message: &Message) -> usize

impl Copy for HeuristicTokenCounter

Auto Trait Implementations§

impl Freeze for HeuristicTokenCounter

impl RefUnwindSafe for HeuristicTokenCounter

impl Send for HeuristicTokenCounter

impl Sync for HeuristicTokenCounter

impl Unpin for HeuristicTokenCounter

impl UnsafeUnpin for HeuristicTokenCounter

impl UnwindSafe for HeuristicTokenCounter

Blanket Implementations§

impl<T> Any for T where T: 'static + ?Sized,

fn type_id(&self) -> TypeId

impl<T> Borrow<T> for T where T: ?Sized,

fn borrow(&self) -> &T

impl<T> BorrowMut<T> for T where T: ?Sized,

fn borrow_mut(&mut self) -> &mut T

impl<T> CloneToUninit for T where T: Clone,

unsafe fn clone_to_uninit(&self, dest: *mut u8)

impl<T> DynClone for T where T: Clone,

fn __clone_box(&self, _: Private) -> *mut ()

impl<T> From<T> for T

fn from(t: T) -> T

impl<T> Instrument for T

fn instrument(self, span: Span) -> Instrumented<Self>

fn in_current_span(self) -> Instrumented<Self>

impl<T> Instrument for T

fn instrument(self, span: Span) -> Instrumented<Self>

fn in_current_span(self) -> Instrumented<Self>

impl<T, U> Into<U> for T where U: From<T>,

fn into(self) -> U

impl<T> PolicyExt for T where T: ?Sized,

fn and<P, B, E>(self, other: P) -> And<T, P> where T: Policy<B, E>, P: Policy<B, E>,

fn or<P, B, E>(self, other: P) -> Or<T, P> where T: Policy<B, E>, P: Policy<B, E>,

impl<T> ToOwned for T where T: Clone,

type Owned = T

fn to_owned(&self) -> T

fn clone_into(&self, target: &mut T)

impl<T, U> TryFrom<U> for T where U: Into<T>,

type Error = Infallible

fn try_from(value: U) -> Result<T, <T as TryFrom<U>>::Error>

impl<T, U> TryInto<U> for T where U: TryFrom<T>,

type Error = <U as TryFrom<T>>::Error

fn try_into(self) -> Result<U, <U as TryFrom<T>>::Error>

impl<V, T> VZip<V> for T where V: MultiLane<T>,

fn vzip(self) -> V

impl<T> WithSubscriber for T

fn with_subscriber<S>(self, subscriber: S) -> WithDispatch<Self> where S: Into<Dispatch>,

fn with_current_subscriber(self) -> WithDispatch<Self>

impl<T> WithSubscriber for T

fn with_subscriber<S>(self, subscriber: S) -> WithDispatch<Self> where S: Into<Dispatch>,

fn with_current_subscriber(self) -> WithDispatch<Self>

impl<ST, DT> CastableFrom<ST, Initialized, Initialized> for DT where ST: ?Sized, DT: ?Sized,

impl<ST, DT> CastableFrom<ST, Uninit, Uninit> for DT where ST: ?Sized, DT: ?Sized,

impl<T> Read<Exclusive, BecauseExclusive> for T where T: ?Sized,

impl<T> WasmCompatSend for T where T: Send,

impl<T> WasmCompatSync for T where T: Sync,

Struct HeuristicTokenCounter

impl<T> Any for T
where T: 'static + ?Sized,

impl<T> Borrow<T> for T
where T: ?Sized,

impl<T> BorrowMut<T> for T
where T: ?Sized,

impl<T> CloneToUninit for T
where T: Clone,

impl<T> DynClone for T
where T: Clone,

impl<T, U> Into<U> for T
where U: From<T>,

impl<T> PolicyExt for T
where T: ?Sized,

fn and<P, B, E>(self, other: P) -> And<T, P>
where T: Policy<B, E>, P: Policy<B, E>,

fn or<P, B, E>(self, other: P) -> Or<T, P>
where T: Policy<B, E>, P: Policy<B, E>,

impl<T> ToOwned for T
where T: Clone,

impl<T, U> TryFrom<U> for T
where U: Into<T>,

impl<T, U> TryInto<U> for T
where U: TryFrom<T>,

impl<V, T> VZip<V> for T
where V: MultiLane<T>,

fn with_subscriber<S>(self, subscriber: S) -> WithDispatch<Self>
where S: Into<Dispatch>,

fn with_subscriber<S>(self, subscriber: S) -> WithDispatch<Self>
where S: Into<Dispatch>,

impl<ST, DT> CastableFrom<ST, Initialized, Initialized> for DT
where ST: ?Sized, DT: ?Sized,

impl<ST, DT> CastableFrom<ST, Uninit, Uninit> for DT
where ST: ?Sized, DT: ?Sized,

impl<T> Read<Exclusive, BecauseExclusive> for T
where T: ?Sized,

impl<T> WasmCompatSend for T
where T: Send,

impl<T> WasmCompatSync for T
where T: Sync,