Struct TokenBudget

Source

pub struct TokenBudget {
    pub max_context_tokens: u32,
    pub max_output_tokens: u32,
    pub strategy: BudgetStrategy,
    pub safety_margin: u32,
    pub compression_trigger_percent: u8,
    pub compression_target_percent: u8,
    pub working_reserve_tokens: u32,
    pub fallback_trigger_percent: u8,
    pub prompt_cache_min_tool_output_chars: u32,
    pub prompt_cache_head_chars: u32,
    pub prompt_cache_tail_chars: u32,
    pub prompt_cache_recent_user_turns: u8,
    pub prompt_cache_recent_tool_chains: u8,
    pub max_tool_output_tokens: u32,
}

Expand description

Token budget configuration for a conversation.

Fields§

§max_context_tokens: u32

Maximum context window size for the model (input + output)

§max_output_tokens: u32

Maximum tokens reserved for model output

§strategy: BudgetStrategy

Budget enforcement strategy

§safety_margin: u32

Safety margin for tokenizer estimation errors

§compression_trigger_percent: u8

Proactive compression trigger threshold as a percentage of context window tokens.

Legacy field — only used when working_reserve_tokens == 0.

§compression_target_percent: u8

Compression target threshold as a percentage of context window tokens.

§working_reserve_tokens: u32

Fixed number of input tokens kept free before the request hard limit.

Compression triggers once context usage exceeds (max_context_tokens - working_reserve_tokens), and in any case no later than the request input limit that remains after reserving max_output_tokens and safety_margin. This provides consistent working space regardless of the model's context window size (Claude Code uses ~50K).

When working_reserve_tokens == 0, falls back to percentage-based triggering via compression_trigger_percent for backward compatibility.

§fallback_trigger_percent: u8

Fallback percentage trigger when the context window is too small for the fixed reserve (i.e. max_context_tokens < working_reserve_tokens * 2).

§prompt_cache_min_tool_output_chars: u32

Minimum tool output character length required before prompt-side cache compaction.

§prompt_cache_head_chars: u32

Leading excerpt length (chars) kept in cached tool output summaries.

§prompt_cache_tail_chars: u32

Trailing excerpt length (chars) kept in cached tool output summaries.

§prompt_cache_recent_user_turns: u8

Number of latest user turns protected from prompt-side cache compaction.

§prompt_cache_recent_tool_chains: u8

Number of latest tool call chains protected from prompt-side cache compaction.

§max_tool_output_tokens: u32

Maximum tokens allowed per single tool output. 0 = use byte-based fallback only.

Struct TokenBudget Copy item path

Fields§

Implementations§

impl TokenBudget

pub fn new( max_context_tokens: u32, max_output_tokens: u32, strategy: BudgetStrategy, ) -> TokenBudget

pub fn with_safety_margin( max_context_tokens: u32, max_output_tokens: u32, strategy: BudgetStrategy, safety_margin: u32, ) -> TokenBudget

pub fn max_request_input_tokens(&self) -> u32

pub fn compression_trigger_context_tokens(&self) -> u32

pub fn compression_target_context_tokens(&self) -> u32

pub fn for_model(max_context_tokens: u32) -> TokenBudget

Trait Implementations§

impl Clone for TokenBudget

fn clone(&self) -> TokenBudget

fn clone_from(&mut self, source: &Self)

impl Debug for TokenBudget

fn fmt(&self, f: &mut Formatter<'_>) -> Result<(), Error>

impl Default for TokenBudget

fn default() -> TokenBudget

impl<'de> Deserialize<'de> for TokenBudget

fn deserialize<__D>( __deserializer: __D, ) -> Result<TokenBudget, <__D as Deserializer<'de>>::Error> where __D: Deserializer<'de>,

impl Serialize for TokenBudget

fn serialize<__S>( &self, __serializer: __S, ) -> Result<<__S as Serializer>::Ok, <__S as Serializer>::Error> where __S: Serializer,

Auto Trait Implementations§

impl Freeze for TokenBudget

impl RefUnwindSafe for TokenBudget

impl Send for TokenBudget

impl Sync for TokenBudget

impl Unpin for TokenBudget

impl UnsafeUnpin for TokenBudget

impl UnwindSafe for TokenBudget

Blanket Implementations§

impl<T> Any for T where T: 'static + ?Sized,

fn type_id(&self) -> TypeId

impl<T> Borrow<T> for T where T: ?Sized,

fn borrow(&self) -> &T

impl<T> BorrowMut<T> for T where T: ?Sized,

fn borrow_mut(&mut self) -> &mut T

impl<T> CloneToUninit for T where T: Clone,

unsafe fn clone_to_uninit(&self, dest: *mut u8)

impl<T> DeserializeOwned for T where T: for<'de> Deserialize<'de>,

impl<T> From<T> for T

fn from(t: T) -> T

impl<T> Instrument for T

fn instrument(self, span: Span) -> Instrumented<Self>

fn in_current_span(self) -> Instrumented<Self>

impl<T, U> Into<U> for T where U: From<T>,

fn into(self) -> U

impl<T> Same for T

type Output = T

impl<T> ToOwned for T where T: Clone,

type Owned = T

fn to_owned(&self) -> T

fn clone_into(&self, target: &mut T)

impl<T, U> TryFrom<U> for T where U: Into<T>,

type Error = Infallible

fn try_from(value: U) -> Result<T, <T as TryFrom<U>>::Error>

impl<T, U> TryInto<U> for T where U: TryFrom<T>,

type Error = <U as TryFrom<T>>::Error

fn try_into(self) -> Result<U, <U as TryFrom<T>>::Error>

impl<T> WithSubscriber for T

fn with_subscriber<S>(self, subscriber: S) -> WithDispatch<Self> where S: Into<Dispatch>,

fn with_current_subscriber(self) -> WithDispatch<Self>

Struct TokenBudget

fn deserialize<D>( deserializer: D, ) -> Result<TokenBudget, <D as Deserializer<'de>>::Error>
where D: Deserializer<'de>,

fn serialize<S>( &self, serializer: S, ) -> Result<<S as Serializer>::Ok, <S as Serializer>::Error>
where S: Serializer,

impl<T> Any for T
where T: 'static + ?Sized,

impl<T> Borrow<T> for T
where T: ?Sized,

impl<T> BorrowMut<T> for T
where T: ?Sized,

impl<T> CloneToUninit for T
where T: Clone,

impl<T> DeserializeOwned for T
where T: for<'de> Deserialize<'de>,

impl<T, U> Into<U> for T
where U: From<T>,

impl<T> ToOwned for T
where T: Clone,

impl<T, U> TryFrom<U> for T
where U: Into<T>,

impl<T, U> TryInto<U> for T
where U: TryFrom<T>,

fn with_subscriber<S>(self, subscriber: S) -> WithDispatch<Self>
where S: Into<Dispatch>,