pub struct TokenInterceptor {
pub provider: Provider,
pub transform: Transform,
pub model: String,
pub token_count: usize,
pub transformed_count: usize,
pub visual_mode: bool,
pub heatmap_mode: bool,
pub orchestrator: bool,
pub orchestrator_url: String,
pub web_tx: Option<UnboundedSender<TokenEvent>>,
pub web_provider_label: Option<String>,
pub system_prompt: Option<String>,
pub rate: f64,
pub top_logprobs: u8,
pub recorder: Option<Recorder>,
pub json_stream: bool,
pub min_confidence: Option<f64>,
pub max_retries: u32,
pub anthropic_max_tokens: u32,
pub timeout_secs: Option<u64>,
/* private fields */
}
The core streaming engine that sits between the caller and the LLM.
TokenInterceptor manages the HTTP connection to the configured provider,
iterates the server-sent-event (SSE) stream, applies the active Transform
to every N-th token (controlled by rate), attaches per-token confidence and
perplexity from API logprobs, and routes enriched TokenEvents to one of
three output sinks:
- Terminal — ANSI-colored text written to stdout.
- Web UI — events sent over the web_tx unbounded channel for SSE fan-out.
- JSON stream — one JSON line per token written to stdout (json_stream = true).
Construct with TokenInterceptor::new then call TokenInterceptor::intercept_stream.
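A typical construction might look like the following sketch. This is illustrative only: it assumes the crate's types are in scope, a Tokio runtime is running, and Provider::OpenAI / Transform::Noise are assumed variant names — check the Provider and Transform enums for the actual ones.

```rust
// Hypothetical usage sketch; variant names are assumptions.
let mut interceptor = TokenInterceptor::new(
    Provider::OpenAI,
    Transform::Noise,
    "gpt-4o-mini".to_string(),
    false, // visual_mode
    false, // heatmap_mode
    false, // orchestrator
)?
.with_rate(0.25)
.with_seed(42)
.with_max_retries(3);

interceptor.intercept_stream("Hello, world").await?;
```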
Fields
provider: Provider
transform: Transform
model: String
token_count: usize
transformed_count: usize
visual_mode: bool
heatmap_mode: bool
orchestrator: bool
orchestrator_url: String
web_tx: Option<UnboundedSender<TokenEvent>> — When set, token events are sent here instead of printed to stdout.
web_provider_label: Option<String> — When set, each emitted TokenEvent carries this provider label (for diff mode).
system_prompt: Option<String> — Optional system prompt prepended to the conversation.
rate: f64 — Fraction of tokens to transform (0.0–1.0). Bresenham-spread so the distribution is deterministic and uniform rather than probabilistic.
top_logprobs: u8 — Number of top alternative tokens to request per position (OpenAI only, 0–20).
recorder: Option<Recorder> — Optional replay recorder that records each emitted TokenEvent.
json_stream: bool — When true, print one JSON line per token instead of colored text.
min_confidence: Option<f64> — Minimum confidence threshold for transform gating. When set, only tokens with confidence at or below this value are transformed.
max_retries: u32 — Maximum retry attempts for API calls on 429/5xx (configurable via --max-retries).
anthropic_max_tokens: u32 — Maximum tokens in the Anthropic response (configurable via --anthropic-max-tokens).
timeout_secs: Option<u64> — Optional stream timeout in seconds. When set, intercept_stream will fail with a timeout error if the entire stream does not complete within this duration.
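The deterministic Bresenham-style spread described for rate can be sketched with a simple error accumulator: each token adds rate to a running total, and a token is transformed whenever the total crosses 1.0. This is a minimal illustration of the technique named above, not the crate's actual implementation, which may differ in detail.

```rust
/// Decide, for each of `n_tokens` positions, whether to transform it,
/// spreading selections evenly (Bresenham-style) at the given rate.
fn select_indices(n_tokens: usize, rate: f64) -> Vec<bool> {
    let mut acc = 0.0;
    let mut out = Vec::with_capacity(n_tokens);
    for _ in 0..n_tokens {
        acc += rate;
        if acc >= 1.0 {
            acc -= 1.0; // keep the fractional error, like Bresenham's line algorithm
            out.push(true);
        } else {
            out.push(false);
        }
    }
    out
}

fn main() {
    // rate 0.25 over 8 tokens selects exactly 2, evenly spaced, every run.
    let picks = select_indices(8, 0.25);
    assert_eq!(picks.iter().filter(|&&b| b).count(), 2);
    println!("{picks:?}");
}
```

Unlike a probabilistic coin flip per token, this scheme guarantees the same selection pattern for the same rate, which matters for reproducible output.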
Implementations
impl TokenInterceptor
pub fn new(
    provider: Provider,
    transform: Transform,
    model: String,
    visual_mode: bool,
    heatmap_mode: bool,
    orchestrator: bool,
) -> Result<Self, Box<dyn Error>>
Construct a new TokenInterceptor.
Reads the API key from the environment (OPENAI_API_KEY or ANTHROPIC_API_KEY)
and validates its format. The Mock provider does not require a key.
Errors
Returns an error if the required API key environment variable is not set.
pub fn with_rate(self, rate: f64) -> Self
Set the intercept rate (0.0–1.0). Clamped to [0.0, 1.0].
pub fn with_seed(self, seed: u64) -> Self
Seed the internal RNG for reproducible Noise/Chaos output.
pub fn with_web_tx(self, tx: UnboundedSender<TokenEvent>) -> Self
Set the channel used to fan out token events to the web UI.
Calling this completes the builder chain for web-mode construction
so callers do not need to set web_tx as a bare field assignment.
pub fn with_provider_label(self, label: impl Into<String>) -> Self
Set an optional provider label attached to every emitted TokenEvent.
Used in diff mode to tag events with "openai" or "anthropic".
pub fn with_system_prompt(self, prompt: impl Into<String>) -> Self
Prepend a system prompt to the conversation.
pub fn with_top_logprobs(self, n: u8) -> Self
Number of top alternative tokens to request per position (OpenAI only, 0–20).
pub fn with_json_stream(self, enabled: bool) -> Self
Enable JSON-stream mode: emit one JSON line per token instead of ANSI text.
pub fn with_orchestrator_url(self, url: impl Into<String>) -> Self
Override the MCP orchestrator base URL (default: http://localhost:3000).
pub fn with_max_retries(self, n: u32) -> Self
Maximum retry attempts on 429/5xx errors.
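Retry loops for 429/5xx responses typically pair the attempt counter with an exponential backoff delay. The schedule below is a hypothetical sketch (500 ms base, doubling per attempt, capped); the crate's actual delays and any jitter are not documented here.

```rust
use std::time::Duration;

/// Hypothetical backoff schedule: 500 ms doubling per attempt,
/// with the shift capped so the delay cannot overflow.
fn backoff_delay(attempt: u32) -> Duration {
    Duration::from_millis(500u64.saturating_mul(1u64 << attempt.min(10)))
}

fn main() {
    assert_eq!(backoff_delay(0), Duration::from_millis(500));
    assert_eq!(backoff_delay(1), Duration::from_millis(1000));
    assert_eq!(backoff_delay(2), Duration::from_millis(2000));
}
```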
pub fn with_timeout(self, secs: u64) -> Self
Set a stream timeout in seconds. If the entire stream does not complete within
this duration, intercept_stream returns a timeout error.
pub fn with_min_confidence(self, threshold: f64) -> Self
Only transform tokens whose API confidence is at or below this threshold.
pub async fn intercept_stream(
    &mut self,
    prompt: &str,
) -> Result<(), Box<dyn Error>>
Stream the given prompt through the configured provider, applying
the active transform to tokens selected by the configured rate.
In terminal mode the tokens are printed to stdout; in web mode they are
sent over the web_tx channel for SSE fan-out.
Errors
Returns an error if the prompt is empty, exceeds 512 KB, the API key is missing, the HTTP request fails after all retries, or JSON parsing fails.
pub fn process_content(&mut self, content: &str)
Process a content chunk without logprob data.
pub fn process_content_with_logprob(
    &mut self,
    content: &str,
    lp: Option<OpenAILogprobContent>,
)
Process a content chunk with optional logprob data (research mode API).
pub fn process_content_logprob(
    &mut self,
    content: &str,
    log_prob: Option<f32>,
    top_alts: Vec<TokenAlternative>,
)
Process a content chunk, optionally attaching logprob-derived fields to the first non-whitespace token produced.
- log_prob — natural-log probability of the leading API token, if known.
- top_alts — alternative tokens from top_logprobs, already converted to probabilities (exp(logprob)).
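The exp(logprob) conversion mentioned above, and the per-token confidence and perplexity this type attaches, can be sketched as follows. Treating confidence as exp(logprob) matches the conversion stated for top_alts; defining per-token perplexity as exp(-logprob) is the standard definition and an assumption about this crate's formula.

```rust
/// Confidence: probability of the token, recovered from its natural-log probability.
fn confidence(log_prob: f32) -> f32 {
    log_prob.exp()
}

/// Per-token perplexity under the standard definition exp(-logprob)
/// (assumed here; the crate may compute it differently).
fn perplexity(log_prob: f32) -> f32 {
    (-log_prob).exp()
}

fn main() {
    let lp = -0.693147_f32; // ln(0.5): the API was 50% sure of this token
    assert!((confidence(lp) - 0.5).abs() < 1e-4);
    assert!((perplexity(lp) - 2.0).abs() < 1e-3);
}
```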
pub fn print_header(&self, prompt: &str)
Print a formatted session header to stdout.
Displays provider, transform, model, and prompt. When visual_mode or
heatmap_mode is active, additional legend lines are printed.
This method is a no-op when web_tx is set (web mode handles its own header).
Print a summary footer to stdout after a streaming session completes.
Reports total token count and how many tokens were transformed.