// tkach 0.5.0 - Docs.rs

//! Streaming primitives.
//!
//! `complete()` returns a buffered final answer; `stream()` returns the
//! same answer as a sequence of events as the model produces them. The
//! event types are deliberately coarser than the wire format — we
//! aggregate provider-side delta JSON into atomic `ToolUse` events
//! before emitting, so consumers never have to parse partial JSON.
//!
//! The stream item type is `Result<StreamEvent, ProviderError>`. Errors
//! that surface mid-stream (parser failures, mid-body HTTP glitches)
//! arrive as `Err`. Errors that happen before the stream starts
//! (auth, malformed request, connect refused) are returned by the
//! `stream(...)` async fn itself.

use std::pin::Pin;

use futures::stream::Stream;
use serde_json::Value;

use crate::error::ProviderError;
use crate::message::{StopReason, ThinkingMetadata, ThinkingProvider, Usage};
use crate::mode::ModeAuthority;
use crate::prompt_policy::PolicyId;
use crate::steering::TurnId;
use crate::tool::ToolClass;

/// One unit of progress observed while a turn is being streamed.
///
/// Two families of events share this enum:
///
/// * **Provider events** — `ContentDelta`, `ThinkingDelta`,
///   `ThinkingBlock`, `ToolUse`, `MessageDelta`, `Usage` and `Done`.
/// * **Agent-level events** — `TurnStarted`, the mode, guard and policy
///   notifications, and `ToolCallPending`. Each of these is marked as
///   agent-level in its own variant documentation; `ToolCallPending`
///   is explicitly never emitted by providers.
///
/// Notes on the provider events:
///
/// * `ContentDelta` arrives in many small chunks during generation.
/// * `ToolUse` is **atomic** — provider-side `input_json_delta`
///   fragments are accumulated by our parser and emitted only when the
///   block closes, so the consumer never has to handle partial JSON.
/// * `MessageDelta` carries the final `stop_reason`.
/// * `Usage` typically arrives once at the end.
/// * `Done` is the terminal marker.
#[derive(Debug, Clone)]
pub enum StreamEvent {
    /// Agent-level event fired when a new turn starts; `turn_id`
    /// identifies that turn.
    TurnStarted { turn_id: TurnId },

    /// Agent-level event fired when an operator-applied mode changes immediately
    /// or an agent-requested mode is applied at a turn edge.
    ModeChanged {
        /// Mode in effect before the change.
        from: String,
        /// Mode in effect after the change.
        to: String,
        /// Authority under which the change was applied (operator or
        /// agent, per the variant description above).
        authority: ModeAuthority,
    },

    /// Agent-level event fired when an agent-authority mode change is queued.
    ///
    /// The change has not been applied yet at this point; per the
    /// `ModeChanged` documentation, agent-requested changes take effect
    /// at a turn edge.
    ModeChangeRequested {
        /// Mode in effect when the request was made.
        from: String,
        /// Mode the agent asked to switch to.
        to: String,
        /// Presumably the turn during which the request was queued —
        /// confirm against the emitter.
        requested_at: TurnId,
    },

    /// Agent-level event fired when a continuation guard injects a prompt.
    ///
    /// `guard_name` names the guard; `iteration` is presumably a counter
    /// of injections/loop iterations — confirm against the emitter.
    ContinuationInjected { guard_name: String, iteration: u32 },

    /// Agent-level event fired when a continuation guard aborts or panics.
    ///
    /// `reason` is a free-form description of why the guard stopped.
    GuardAborted { guard_name: String, reason: String },

    /// Agent-level event fired when a prompt policy is installed.
    PolicyInstalled { policy_id: PolicyId },

    /// Agent-level event fired when a prompt policy is removed.
    PolicyRemoved { policy_id: PolicyId },

    /// Agent-level event fired when prompt policies are added to a provider request.
    PolicyApplied {
        /// Presumably the turn whose provider request received the
        /// policies — confirm against the emitter.
        turn_id: TurnId,
        /// Identifiers of the policies that were added to the request.
        policy_ids: Vec<PolicyId>,
    },

    /// A piece of assistant text. Concatenate in order to reconstruct
    /// the full reply.
    ContentDelta(String),

    /// A piece of provider-visible thinking/reasoning summary text.
    ///
    /// This is not raw hidden chain-of-thought. Providers should emit
    /// this only for reasoning content the API explicitly returns and
    /// the provider adapter has chosen to expose.
    ThinkingDelta { text: String },

    /// A finalized thinking/reasoning block with provider replay state.
    ///
    /// `ThinkingDelta` is for live UI progress; `ThinkingBlock` is for
    /// preserving a complete block in [`crate::Content`] so callers can
    /// replay sessions without mixing thinking into visible answer text.
    ThinkingBlock {
        /// Complete text of the finalized block.
        text: String,
        /// Provider tag for the block; see `ThinkingProvider` for the
        /// possible values.
        provider: ThinkingProvider,
        /// Presumably the provider replay state mentioned above —
        /// confirm against `ThinkingMetadata`.
        metadata: ThinkingMetadata,
    },

    /// A complete tool invocation request. The agent loop will execute
    /// it and feed the result back on the next turn.
    ToolUse {
        /// Identifier of this tool call.
        id: String,
        /// Name of the tool being invoked.
        name: String,
        /// Fully assembled JSON input for the tool; never a partial
        /// fragment (see the enum-level notes on atomicity).
        input: Value,
    },

    /// **Agent-level event** (not emitted by providers).
    ///
    /// Fired by `Agent::stream` after a `ToolUse` has been received and
    /// the model's turn has ended, **before** the executor's
    /// approval/policy gates run. Lets the consumer's UI render a
    /// "tool waiting for approval" prompt while
    /// [`ApprovalHandler::approve`](crate::ApprovalHandler::approve)
    /// blocks on user input.
    ///
    /// Order per tool call: `ToolUse{...}` → `ToolCallPending{...}`
    /// → handler returns Allow/Deny → tool runs (or denial result
    /// lands in next user turn). The actual decision flows through
    /// `ApprovalHandler`, not through this event.
    ///
    /// Only emitted by streaming runs; `Agent::run` (buffered) reaches
    /// the user only via the handler's blocking `approve()` call.
    ToolCallPending {
        /// Identifier of the pending call; presumably the same `id` as
        /// the preceding `ToolUse` — confirm against the emitter.
        id: String,
        /// Name of the tool awaiting approval.
        name: String,
        /// JSON input the tool would be run with.
        input: Value,
        /// Classification of the tool; semantics are defined by
        /// `ToolClass`.
        class: ToolClass,
    },

    /// Final stop reason from the provider for this turn.
    MessageDelta { stop_reason: StopReason },

    /// Token usage for this turn. Some providers emit it only at the
    /// end (Anthropic), others split input/output across events.
    ///
    /// Because usage may be split, consumers should not assume a single
    /// `Usage` event per turn.
    Usage(Usage),

    /// Stream terminated normally. No more events will follow.
    Done,
}

/// Boxed, object-safe stream of provider events. Used as the return
/// payload of `LlmProvider::stream`.
///
/// Each item is a `Result<StreamEvent, ProviderError>`: `Ok` carries
/// the next [`StreamEvent`], `Err` carries an error that surfaced after
/// the stream had already started.
///
/// The stream is type-erased behind `dyn Stream` so different providers
/// can return different concrete stream types. It is heap-allocated and
/// pinned so it can be polled without further pinning by the caller,
/// and the `Send` bound allows it to be moved to another thread.
pub type ProviderEventStream =
    Pin<Box<dyn Stream<Item = Result<StreamEvent, ProviderError>> + Send>>;