Struct InferenceResult

Source

/// Result of an inference call, including trace ID for outcome tracking.
pub struct InferenceResult {
    /// The generated text (empty if `tool_calls` are present).
    pub text: String,
    /// Tool calls returned by the model (when tools were provided in the request).
    pub tool_calls: Vec<ToolCall>,
    /// Structured bounding boxes parsed from Qwen2.5-VL grounding spans
    /// (`<|box_*|>`, `<|object_ref_*|>`) found in `text`. The raw span markers
    /// remain in `text`. Empty when the model didn't ground anything.
    pub bounding_boxes: Vec<BoundingBox>,
    /// Trace ID for reporting outcomes back to the tracker.
    pub trace_id: String,
    /// Which model was used.
    pub model_used: String,
    /// Wall-clock latency in milliseconds.
    pub latency_ms: u64,
    /// Time to first token in milliseconds. Populated by the local generate
    /// paths (Candle/MLX); `None` for paths that can't measure it without
    /// streaming (currently the non-streaming remote paths).
    ///
    /// Always serialized (as `null` when `None`) so downstream harnesses can
    /// tell "wasn't measured" apart from "field doesn't exist on this
    /// client's protocol version".
    pub time_to_first_token_ms: Option<u64>,
    /// Token usage statistics from the API response (`None` for local models).
    pub usage: Option<TokenUsage>,
    /// Provider-specific opaque output items emitted alongside the response
    /// (currently used by the OpenAI Responses API) that the next request must
    /// include verbatim. Empty for protocols that don't emit them.
    pub provider_output_items: Vec<Value>,
}

Expand description

Result of an inference call, including trace ID for outcome tracking.

Fields§

§text: String

The generated text (empty if tool_calls are present).

§tool_calls: Vec<ToolCall>

Tool calls returned by the model (when tools were provided in the request).

§bounding_boxes: Vec<BoundingBox>

Structured bounding boxes when the model emitted Qwen2.5-VL grounding spans (<|box_*|>, <|object_ref_*|>) in its text. Parsed from the same text field — the raw span markers remain visible in text for callers that need to see them verbatim. Empty vec when the model didn’t ground anything (typical for non-VL models or prompts that only ask for description).

§trace_id: String

Trace ID for reporting outcomes back to the tracker.

§model_used: String

Which model was used.

§latency_ms: u64

Wall-clock latency in ms.

§time_to_first_token_ms: Option<u64>

Time to first token in milliseconds. Populated by the local generate paths (Candle/MLX) which observe the prefill→first-decode transition directly. None for paths that can’t measure it honestly without streaming — currently the non-streaming remote paths. Callers needing TTFT on remote models should use InferenceEngine::generate_tracked_stream and time the first text event arrival themselves.

Always serialized (as null when None) so downstream validation harnesses can distinguish “wasn’t measured” from “field doesn’t exist on this client’s protocol version”.

§usage: Option<TokenUsage>

Token usage statistics from the API response (None for local models).

§provider_output_items: Vec<Value>

Provider-specific output items the protocol emitted alongside the response — currently used by the OpenAI Responses API to return reasoning blobs, encrypted_content, web-search results, etc. as opaque structured items the next request must include verbatim. Empty for protocols that don’t emit them (Chat Completions, Anthropic, Gemini, all local backends).

Callers carry these between turns by emitting them as a tasks::generate::Message::ProviderOutputItems message in the next request. Builder paths that don’t recognize the originating protocol drop the variant — the items are protocol-specific and have no portable rendering.

Struct InferenceResult Copy item path

Fields§

Implementations§

impl InferenceResult

pub fn has_tool_calls(&self) -> bool

Trait Implementations§

impl Clone for InferenceResult

fn clone(&self) -> InferenceResult

fn clone_from(&mut self, source: &Self)

impl Debug for InferenceResult

fn fmt(&self, f: &mut Formatter<'_>) -> Result

impl<'de> Deserialize<'de> for InferenceResult

fn deserialize<__D>(__deserializer: __D) -> Result<Self, __D::Error> where __D: Deserializer<'de>,

impl Serialize for InferenceResult

fn serialize<__S>(&self, __serializer: __S) -> Result<__S::Ok, __S::Error> where __S: Serializer,

Auto Trait Implementations§

impl Freeze for InferenceResult

impl RefUnwindSafe for InferenceResult

impl Send for InferenceResult

impl Sync for InferenceResult

impl Unpin for InferenceResult

impl UnsafeUnpin for InferenceResult

impl UnwindSafe for InferenceResult

Blanket Implementations§

impl<T> Any for T where T: 'static + ?Sized,

fn type_id(&self) -> TypeId

impl<T> Borrow<T> for T where T: ?Sized,

fn borrow(&self) -> &T

impl<T> BorrowMut<T> for T where T: ?Sized,

fn borrow_mut(&mut self) -> &mut T

impl<T> CloneToUninit for T where T: Clone,

unsafe fn clone_to_uninit(&self, dest: *mut u8)

impl<T> From<T> for T

fn from(t: T) -> T

impl<T> Instrument for T

fn instrument(self, span: Span) -> Instrumented<Self>

fn in_current_span(self) -> Instrumented<Self>

impl<T, U> Into<U> for T where U: From<T>,

fn into(self) -> U

impl<T> IntoEither for T

fn into_either(self, into_left: bool) -> Either<Self, Self>

fn into_either_with<F>(self, into_left: F) -> Either<Self, Self> where F: FnOnce(&Self) -> bool,

impl<T> Pointable for T

const ALIGN: usize

type Init = T

unsafe fn init(init: <T as Pointable>::Init) -> usize

unsafe fn deref<'a>(ptr: usize) -> &'a T

unsafe fn deref_mut<'a>(ptr: usize) -> &'a mut T

unsafe fn drop(ptr: usize)

impl<T> PolicyExt for T where T: ?Sized,

fn and<P, B, E>(self, other: P) -> And<T, P> where T: Policy<B, E>, P: Policy<B, E>,

fn or<P, B, E>(self, other: P) -> Or<T, P> where T: Policy<B, E>, P: Policy<B, E>,

impl<T> Same for T

type Output = T

impl<T> ToOwned for T where T: Clone,

type Owned = T

fn to_owned(&self) -> T

fn clone_into(&self, target: &mut T)

impl<T, U> TryFrom<U> for T where U: Into<T>,

type Error = Infallible

fn try_from(value: U) -> Result<T, <T as TryFrom<U>>::Error>

impl<T, U> TryInto<U> for T where U: TryFrom<T>,

type Error = <U as TryFrom<T>>::Error

fn try_into(self) -> Result<U, <U as TryFrom<T>>::Error>

impl<V, T> VZip<V> for T where V: MultiLane<T>,

fn vzip(self) -> V

impl<T> WithSubscriber for T

fn with_subscriber<S>(self, subscriber: S) -> WithDispatch<Self> where S: Into<Dispatch>,

fn with_current_subscriber(self) -> WithDispatch<Self>

impl<T> DeserializeOwned for T where T: for<'de> Deserialize<'de>,

impl<T> ErasedDestructor for T where T: 'static,

Struct InferenceResult

fn deserialize<D>(deserializer: D) -> Result<Self, D::Error>
where D: Deserializer<'de>,

fn serialize<S>(&self, serializer: S) -> Result<S::Ok, S::Error>
where S: Serializer,

impl<T> Any for T
where T: 'static + ?Sized,

impl<T> Borrow<T> for T
where T: ?Sized,

impl<T> BorrowMut<T> for T
where T: ?Sized,

impl<T> CloneToUninit for T
where T: Clone,

impl<T, U> Into<U> for T
where U: From<T>,

fn into_either_with<F>(self, into_left: F) -> Either<Self, Self>
where F: FnOnce(&Self) -> bool,

impl<T> PolicyExt for T
where T: ?Sized,

fn and<P, B, E>(self, other: P) -> And<T, P>
where T: Policy<B, E>, P: Policy<B, E>,

fn or<P, B, E>(self, other: P) -> Or<T, P>
where T: Policy<B, E>, P: Policy<B, E>,

impl<T> ToOwned for T
where T: Clone,

impl<T, U> TryFrom<U> for T
where U: Into<T>,

impl<T, U> TryInto<U> for T
where U: TryFrom<T>,

impl<V, T> VZip<V> for T
where V: MultiLane<T>,

fn with_subscriber<S>(self, subscriber: S) -> WithDispatch<Self>
where S: Into<Dispatch>,

impl<T> DeserializeOwned for T
where T: for<'de> Deserialize<'de>,

impl<T> ErasedDestructor for T
where T: 'static,