pub struct InferenceResponse {
pub request_id: RequestId,
pub text: String,
pub tokens: Vec<TokenId>,
pub finish_reason: FinishReason,
pub usage: TokenUsage,
pub latency_ms: u64,
pub created_at: DateTime<Utc>,
pub metadata: HashMap<String, Value>,
}

Inference response.
Fields§
request_id: RequestId — Request ID this response corresponds to
text: String — Generated text
tokens: Vec<TokenId> — Generated token IDs
finish_reason: FinishReason — Reason for completion
usage: TokenUsage — Token usage statistics
latency_ms: u64 — Total latency in milliseconds
created_at: DateTime<Utc> — Response creation timestamp
metadata: HashMap<String, Value> — Additional response metadata
Trait Implementations§
impl Clone for InferenceResponse
fn clone(&self) -> InferenceResponse
Returns a duplicate of the value.
fn clone_from(&mut self, source: &Self) (since 1.0.0)
Performs copy-assignment from source.
impl Debug for InferenceResponse
impl<'de> Deserialize<'de> for InferenceResponse
fn deserialize<__D>(__deserializer: __D) -> Result<Self, __D::Error>
where
    __D: Deserializer<'de>,
Deserialize this value from the given Serde deserializer.
Auto Trait Implementations§
impl Freeze for InferenceResponse
impl RefUnwindSafe for InferenceResponse
impl Send for InferenceResponse
impl Sync for InferenceResponse
impl Unpin for InferenceResponse
impl UnsafeUnpin for InferenceResponse
impl UnwindSafe for InferenceResponse
Blanket Implementations§
impl<T> BorrowMut<T> for T
where
    T: ?Sized,
fn borrow_mut(&mut self) -> &mut T
Mutably borrows from an owned value.