oxillama-server 0.1.3

OpenAI-compatible HTTP API server for OxiLLaMa
Documentation
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
//! Admin API statistics snapshot.

/// Point-in-time view of server-wide metrics, returned by the admin stats endpoint.
///
/// Every field is a plain `u64`, so a snapshot is cheap to clone and compare.
/// `Default` yields a snapshot with every value set to zero, and
/// `PartialEq`/`Eq` let two snapshots be compared field by field (handy in tests).
///
/// The struct derives `serde::Serialize` with no renaming attributes, so the
/// serialized field names are exactly the Rust field names declared below.
#[derive(Debug, Clone, Default, PartialEq, Eq, serde::Serialize)]
pub struct AdminStats {
    /// Total number of requests received, summed over all endpoints.
    pub requests_total: u64,
    /// Total number of tokens generated, summed over all requests.
    pub tokens_generated_total: u64,
    /// Total number of prompt tokens received.
    pub prompt_tokens_total: u64,
    /// Number of requests that are in flight at the moment of the snapshot.
    pub active_requests: u64,
    /// Depth of the inference queue at the moment of the snapshot.
    pub queue_depth: u64,
}