List of all items
Structs
- config::BackendConfig
- config::BatchConfig
- config::EngineConfig
- config::EngineModelConfig
- config::KvCacheConfig
- config::MemoryConfig
- config::MonitoringConfig
- config::PaddingConfig
- config::SamplingConfig
- config::SchedulerConfig
- config::SecurityConfig
- config::TokenizerConfig
- config::TruncationConfig
- ids::BatchId
- ids::ClientId
- ids::ModelId
- ids::RequestId
- ids::SessionId
- ids::TaskId
- ids::TokenId
- metrics::AllocationInfo
- metrics::BatchingMetrics
- metrics::BuildInfo
- metrics::CacheStats
- metrics::ComponentHealth
- metrics::ComponentStatus
- metrics::DetailedResourceUsage
- metrics::DiagnosticsReport
- metrics::DiskMetrics
- metrics::EngineMetrics
- metrics::EngineRequestProgress
- metrics::EngineRequestState
- metrics::EngineState
- metrics::EngineStatus
- metrics::ErrorEvent
- metrics::ErrorStats
- metrics::GpuMemoryDetails
- metrics::GpuMetrics
- metrics::HardwareConstraints
- metrics::HealthStatus
- metrics::LatencyMetrics
- metrics::LatencyRequirements
- metrics::MemoryUsage
- metrics::ModelMetrics
- metrics::NetworkIODetails
- metrics::NetworkMetrics
- metrics::PerformanceAnalysis
- metrics::PerformanceBottleneck
- metrics::PerformanceBreakdown
- metrics::PerformanceRecommendation
- metrics::PerformanceTrends
- metrics::PhaseMetrics
- metrics::PrefixCacheStats
- metrics::QueueMetrics
- metrics::RequestCharacteristics
- metrics::RequestMetrics
- metrics::ResourceMetrics
- metrics::RuntimeInfo
- metrics::SchedulerStats
- metrics::SpeculationConfig
- metrics::SystemInfo
- metrics::SystemMetrics
- metrics::ThroughputMetrics
- metrics::WarmupResult
- models::AttentionConfig
- models::ModelConfig
- models::ModelInfo
- models::ModelMemoryRequirements
- models::RopeScaling
- models::TokenUsage
- requests::BatchRequest
- requests::InferenceRequest
- requests::InferenceResponse
- requests::ScheduledRequest
- requests::StreamChunk
- sampling::MirostatParams
- sampling::SamplingParams
- sampling::SamplingPresets
- sampling::SpecialTokens
Enums
- config::BackendType
- config::KvCacheType
- config::PaddingStrategy
- config::SchedulingPolicy
- config::TokenizerType
- config::TruncationStrategy
- devices::DataType
- devices::Device
- errors::FerrumError
- metrics::HealthStatusType
- metrics::TrendDirection
- models::Activation
- models::ModelSource
- models::ModelType
- models::NormType
- models::QuantizationConfig
- requests::RequestState
- sampling::FinishReason
- sampling::Priority
- sampling::ResponseFormat