List of all items
Structs
- auto_config::AutoConfigDecision
- auto_config::CompiledKernelFeatures
- auto_config::FerrumConfigBuilder
- auto_config::HardwareCapabilities
- auto_config::ModelCapabilities
- auto_config::MoeCapabilities
- auto_config::RejectedCandidate
- auto_config::ResolvedFerrumConfig
- auto_config::WorkloadProfile
- config::BackendConfig
- config::BatchConfig
- config::EngineConfig
- config::EngineModelConfig
- config::KvCacheConfig
- config::MemoryConfig
- config::MonitoringConfig
- config::PaddingConfig
- config::RuntimeKnobs
- config::SamplingConfig
- config::SchedulerConfig
- config::SecurityConfig
- config::TokenizerConfig
- config::TruncationConfig
- ids::BatchId
- ids::ClientId
- ids::ModelId
- ids::RequestId
- ids::SessionId
- ids::TaskId
- ids::TokenId
- metrics::AllocationInfo
- metrics::BatchingMetrics
- metrics::BuildInfo
- metrics::CacheStats
- metrics::ComponentHealth
- metrics::ComponentStatus
- metrics::DetailedResourceUsage
- metrics::DiagnosticsReport
- metrics::DiskMetrics
- metrics::EngineMetrics
- metrics::EngineRequestProgress
- metrics::EngineRequestState
- metrics::EngineState
- metrics::EngineStatus
- metrics::ErrorEvent
- metrics::ErrorStats
- metrics::GpuMemoryDetails
- metrics::GpuMetrics
- metrics::HardwareConstraints
- metrics::HealthStatus
- metrics::LatencyMetrics
- metrics::LatencyRequirements
- metrics::MemoryUsage
- metrics::ModelMetrics
- metrics::NetworkIODetails
- metrics::NetworkMetrics
- metrics::PerformanceAnalysis
- metrics::PerformanceBottleneck
- metrics::PerformanceBreakdown
- metrics::PerformanceRecommendation
- metrics::PerformanceTrends
- metrics::PhaseMetrics
- metrics::PrefixCacheStats
- metrics::QueueMetrics
- metrics::RequestCharacteristics
- metrics::RequestMetrics
- metrics::ResourceMetrics
- metrics::RuntimeInfo
- metrics::SchedulerStats
- metrics::SpeculationConfig
- metrics::SystemInfo
- metrics::SystemMetrics
- metrics::ThroughputMetrics
- metrics::WarmupResult
- models::AttentionConfig
- models::ModelConfig
- models::ModelInfo
- models::ModelMemoryRequirements
- models::RopeScaling
- models::TokenUsage
- requests::ApiChatMessage
- requests::ApiChatRequest
- requests::ApiChatResponse
- requests::ApiCompletionRequest
- requests::ApiCompletionResponse
- requests::ApiFunction
- requests::ApiFunctionCall
- requests::ApiJsonSchema
- requests::ApiResponseFormat
- requests::ApiStreamOptions
- requests::ApiTool
- requests::ApiToolCall
- requests::ApiToolChoiceFunction
- requests::BatchRequest
- requests::InferenceRequest
- requests::InferenceResponse
- requests::ScheduledRequest
- requests::StreamChunk
- runtime_config::RuntimeConfigEntry
- runtime_config::RuntimeConfigSnapshot
- sampling::MirostatParams
- sampling::SamplingParams
- sampling::SamplingPresets
- sampling::SpecialTokens
Enums
- auto_config::AutoConfigError
- auto_config::AutoConfigSource
- auto_config::WorkloadPriority
- config::BackendType
- config::KvCacheDtype
- config::KvCacheType
- config::PaddingStrategy
- config::SchedulingPolicy
- config::TokenizerType
- config::TruncationStrategy
- devices::DataType
- devices::Device
- errors::FerrumError
- metrics::HealthStatusType
- metrics::TrendDirection
- models::Activation
- models::ModelSource
- models::ModelType
- models::NormType
- models::QuantizationConfig
- requests::ApiFunctionCallChoice
- requests::ApiMessageRole
- requests::ApiRequest
- requests::ApiResponse
- requests::ApiToolChoice
- requests::RequestState
- runtime_config::EnvTriState
- runtime_config::RuntimeConfigEffect
- runtime_config::RuntimeConfigSource
- sampling::FinishReason
- sampling::Priority
- sampling::ResponseFormat
Functions
- requests::api_response_from_generated_text
- requests::chat_api_may_emit_tool_or_function_call
- requests::chat_api_response_from_generated_text
- runtime_config::active_runtime_snapshot
- runtime_config::install_runtime_snapshot
- runtime_config::parse_bool_env_value
- runtime_config::parse_path_env_value
- runtime_config::parse_tri_state_env_value
- runtime_config::parse_usize_env_value