List of all items
Structs
- BackendConfig
- BatchId
- ClientId
- ComponentHealth
- ComponentStatus
- EngineConfig
- EngineMetrics
- EngineStatus
- HealthStatus
- InferenceRequest
- InferenceResponse
- MemoryUsage
- ModelId
- ModelInfo
- RequestId
- SamplingParams
- SchedulerConfig
- SchedulerStats
- SessionId
- SpecialTokens
- StreamChunk
- TaskId
- TokenId
- TokenizerConfig
- kv_cache::AllocationRequest
- kv_cache::BlockTable
- kv_cache::CacheConfig
- kv_cache::CacheGcStats
- kv_cache::CacheHandleStats
- kv_cache::CacheManagerStats
- kv_cache::CompressionStats
- kv_cache::LruEvictionPolicy
- kv_cache::MemoryPressureThresholds
- kv_cache::PrefixCacheConfig
- kv_dtype::KvBf16
- kv_dtype::KvFp16
- kv_dtype::KvFp8
- kv_dtype::KvInt8
- model_executor::DecodeInput
- model_executor::DecodeOutput
- model_executor::ExecutorAttentionConfig
- model_executor::ExecutorCapabilities
- model_executor::ExecutorConfig
- model_executor::ExecutorMemoryConfig
- model_executor::ExecutorMemoryUsage
- model_executor::ExecutorMetrics
- model_executor::ExecutorStatus
- model_executor::MemoryRequirements
- model_executor::OptimizationConfig
- model_executor::PrefillInput
- model_executor::PrefillOutput
- model_executor::SpeculativeDecodeOutput
- model_executor::UnifiedBatch
- model_executor::UnifiedBatchItem
- sampler::GreedySampler
- sampler::LogitsProcessorChain
- sampler::MultinomialSampler
- sampler::RepetitionPenaltyProcessor
- sampler::SamplingConfig
- sampler::SamplingConfigBuilder
- sampler::SamplingContext
- sampler::SamplingStats
- sampler::TemperatureProcessor
- sampler::TopKProcessor
- sampler::TopPProcessor
- scheduler::AllocatedResources
- scheduler::BatchHint
- scheduler::BatchPlan
- scheduler::BatchResourceRequirements
- scheduler::BottleneckAnalysis
- scheduler::ClientResourceLimits
- scheduler::DynamicBatchingConfig
- scheduler::FairShareConfig
- scheduler::PreemptionResult
- scheduler::PreemptionState
- scheduler::QueueAnalysis
- scheduler::RequestPatternAnalysis
- scheduler::ResourceAwarenessConfig
- scheduler::ResourceConstraints
- scheduler::ResourceLimits
- scheduler::ResourceStats
- scheduler::ScheduledRequest
- scheduler::SchedulingSimulationResult
- scheduler::SeasonalityPattern
- scheduler::SimulatedWorkload
- scheduler::SlaConfig
- scheduler::SlaRequirements
- scheduler::WaitTimeDistribution
- tensor::TensorMemoryStats
- tokenizer::ChatMessage
- tokenizer::PaddingConfig
- tokenizer::TokenizerConfig
- tokenizer::TokenizerInfo
- tokenizer::TokenizerStats
- tokenizer::TruncationConfig
Enums
- DataType
- Device
- FerrumError
- FinishReason
- ModelSource
- ModelType
- Priority
- kv_cache::MemoryPressure
- model_executor::AttentionType
- model_executor::ExecutorState
- model_executor::ExecutorType
- sampler::ProcessorPriority
- scheduler::AdmissionDecision
- scheduler::ArrivalPattern
- scheduler::BottleneckType
- scheduler::RateTrend
- scheduler::SchedulingPolicy
- scheduler::SizeDistribution
- tokenizer::PaddingDirection
- tokenizer::PaddingStrategy
- tokenizer::TokenType
- tokenizer::TokenizerType
- tokenizer::TruncationStrategy
Traits
- engine::AdvancedInferenceEngine
- engine::EmbedEngine
- engine::InferenceEngine
- engine::LlmInferenceEngine
- engine::TranscribeEngine
- engine::TtsEngine
- kv_cache::AdvancedKvCacheManager
- kv_cache::BlockAllocator
- kv_cache::CacheEvictionPolicy
- kv_cache::KvCacheHandle
- kv_cache::KvCacheManager
- kv_cache::MultiDeviceCacheManager
- kv_dtype::KvDtypeKind
- model_executor::BatchModelExecutor
- model_executor::ExecutorRegistry
- model_executor::ModelExecutor
- model_executor::ModelExecutorFactory
- model_executor::SpeculativeExecutor
- sampler::LogitsProcessor
- sampler::MultiSampler
- sampler::Sampler
- scheduler::AdmissionPolicy
- scheduler::AdvancedScheduler
- scheduler::Scheduler
- tensor::AsyncTensorOps
- tensor::TensorBatchOps
- tensor::TensorDataAccess
- tensor::TensorFactory
- tensor::TensorLike
- tensor::TensorMemoryManager
- tensor::TensorOps
- tokenizer::AsyncTokenizer
- tokenizer::IncrementalTokenizer
- tokenizer::TextProcessor
- tokenizer::Tokenizer
- tokenizer::TokenizerCapabilities
- tokenizer::TokenizerFactory
- tokenizer::TokenizerRegistry