List of all items
Structs
- backends::avx2::Avx2Backend
- backends::avx512::Avx512Backend
- backends::gpu::BufferId
- backends::gpu::GpuBackend
- backends::gpu::GpuCommandBatch
- backends::gpu::GpuDevice
- backends::gpu::GpuDevicePool
- backends::gpu::GpuMatmulCache
- backends::gpu::MaxOp
- backends::gpu::MinOp
- backends::gpu::PartitionView
- backends::gpu::QkvLoRA
- backends::gpu::SumOp
- backends::gpu::TensorView
- backends::gpu::TileInfo
- backends::gpu::WgslForwardPass
- backends::scalar::ScalarBackend
- backends::sse2::Sse2Backend
- blis::backend_selection::BackendCostModel
- blis::backend_selection::PtxMicrokernelSpec
- blis::backend_selection::UnifiedBrickProfiler
- blis::backend_selection::WgslMicrokernelSpec
- blis::cache_topology::BlisBlocking
- blis::cache_topology::CacheTopology
- blis::jidoka::JidokaGuard
- blis::parallel::HeijunkaScheduler
- blis::prepacked::PrepackedB
- blis::profiler::BlisLevelStats
- blis::profiler::BlisProfiler
- blis::profiler::KaizenMetrics
- brick::AddOp
- brick::AlignedBuffer
- brick::AmxTileConfig
- brick::AssertionResult
- brick::AsyncTaskProfiler
- brick::AttentionOp
- brick::AttentionTraceConfig
- brick::AttentionWeightTrace
- brick::Balance211Iter
- brick::BlockQ5K
- brick::BlockQ6K
- brick::BoundedQueue
- brick::BrickIdTimer
- brick::BrickLayer
- brick::BrickProfiler
- brick::BrickSample
- brick::BrickStats
- brick::BrickTimer
- brick::BrickVerification
- brick::BufferWatermarks
- brick::ByteBudget
- brick::CacheAligned
- brick::CategoryStats
- brick::CircuitBreaker
- brick::ComputeBrick
- brick::ConnectionState
- brick::DivergenceInfo
- brick::DotOp
- brick::DotQ5KOp
- brick::DotQ6KOp
- brick::DualWakerState
- brick::ExecutionEdge
- brick::ExecutionGraph
- brick::ExecutionNodeId
- brick::FusedGateUpOp
- brick::FusedGateUpWeights
- brick::FusedQKVOp
- brick::FusedQKVWeights
- brick::GracefulShutdown
- brick::GraphReuseCounter
- brick::KeepAliveConfig
- brick::KernelChecksum
- brick::KvCacheManager
- brick::KvCacheSessionTrace
- brick::KvCacheSlotInfo
- brick::KvCacheStateTrace
- brick::LayerActivationTrace
- brick::LazySimdConfig
- brick::LogitEvolutionTrace
- brick::ManagedConnection
- brick::MatmulOp
- brick::ModelActivationTrace
- brick::ModelQuantizationError
- brick::ModelTracer
- brick::ModelTracerConfig
- brick::ModelTracerSummary
- brick::PerfMetrics
- brick::PooledResource
- brick::PtxRegistry
- brick::QuantizationErrorTrace
- brick::ResourcePool
- brick::SequentialBatchOrderer
- brick::ServeLimits
- brick::ShutdownGuard
- brick::SoftmaxOp
- brick::StrategicBuffer
- brick::StreamCapacity
- brick::TensorStats
- brick::TileStats
- brick::TileTimer
- brick::TokenBudget
- brick::TokenLogitEvolution
- brick::TokenResult
- brick::UnrollTailIterator
- brick::WakeSkipState
- brick::WatermarkedBuffer
- chaos::ChaosConfig
- contracts::QuantFormat
- contracts::WeightBufferError
- eigen::EigenIterator
- eigen::SymmetricEigen
- hardware::CpuCapability
- hardware::GpuCapability
- hardware::HardwareCapability
- hardware::RooflineParams
- inference::generate::Rng
- inference::generate::SampleParams
- inference::gguf::GgufFile
- inference::gguf::TensorInfo
- inference::model::ForwardArena
- inference::model::KvCache
- inference::model::LayerWeights
- inference::model::LlamaModel
- inference::model::ModelConfig
- inference::model::ModelWeights
- matrix::Matrix
- monitor::DeviceId
- monitor::GpuClockMetrics
- monitor::GpuDeviceInfo
- monitor::GpuMemoryMetrics
- monitor::GpuMetrics
- monitor::GpuMonitor
- monitor::GpuPcieMetrics
- monitor::GpuPowerMetrics
- monitor::GpuThermalMetrics
- monitor::GpuUtilization
- monitor::MonitorConfig
- simulation::BackendSelector
- simulation::BackendTolerance
- simulation::BufferRenderer
- simulation::ColorPalette
- simulation::GoldenBaseline
- simulation::HeijunkaScheduler
- simulation::JidokaGuard
- simulation::NeedsSeed
- simulation::PixelDiffResult
- simulation::Ready
- simulation::Rgb
- simulation::SimTestConfig
- simulation::SimTestConfigBuilder
- simulation::SimulationTest
- simulation::StressAnomaly
- simulation::StressResult
- simulation::StressTestConfig
- simulation::StressThresholds
- simulation::VisualRegressionConfig
- tiling::TcbGeometry
- tiling::TcbIndexCalculator
- tiling::TiledQ4KMatvec
- tiling::TilingConfig
- tiling::TilingStats
- tuner::BottleneckClassifier
- tuner::BottleneckPrediction
- tuner::BrickTuner
- tuner::CalibrationResult
- tuner::ConceptDriftStatus
- tuner::FeatureExtractor
- tuner::KernelArm
- tuner::KernelBandit
- tuner::KernelClassifier
- tuner::KernelRecommendation
- tuner::OnlineLearner
- tuner::RunConfig
- tuner::ThroughputPrediction
- tuner::ThroughputRegressor
- tuner::TrainingSample
- tuner::TrainingStats
- tuner::TunerDataCollector
- tuner::TunerFeatures
- tuner::TunerFeaturesBuilder
- tuner::TunerRecommendation
- vector::Vector
Enums
- Backend
- OpComplexity
- OperationType
- backends::gpu::MemoryLayout
- blis::backend_selection::BrickLevel
- blis::backend_selection::ComputeBackend
- blis::backend_selection::RooflineResult
- blis::jidoka::JidokaError
- blis::profiler::BlisProfileLevel
- brick::AsyncResult
- brick::BatchSplitStrategy
- brick::BrickBottleneck
- brick::BrickCategory
- brick::BrickError
- brick::BrickId
- brick::CircuitState
- brick::ComputeAssertion
- brick::ComputeBackend
- brick::EdgeType
- brick::ExecutionNode
- brick::FlowControlError
- brick::InferencePhase
- brick::LimitError
- brick::MemoryAdvice
- brick::PrefetchLocality
- brick::QuantType
- brick::ReserveStrategy
- brick::ShutdownResult
- brick::SimdBackendState
- brick::SyncMode
- brick::TileLevel
- brick::TransferDirection
- brick::UnrollFactor
- brick::WakeDecision
- chaos::ChaosError
- contracts::TensorLayout
- error::TruenoError
- hardware::Bottleneck
- hardware::GpuBackend
- hardware::SimdWidth
- inference::gguf::GgmlType
- inference::gguf::MetadataValue
- inference::model::WeightMatrix
- monitor::DeviceType
- monitor::GpuBackend
- monitor::GpuVendor
- monitor::MonitorError
- simulation::BackendCategory
- simulation::JidokaAction
- simulation::JidokaCondition
- simulation::JidokaError
- simulation::StressAnomalyKind
- tiling::PackingLayout
- tiling::PrefetchLocality
- tiling::TcbLevel
- tiling::TilingBackend
- tiling::TilingError
- tuner::BottleneckClass
- tuner::ExperimentSuggestion
- tuner::KernelType
- tuner::QuantType
- tuner::UserFeedback
- tuner::error::TunerError
Traits
Macros
- dispatch_binary_op
- dispatch_reduction
- dispatch_unary_op
- time_brick
- vector::dispatch::dispatch_binary_op
- vector::dispatch::dispatch_reduction
- vector::dispatch::dispatch_unary_op
Functions
- activations::f16_to_f32
- activations::f32_to_f16
- activations::gelu_scalar
- activations::relu_scalar
- activations::sigmoid_scalar
- activations::silu_scalar
- activations::tanh_scalar
- backends::gpu::runtime::block_on
- backends::gpu::runtime::console_log
- backends::gpu::runtime::sync_available
- backends::gpu::tiled_max_2d
- backends::gpu::tiled_min_2d
- backends::gpu::tiled_reduce_2d
- backends::gpu::tiled_reduce_partial
- backends::gpu::tiled_sum_2d
- backends::q4k::dequantize_q4k_to_f32
- backends::q4k::matmul_q4k_f32
- backends::q4k::matmul_q4k_f32_colmajor
- backends::q4k::matmul_q4k_f32_colmajor_dispatch
- backends::q4k::matmul_q4k_f32_dispatch
- backends::q4k::matmul_q4k_f32_scalar
- backends::q6k::matmul_q6k_f32
- backends::q6k::matmul_q6k_f32_colmajor
- backends::q6k::matmul_q6k_f32_colmajor_dispatch
- backends::q6k::matmul_q6k_f32_dispatch
- backends::q6k::matmul_q6k_f32_scalar
- blis::attention::fused_attention_decode
- blis::backend_selection::gemm_auto
- blis::cache_topology::blocking_64x6_bcast_b
- blis::cache_topology::blocking_8x16
- blis::cache_topology::blocking_8x32
- blis::cache_topology::blocking_8x48
- blis::cache_topology::topology
- blis::compute::gemm_blis
- blis::compute::gemm_blis_broadcast_b
- blis::compute::gemm_blis_with_prepacked_b
- blis::elementwise::add
- blis::elementwise::add_alloc
- blis::elementwise::add_inplace
- blis::elementwise::fused_add_relu
- blis::elementwise::fused_add_relu_inplace
- blis::elementwise::fused_mul_add
- blis::elementwise::fused_scale_bias_relu
- blis::elementwise::mul_scalar
- blis::elementwise::mul_scalar_alloc
- blis::elementwise::relu
- blis::elementwise::relu_alloc
- blis::elementwise::relu_inplace
- blis::elementwise::scale_inplace
- blis::gemm
- blis::gemm_bias_relu
- blis::gemm_profiled
- blis::gemv::gemv
- blis::gemv::gemv_avx2
- blis::gemv::gemv_scalar
- blis::microkernels::codegen::microkernel_32x6_avx512_bcast_b
- blis::microkernels::codegen::microkernel_48x6_avx512_bcast_b
- blis::microkernels::codegen::microkernel_64x6_avx512_bcast_b
- blis::microkernels::codegen::microkernel_8x16_avx512_gen
- blis::microkernels::codegen::microkernel_8x32_avx512_gen
- blis::microkernels::codegen::microkernel_8x48_avx512_gen
- blis::microkernels::microkernel_16x8_avx512
- blis::microkernels::microkernel_32x6_avx512
- blis::microkernels::microkernel_8x6_avx2
- blis::microkernels::microkernel_8x6_avx2_asm
- blis::microkernels::microkernel_8x6_true_asm
- blis::microkernels::microkernel_8x8_avx2_fma
- blis::microkernels::microkernel_scalar
- blis::norms::layer_norm
- blis::norms::layer_norm_alloc
- blis::norms::rms_norm
- blis::norms::rms_norm_alloc
- blis::packing::pack_a
- blis::packing::pack_b
- blis::packing::packed_a_size
- blis::packing::packed_a_size_512
- blis::packing::packed_a_size_v2
- blis::packing::packed_b_size
- blis::packing::packed_b_size_512
- blis::packing::packed_b_size_v2
- blis::parallel::gemm_blis_parallel
- blis::parallel::gemm_blis_parallel_shared_b
- blis::parallel::gemm_blis_parallel_with_prepacked_b
- blis::reference::gemm_reference
- blis::reference::gemm_reference_with_jidoka
- blis::softmax::softmax_1d_alloc
- blis::transpose::transpose
- brick::balance211
- brick::cached_nanos
- brick::cached_nanos_or_now
- brick::cpu_cycles
- brick::fnv1a_f32_checksum
- brick::get_page_faults
- brick::init_time_service
- brick::is_direct_io_aligned
- brick::madvise_region
- brick::prefetch_for_inference
- brick::prefetch_ptr
- brick::prefetch_slice
- brick::reserve_capacity
- brick::split_batch
- brick::unroll_tail_process
- brick::with_page_fault_tracking
- contracts::format_by_ggml_type
- contracts::validate_f32_buffer
- contracts::validate_gemv_shapes
- contracts::validate_weight_buffer
- hardware::default_hardware_path
- hash::hash_bytes
- hash::hash_key
- hash::hash_keys_batch
- hash::hash_keys_batch_with_backend
- inference::generate::generate
- inference::generate::sample_token
- monitor::backends::cuda_monitor_available
- monitor::backends::enumerate_cuda_devices
- monitor::backends::query_cuda_device_info
- monitor::backends::query_cuda_memory
- select_backend_for_operation
- select_best_available_backend
- tiling::extract_scale_min_6bit
- tiling::f16_to_f32
- tiling::optimal_prefetch_distance
- tiling::pack_a_index
- tiling::pack_b_index
- tiling::swizzle_index
Type Aliases
Constants
- backends::gpu::TILE_SIZE
- backends::gpu::shaders::CAUSAL_ATTENTION_SHADER
- backends::gpu::shaders::COLUMN_GATHER_SHADER
- backends::gpu::shaders::COLUMN_SCATTER_SHADER
- backends::gpu::shaders::LORA_ADDMM_SHADER
- backends::gpu::shaders::MATMUL_SHADER
- backends::gpu::shaders::TILED_GEMM_SHADER
- backends::gpu::shaders::TRANSPOSE_SHADER
- backends::gpu::shaders::backward::ADAMW_STEP_SHADER
- backends::gpu::shaders::backward::CROSS_ENTROPY_BACKWARD_SHADER
- backends::gpu::shaders::backward::CROSS_ENTROPY_FORWARD_SHADER
- backends::gpu::shaders::backward::GEMM_BACKWARD_A_SHADER
- backends::gpu::shaders::backward::GEMM_BACKWARD_B_SHADER
- backends::gpu::shaders::backward::NF4_DEQUANT_SHADER
- backends::gpu::shaders::backward::RMSNORM_BACKWARD_SHADER
- backends::gpu::shaders::backward::ROPE_BACKWARD_SHADER
- backends::gpu::shaders::backward::SILU_BACKWARD_SHADER
- blis::KC
- blis::KC_512
- blis::KC_512V2
- blis::MC
- blis::MC_512
- blis::MC_512V2
- blis::MR
- blis::MR_512
- blis::MR_512V2
- blis::NC
- blis::NC_512
- blis::NC_512V2
- blis::NR
- blis::NR_512
- blis::NR_512V2
- brick::CACHE_LINE_SIZE
- brick::CACHE_LINE_SIZE_F32
- brick::DIRECT_IO_ALIGNMENT
- contracts::ALL_FORMATS
- contracts::Q4_0
- contracts::Q4_1
- contracts::Q4_K
- contracts::Q4_K_BLOCK_BYTES
- contracts::Q4_K_BLOCK_SIZE
- contracts::Q5_0
- contracts::Q5_K
- contracts::Q5_K_BLOCK_BYTES
- contracts::Q5_K_BLOCK_SIZE
- contracts::Q6_K
- contracts::Q6_K_BLOCK_BYTES
- contracts::Q6_K_BLOCK_SIZE
- contracts::Q8_0
- contracts::STACK_LAYOUT
- tiling::Q4K_SUPERBLOCK_BYTES
- tiling::Q4K_SUPERBLOCK_SIZE
- tuner::pretrained::FEATURE_IMPORTANCE
- tuner::pretrained::KERNEL_WEIGHTS
- tuner::pretrained::THROUGHPUT_WEIGHTS