1pub mod aot_cache;
56pub mod attn_mask;
57pub mod backend;
58pub mod compile_cache;
59pub mod compiled;
60pub mod cost;
61pub mod device_ext;
62pub mod expert_pool;
63pub mod jacfwd;
64pub mod kernel_trace;
65pub mod kv_cache;
66pub mod lora_scheduler;
67pub mod memory_estimate;
68pub mod model_pipeline;
69pub mod moe_expert_store;
70pub mod op_registry;
71pub mod options;
72pub mod paged_kv;
73pub mod precision;
74pub mod record_replay;
75pub mod reflect;
76pub mod registry;
77pub mod router;
78pub mod session;
79pub mod stages;
80pub mod subgraph;
81pub mod trace;
82pub mod weight_registry;
83pub mod weights;
84pub mod worker_pool;
85pub use rlx_ir::perfetto;
90pub mod custom_ops;
91pub mod hwinfo;
92pub mod logit_verify;
93pub mod nan_check;
94pub mod phase;
95pub mod spec_decode;
96pub mod telemetry;
97pub mod validators;
98
99pub mod mock_requests;
102
103pub use rlx_driver::{Buffer, BufferHandle, CommandStream, Device, DeviceArena, SyncStream};
105pub use rlx_driver::{
107 CollectiveError, LocalTransport, Rank, SymmetricBuffer, SymmetricHeap, SymmetricTransport,
108};
109pub use aot_cache::{AotCache, AotCacheError};
111pub use backend::{Backend, ExecutableGraph, compile_hir, compile_module};
112pub use compile_cache::{
113 BucketedCompileCache, CacheRunInput, CompileCache, DynamicDimCompileCache, pad_rows, slice_rows,
114};
115pub use compiled::CompiledGraph;
116#[cfg(feature = "apple")]
117pub use device_ext::available_apple_devices;
118pub use device_ext::{
119 available_devices, dispatch_report_for_device, dispatch_report_for_device_with_options,
120 first_unsupported_op, first_unsupported_op_with_options, full_name, is_available,
121 legalize_graph_for_device, legalize_graph_for_device_with_options,
122 legalize_graph_for_device_with_report, supports, supports_graph, supports_graph_with_options,
123};
124pub use expert_pool::{
125 ExpertPool, ExpertPoolConfig, ExpertPoolStats, ExpertRefreshPolicy, ExpertRefreshResult,
126 MoEExecMode, gpu_expert_budget_from_vram,
127};
128pub use kv_cache::LayerKvCache;
129pub use memory_estimate::{MoeOffloadEstimate, estimate_moe_offload};
130pub use model_pipeline::ModelCompilePipeline;
131pub use options::CompileOptions;
132pub use precision::Precision;
133pub use reflect::{ModelReflection, load_hir_template_with_extensions, specialize_entry};
134pub use registry::{BackendFactory, backend_for, register_backend, registered_devices};
135#[cfg(feature = "cpu")]
136pub use rlx_cpu::moe_residency::MoeResidencyStats;
137#[cfg(feature = "cpu")]
138pub use rlx_cpu::moe_topk_capture::MoeTopkCapture;
139pub use rlx_driver::{ReduceKind, all_gather, all_reduce, reduce_scatter};
140pub use rlx_ir::env::{self, RlxEnv, RuntimeOverrides};
141pub use session::Session;
142pub use stages::{
143 compile_graph_stages, compile_graph_stages_for_backend, compile_hir_stages,
144 compile_module_stages, fusion_target_for, graph_from_lir, maybe_log_fusion,
145 options_with_supported_ops, pipeline_for,
146};
147pub use subgraph::{SubgraphCache, run_if, run_while};
148
149pub use expert_pool::{merged_resident_mask, per_layer_resident_masks};
150pub use moe_expert_store::{ExpertStackF32, LayerMoeWeights, MoeExpertStore};
151pub use weight_registry::{WeightEntry, WeightHandle, WeightKind, WeightRegistry};
152pub use weights::{BytesWeightLoader, WeightLoader};
153
154pub use rlx_ir::{AsyncCopy, BarrierToken, DoubleBuffer, SyncCopy};
158pub use rlx_ir::{CacheBuster, Tick, time_ns};
159
160pub use rlx_ir::{
162 inspect_graph, inspect_hir, inspect_hir_stats, inspect_lir, inspect_mir, inspect_mir_stats,
163};
164pub use rlx_opt::{OpKind, PrecisionPolicy};
165pub use rlx_opt::{PipelineInspect, inspect_pipeline};
166
167pub use rlx_ir::logical_kernel::{KernelDispatchConfig, KernelDispatchPolicy};
169pub use rlx_ir::op;
170pub use rlx_ir::{
171 BindingManifest, CompilationMode, DType, Graph, HirExtensionFn, HirReflection, IoBindingEntry,
172 ManifestDiff, ModelComponent, ModelPhase, ModelVariant, Node, NodeId, Op, Shape, WeightBlock,
173 apply_hir_extensions, register_hir_extension, registered_hir_extensions,
174};
175
176pub use rlx_macros::pipeline_schedule;
178pub use rlx_macros::rlx_model;