pub use rlx_core::{
BertConfig, EmbedGgufKind, FlowBuildExt, GgufDirGuide, GgufModelFamily, GgufTensorNameResolver,
LlamaFamilyGgufResolver, LoadOpts, LoadWeightsOptions, LoadedWeights, NomicBertConfig,
NomicVisionConfig, PassThroughGgufResolver, Qwen35NativeGgufResolver, RegisteredFormat,
ResolveOpts, ResolveWeightsOptions, STANDARD_DEVICE_NAMES, WeightDrainPolicy,
WeightFormatRegistration, WeightLoader, WeightMap, WeightMapSource, arch_registry,
assert_gguf_family, config, dataprocessing, flow_bridge, flow_util, format_for_extension,
gguf_architecture_str, gguf_dir_guide, gguf_f32_bytes_estimate, gguf_family_for_arch,
gguf_resolve, gguf_runner_hint, gguf_support, into_compile_parts, is_standard_device,
list_registered_formats, lm, load_from_path, load_weight_map_resolved, load_weights_resolved,
open as open_weights, open_map, open_map_with, open_with, register_gguf_tensor_resolver,
register_weight_format, resolve_weights_file, resolve_weights_file_with_options,
validate_sam_device, validate_standard_device, vision_ops_ir, weight_loader, weight_map,
weight_registry, weights,
};
pub use rlx_flow::{BuiltModel, CompileProfile};
pub mod bert {
pub use rlx_bert::bert::*;
}
pub mod bert_flow {
pub use rlx_bert::flow::*;
}
pub mod clinicalbert {
pub use rlx_clinicalbert::*;
}
pub mod nomic {
pub use rlx_nomic::nomic::*;
}
pub mod nomic_flow {
pub use rlx_nomic::flow::*;
}
pub mod vision {
pub use rlx_vision::vision::*;
}
pub mod vision_flow {
pub use rlx_vision::flow::*;
}
pub mod dinov2 {
pub use rlx_dinov2::*;
}
pub mod embed {
pub use rlx_embed::*;
}
pub mod flux2 {
pub use rlx_flux2::*;
}
pub mod diamond {
pub use rlx_diamond::*;
}
pub mod qwen3 {
pub use rlx_qwen3::*;
}
pub mod qwen35 {
pub use rlx_qwen35::*;
}
pub mod llama32 {
pub use rlx_llama32::*;
}
pub mod gemma {
pub use rlx_gemma::*;
}
pub mod llada2 {
pub use rlx_llada2::llada2::*;
}
pub mod tide {
pub use rlx_llada2::tide::*;
}
pub mod sam {
pub use rlx_sam::*;
}
pub mod sam2 {
pub use rlx_sam2::*;
}
pub mod sam3 {
pub use rlx_sam3::*;
}
pub mod vjepa2 {
pub use rlx_vjepa2::*;
}
pub mod wav2vec2_bert {
pub use rlx_wav2vec2_bert::*;
}
pub mod whisper {
pub use rlx_whisper::*;
}
pub mod vad {
pub use rlx_vad::*;
}
pub mod voxtral {
pub use rlx_voxtral::*;
}
pub mod voxtral_tts {
pub use rlx_voxtral_tts::*;
}
pub mod qwen3_tts {
pub use rlx_qwen3_tts::*;
}
pub mod locateanything {
pub use rlx_locateanything::*;
}
pub mod ocr {
pub use rlx_ocr::*;
}
pub mod neutts {
pub use rlx_neutts::*;
}
pub mod kittentts {
pub use rlx_kittentts::*;
}
pub use rlx_neutts::{
BackboneModel, DEFAULT_N_CTX, GenerationConfig, NeuCodecDecoder, NeuCodecEncoder, NeuTTS,
STOP_TOKEN, build_prompt, extract_ids,
};
#[deprecated(note = "use `rlx_models::ocr`")]
pub mod ocrs {
pub use rlx_ocr::*;
}
pub mod mistral {
pub use rlx_mistral::*;
}
pub mod bonsai {
pub use rlx_bonsai::*;
}
pub mod minicpm5 {
pub use rlx_minicpm5::*;
}
pub mod phi {
pub use rlx_phi::*;
}
pub mod omnicoder {
pub use rlx_omnicoder::*;
}
pub mod granite {
pub use rlx_granite::*;
}
pub mod cohere {
pub use rlx_cohere::*;
}
pub mod mask_hyper_matmul_ir {
pub use rlx_sam_ir::mask_hyper_matmul_ir::*;
}
pub mod mask_prompt_ir {
pub use rlx_sam_ir::mask_prompt_ir::*;
}
pub mod mlp_relu_ir {
pub use rlx_sam_ir::mlp_relu_ir::*;
}
pub mod twoway_transformer_ir {
pub use rlx_sam_ir::twoway_transformer_ir::*;
}
pub mod run;
mod sam_runner;
pub use rlx_core::flow_bridge::{
apply_compile_profile, compile_graph_encoder, compile_graph_legacy,
compile_graph_llama32_decode, compile_graph_llama32_prefill, compile_graph_qwen3_decode,
compile_graph_qwen3_prefill, compile_graph_qwen35_decode, compile_graph_qwen35_prefill,
compile_graph_sam, compile_graph_with_profile, load_compile_profile, profile_near_weights,
};
pub use rlx_core::flow_util::{
build_graph, built_from_graph, built_from_hir, built_from_hir_with_profile, compile_built,
compile_built_cpu, compile_graph_encoder_with_params, compile_graph_profile,
compile_graph_qwen3_prefill_with_params, compile_graph_qwen35_decode_with_params,
compile_graph_qwen35_prefill_with_params, compile_graph_sam_with_params, graph_from_built,
graph_from_hir,
};
pub use bert::{build_bert_graph, build_bert_graph_sized};
pub use bert_flow::{BertFlow, build_bert_built};
pub use dinov2::{
DinoV2Built, DinoV2Config, DinoV2Flow, DinoV2PreprocessWeights, build_dinov2_built,
build_dinov2_graph_sized,
};
pub use embed::{
Arch, BertTokenizer, EmbeddingModel, ImageEmbeddingModel, ModelArch, ModelInfo, Pooling,
RlxBertModel, RlxEmbed, RlxNomicModel, RlxVisionModel, TokenizedBatch, assemble_vision_hidden,
compile_model, detect_arch, embed_with_rlx, models_map,
};
pub use flux2::{
DEFAULT_TEXT_ENCODER_LAYERS, Flux2CfgCombineFlow, Flux2CfgCombineGraph, Flux2Checkpoint,
Flux2Config, Flux2Flow, Flux2ForwardBuilt, Flux2ForwardGraph, Flux2ForwardInput,
Flux2GraphParams, Flux2PromptOutput, Flux2Session, Flux2SessionCache, Flux2SessionKey,
Flux2TextEncoderBuilt, Flux2TextEncoderFlow, Flux2VaeConfig, Flux2VaeDecoderFlow,
Flux2VaeEncoderFlow, Flux2VaeGraph, Flux2VaeWeights, Flux2Weights, build_flux2_cfg_combine_hir,
build_flux2_forward_graph, build_flux2_forward_hir, build_flux2_minimal_graph,
build_flux2_minimal_hir, build_flux2_text_encoder_hir, cfg_combine, compile_flux2_cfg_combine,
compile_flux2_forward, compile_flux2_forward_via_flow, compile_flux2_minimal,
compile_flux2_text_encoder_hir, download_flux2_repo, encode_flux2_prompt,
encode_prompt_embeds_default_layers, encode_prompt_padded, extract_flux2_vae_weights,
extract_flux2_weights, extract_text_encoder_weights, flux2_decode_packed_latents,
flux2_prefers_compiled_hir, flux2_prefers_compiled_te, flux2_rgb_to_u8,
flux2_transformer_forward, host_temb, load_and_apply_flux2_lora, load_flux2_vae_weights,
load_flux2_weights, load_rgb_planar, load_text_encoder_weights, parse_lora_scale,
prepare_latent_ids, prepare_text_ids, prepare_weight_map, resolve_text_encoder_dir,
resolve_tokenizer_path, resolve_transformer_config, resolve_vae_dir, tiny_text_encoder_config,
};
pub use gemma::{
GemmaArch, GemmaConfig, GemmaFlow, GemmaGenerator, build_gemma_decode_graph_sized,
build_gemma_graph_sized, build_gemma_graph_sized_last_logits, build_gemma_graph_sized_packed,
encode_prompt as gemma_encode_prompt, encode_prompt_auto as gemma_encode_prompt_auto,
gemma_cfg_from_gguf, resolve_tokenizer_path as gemma_resolve_tokenizer_path,
};
pub use llada2::{
LLaDA2MoeConfig, LLaDA2Runner, LLaDA2RunnerBuilder, LLaDA2Weights, build_llada2_forward_graph,
default_memory_budget_bytes, validate_device as validate_llada2_device,
};
pub use llama32::{
Llama32Config, Llama32Flow, Llama32Generator, build_llama32_decode_graph_sized,
build_llama32_graph_sized, build_llama32_graph_sized_last_logits,
build_llama32_graph_sized_packed, encode_prompt as llama32_encode_prompt,
encode_prompt_auto as llama32_encode_prompt_auto, llama32_cfg_from_gguf,
resolve_tokenizer_path as llama32_resolve_tokenizer_path,
};
pub use nomic::{build_nomic_diagnostic_graph, build_nomic_graph_sized};
pub use nomic_flow::{NomicFlow, build_nomic_built};
pub use ocr::{
BLACK_VALUE, DEFAULT_ALPHABET, DecodeMethod, DetectionParams, DimOrder, HF_DETECTION_RTEN,
HF_DETECTION_ST, HF_RECOGNITION_RTEN, HF_RECOGNITION_ST, ImageSource, OcrConfig, OcrEngine,
OcrEngineParams, OcrInput, OcrOutput, OcrRunner, OcrRunnerBuilder, RotatedRect, TextChar,
TextLine, TextWord, resolve_model_dir,
};
pub use qwen3::{
Qwen3Config, Qwen3Flow, Qwen3Generator, Qwen3PrefillOpts, Qwen3Speculator, SampleOpts,
build_qwen3_graph_sized, build_qwen3_prefill_built, sample_token,
};
pub use qwen3_tts::{
HF_MODEL_ID_06B_CUSTOM as QWEN3_TTS_HF_MODEL_ID, PRESET_SPEAKERS as QWEN3_TTS_SPEAKERS,
Qwen3TtsBenchReport, Qwen3TtsConfig, Qwen3TtsRunner, Qwen3TtsWeightStore, TalkerEngine,
};
pub use qwen35::{
ChatMessage, ChatRole, MatWeight, Qwen35Config, Qwen35FullAttnLayer, Qwen35LayerFfn,
Qwen35LinearLayer, Qwen35MoeFfn, Qwen35MtpLayer, Qwen35PrefillOutput, Qwen35Runner,
Qwen35RunnerBuilder, Qwen35TrunkLayer, Qwen35Weights, build_qwen35_decode_graph,
build_qwen35_decode_hir_dynamic_ext, build_qwen35_graph_sized, build_qwen35_graph_sized_ext,
build_qwen35_graph_sized_stub, build_qwen35_prefill_cache_graph,
build_qwen35_prefill_cache_graph_ext, build_qwen35_prefill_cache_hir_dynamic_ext,
decode_step_feeds, encode_chat_auto, format_chatml, messages_from_prompt, mrope_prefill_feeds,
mrope_row_for_sections, mrope_slice_at_pos, mtp_draft_vocab_size, pack_input_ids,
parse_messages_json, recurrent_output_count, seed_cache_from_outputs,
supports_multimodal_mrope, synth as qwen35_synth, text_section_pos, validate_device,
zero_recurrent_inputs,
};
pub use rlx_flux2::{Flux2Output, Flux2Runner, Flux2RunnerBuilder};
pub use run::{
ConfigSource, DinoV2Output, DinoV2Runner, DinoV2RunnerBuilder, DinoV2Variant, Llama32Runner,
Llama32RunnerBuilder, LmRunner, ModelRunner, Precision, Qwen3Runner, Qwen3RunnerBuilder,
SamArch, SamPredictionAny, SamRunner, SamRunnerBuilder, Vjepa2Output, Vjepa2PoolOutput,
Vjepa2PredictOutput, Vjepa2Runner, Vjepa2RunnerBuilder, Wav2Vec2BertRunner,
Wav2Vec2BertRunnerBuilder, WeightFormat, debug_resolve_name, dispatch, dispatch_help,
list_mtp_keys, open_gguf_loader, open_loader, open_loader_resolved, open_loader_with_format,
register_runner, registered_runners, run_registered,
};
pub use sam::{
NeckWeights as SamNeckWeights, SamConfig, SamEncoderBuilt, SamEncoderConfig, SamEncoderFlow,
SamPreprocessWeights, apply_neck_host as sam_apply_neck_host,
assemble_patch_tokens as sam_assemble_patch_tokens, build_sam_encoder_built,
build_sam_encoder_graph, preprocess_image as sam_preprocess_image,
};
pub use sam2::{
FpnLevel as Sam2FpnLevel, FpnNeckWeights as Sam2FpnNeckWeights, Sam2, Sam2Config,
Sam2DecoderConfig, Sam2FpnConfig, Sam2HieraConfig, Sam2ImageEncoderBuilt, Sam2ImageEncoderFlow,
Sam2ImagePrediction, Sam2MaskDecoderOutput, Sam2MaskDecoderWeights, Sam2MemoryAttentionWeights,
Sam2MemoryConfig, Sam2MemoryEncoderConfig, Sam2MemoryEncoderOutput, Sam2MemoryEncoderWeights,
Sam2PreprocessWeights, Sam2PromptEncoderOutput, Sam2PromptEncoderWeights,
Sam2TwoWayTransformerWeights, Sam2VideoState, apply_fpn_neck as sam2_apply_fpn_neck,
apply_fpn_neck_host as sam2_apply_fpn_neck_host,
assemble_patch_tokens as sam2_assemble_patch_tokens, build_sam2_image_encoder_built,
build_sam2_image_encoder_graph, mask_decoder_forward as sam2_mask_decoder_forward,
memory_attention_forward as sam2_memory_attention_forward,
memory_encoder_forward as sam2_memory_encoder_forward,
preprocess_image as sam2_preprocess_image,
prompt_encoder_forward as sam2_prompt_encoder_forward,
two_way_transformer_forward as sam2_two_way_transformer_forward,
};
pub use sam3::{
Sam3, Sam3CompiledDecoder, Sam3Config, Sam3DetectorConfig, Sam3DetectorDecoderBuilt,
Sam3DetectorDecoderFlow, Sam3DetectorEncoderFlow, Sam3EncodedImage, Sam3ImagePrediction,
Sam3PreprocessWeights, Sam3TextConfig, Sam3TrackerConfig, Sam3VideoFramePrediction,
Sam3VideoState, Sam3VitConfig, assemble_patch_tokens as sam3_assemble_patch_tokens,
build_sam3_detector_decoder_built, build_sam3_detector_encoder_built,
build_sam3_detector_encoder_graph, forward_decoder_ir_on,
preprocess_image as sam3_preprocess_image,
};
pub use tide::{
BlockDenoiseConfig, BlockDenoiseLoop, GenerateConfig, PredictiveOffloadInfo,
PredictiveOffloadParams, TideOffloadStats, TideRunner, aggregate_offload_stats,
refresh_experts,
};
pub use vision::{VisionPreprocessWeights, build_vision_graph_sized};
pub use vision_flow::{NomicVisionBuilt, NomicVisionFlow, build_nomic_vision_built};
pub use vjepa2::{
Vjepa2Config, Vjepa2EncoderBuilt, Vjepa2EncoderFlow, Vjepa2EncoderOutput, Vjepa2EncoderWeights,
Vjepa2Masks, Vjepa2ModelWeights, Vjepa2PatchEmbedWeights, Vjepa2PoolerFlow,
Vjepa2PoolerWeights, Vjepa2PredictorFlow, Vjepa2PredictorWeights,
build_vjepa2_encoder_graph_sized, conv3d_patch_embed, encode_video_native,
extract_encoder_weights, extract_model_weights, extract_patch_embed_weights,
extract_pooler_weights, extract_predictor_weights, normalize_video_hwc, pool_native,
predict_native,
};
pub use voxtral::{
FAMILY as VOXTRAL_FAMILY, HF_MODEL_ID_MINI_3B, LanguageModelPrefixLoader,
MelSpectrogram as VoxtralMel, VoxtralAudioConfig, VoxtralConfig, VoxtralRunner,
VoxtralRunnerBuilder, VoxtralWeightPrefix, build_voxtral_decode_built,
build_voxtral_encoder_built, build_voxtral_prefill_built, build_voxtral_projector_built,
fuse_inputs_embeds, pcm_to_mel as voxtral_pcm_to_mel, transcription_prompt_ids,
};
pub use voxtral_tts::{
CodecDecoder, HF_MODEL_ID as VOXTRAL_TTS_HF_MODEL_ID, PRESET_VOICES as VOXTRAL_TTS_VOICES,
VoxtralTtsBenchReport, VoxtralTtsConfig, VoxtralTtsRunner, VoxtralTtsWeightStore,
};
pub use wav2vec2_bert::{
LogMelExtractor, LogMelFeatures, Wav2Vec2BertConfig, Wav2Vec2BertFlow,
Wav2Vec2BertPreprocessConfig, build_wav2vec2_bert_built, build_wav2vec2_bert_graph_sized,
load_wav_mono_f32,
};
pub use whisper::{
MelSpectrogram, WhisperConfig, WhisperDecoderFlow, WhisperEncoderFlow, WhisperKvCache,
WhisperRunner, WhisperRunnerBuilder, WhisperWeightPrefix, build_whisper_decode_step_built,
build_whisper_decoder_built, build_whisper_decoder_graph_sized,
build_whisper_decoder_prefill_built, build_whisper_encoder_built,
build_whisper_encoder_graph_sized, default_mel_frames, pcm_to_mel,
};