1pub mod attention;
2pub mod baseline;
3pub mod benchmark;
4pub mod beta_branch;
5pub mod checkpoint;
6pub mod compressor;
7pub mod config;
8pub mod data;
9pub mod delta_operator;
10pub mod delta_res_block;
11pub mod embed_expander;
12pub mod error;
13pub mod eval;
14pub mod generation;
15pub mod k_branch;
16pub mod lm;
17pub mod mlp;
18pub mod rms_norm;
19pub mod rope;
20pub mod shortconv;
21pub mod spectral;
22pub mod training;
23pub mod transformer;
24pub mod utils;
25pub mod v_branch;
26pub mod variant;
27
28pub use attention::{MultiHeadAttention, MultiHeadAttentionConfig};
29pub use baseline::{BaselineTransformer, BaselineTransformerBlock};
30pub use benchmark::{
31 BenchmarkCase, BenchmarkComparisonReport, BenchmarkConfig, BenchmarkDelta, BenchmarkError,
32 BenchmarkGateOutcome, BenchmarkMemory, BenchmarkRegressionThresholds, BenchmarkReport,
33 BenchmarkSuite, BenchmarkTarget, BenchmarkTiming, CompressorBenchmarks,
34 DeltaOperatorBenchmarks, DeltaResBlockBenchmarks, ModelBenchmark, ModelBenchmarkComparison,
35 ModelBenchmarkSummary, ModelMemoryBreakdown, NormalizationBenchmarks,
36 compare_benchmark_reports, run_benchmarks,
37};
38pub use beta_branch::BetaBranch;
39pub use checkpoint::{
40 CheckpointError, CheckpointManifest, LoadedTrainingArtifact, load_checkpoint, load_manifest,
41 load_training_artifact, load_training_comparison_report, load_training_report, save_checkpoint,
42 save_training_artifact, save_training_comparison_report, save_training_report,
43 save_training_sweep,
44};
45pub use compressor::{ChannelConvCompressor, TokenConvCompressor};
46pub use config::{CompressionVariant, DdlConfig, DdlMapping};
47pub use data::{
48 TailStrategy, TokenBatch, TokenBatcher, TokenBatchingConfig, TokenDataset, TokenDatasetSummary,
49};
50pub use delta_operator::DeltaOperator;
51pub use delta_res_block::DeltaResBlock;
52pub use embed_expander::EmbeddingExpander;
53pub use error::{BaselineConfigError, ConfigValidationError, DataValidationError, SpectralError};
54pub use eval::{
55 ComparisonReport, DatasetComparisonReport, DatasetTiming, DatasetVariantEvaluation, EvalError,
56 VariantEvaluation, compare_variants, compare_variants_on_dataset,
57 compare_variants_on_dataset_with_diagnostics, compare_variants_with_diagnostics,
58 evaluate_variant, evaluate_variant_on_dataset, evaluate_variant_on_dataset_with_diagnostics,
59 evaluate_variant_with_diagnostics,
60};
61pub use generation::{
62 AutoregressiveModel, FinishReason, GenerationConfig, GenerationError, GenerationResult,
63 GenerationStep, generate_tokens,
64};
65pub use k_branch::{KMapBranch, VMapKBranch};
66pub use lm::{
67 CausalLmLossSummary, CausalLmMetrics, aggregate_causal_lm_summaries,
68 causal_language_model_loss, causal_language_model_metrics,
69 causal_language_model_metrics_with_lengths, causal_language_model_summary,
70 causal_language_model_summary_with_lengths,
71};
72pub use mlp::{SwiGluMlp, SwiGluMlpConfig};
73pub use spectral::{
74 BetaHistogram, DeltaRegime, DeltaResInfo, LayerDiagnostics, LayerSpectralInfo,
75 ModelDiagnostics, SpectralCollector, SpectralDiagnostics, SpectralInfo, Sublayer,
76};
77pub use training::{
78 CosineWarmupSchedule, TrainingComparisonReport, TrainingConfig, TrainingError, TrainingOutcome,
79 TrainingReport, TrainingSpectralSnapshot, TrainingStepMetrics, TrainingSweepOutcome,
80 resume_training, train_variant, train_variants,
81};
82pub use transformer::{DdlTransformer, DdlTransformerBlock};
83pub use v_branch::{MatrixValueBranch, ScalarValueBranch};
84pub use variant::{DiagnosticLevel, ModelInstance, ModelOutput, ModelVariant};