//! Crate root.
//!
//! Declares the crate's public modules and re-exports selected items from
//! them (plus a few types from the `arrow` crate) so that callers can import
//! those items directly from the crate root.

// Crate-wide lint policy: `unsafe` code, undocumented public items, and
// `.unwrap()` / `.expect()` calls are all rejected at compile time.
#![deny(unsafe_code)]
#![deny(missing_docs)]
#![deny(clippy::unwrap_used)]
#![deny(clippy::expect_used)]
// Test builds only: re-allow `unwrap` / `expect` and relax the listed clippy
// lints so that test code is not held to the same policy as library code.
#![cfg_attr(
test,
allow(
clippy::unwrap_used,
clippy::expect_used,
clippy::cast_lossless,
clippy::cast_possible_truncation,
clippy::cast_possible_wrap,
clippy::cast_precision_loss,
clippy::cloned_ref_to_slice_refs,
clippy::redundant_clone,
clippy::needless_collect,
clippy::too_many_lines,
clippy::for_kv_map,
clippy::bool_to_int_with_if,
clippy::float_cmp,
clippy::iter_on_single_items,
clippy::similar_names,
clippy::unreadable_literal
)
)]
// Clippy lints allowed for the whole crate in every build configuration.
// NOTE(review): the reason for each of these allows is not recorded here;
// consider documenting why each one is needed.
#![allow(clippy::doc_markdown)]
#![allow(clippy::uninlined_format_args)]
#![allow(clippy::redundant_closure_for_method_calls)]
#![allow(clippy::map_unwrap_or)]
#![allow(clippy::useless_conversion)]
// Public modules.
//
// A module preceded by `#[cfg(feature = "...")]` is compiled only when that
// Cargo feature is enabled; every other module is always part of the build.

// Compiled only with the `tokio-runtime` feature.
#[cfg(feature = "tokio-runtime")]
pub mod async_prefetch;
pub mod backend;
// Compiled only with the `cli` feature.
#[cfg(feature = "cli")]
pub mod cli;
pub mod dataloader;
pub mod dataset;
pub mod datasets;
pub mod drift;
pub mod error;
pub mod federated;
pub mod format;
// Compiled only with the `hf-hub` feature.
#[cfg(feature = "hf-hub")]
pub mod hf_hub;
pub mod imbalance;
// Compiled only with the `mmap` feature.
#[cfg(feature = "mmap")]
pub mod mmap;
pub mod parallel;
pub mod quality;
pub mod registry;
pub mod serve;
pub mod sketch;
pub mod split;
pub mod streaming;
pub mod tensor;
pub mod transform;
// Gated on the `shuffle` feature (not a feature named after the module); the
// `WeightedDataLoader` re-export further down uses the same gate.
#[cfg(feature = "shuffle")]
pub mod weighted;
// NOTE(review): `doctest`, `repl` and `tui` sit outside the alphabetical
// ordering used for the modules above.
// Compiled only with the `doctest` feature.
#[cfg(feature = "doctest")]
pub mod doctest;
// Compiled only with the `repl` feature.
#[cfg(feature = "repl")]
pub mod repl;
pub mod tui;
// Crate-root re-exports.
//
// Each `pub use` below makes the listed items importable directly from the
// crate root. A re-export preceded by `#[cfg(feature = "...")]` exists only
// when that Cargo feature is enabled. Modules declared above that have no
// re-export here are reachable only through their module path.

// Types re-exported from the external `arrow` crate.
pub use arrow::{
array::RecordBatch,
datatypes::{Schema, SchemaRef},
};
// Same `tokio-runtime` gate as the `async_prefetch` module declaration.
#[cfg(feature = "tokio-runtime")]
pub use async_prefetch::{AsyncPrefetchBuilder, AsyncPrefetchDataset, SyncPrefetchDataset};
pub use dataloader::DataLoader;
pub use dataset::{ArrowDataset, CsvOptions, Dataset, JsonOptions};
// Same `doctest` gate as the `doctest` module declaration.
#[cfg(feature = "doctest")]
pub use doctest::{DocTest, DocTestCorpus, DocTestParser};
pub use drift::{ColumnDrift, DriftDetector, DriftReport, DriftSeverity, DriftTest};
// Crate-level `Error` and `Result` names, taken from the `error` module.
pub use error::{Error, Result};
pub use federated::{
FederatedSplitCoordinator, FederatedSplitStrategy, GlobalSplitReport, NodeSplitInstruction,
NodeSplitManifest, NodeSummary, SplitQualityIssue,
};
pub use imbalance::{
ClassDistribution, ImbalanceDetector, ImbalanceMetrics, ImbalanceRecommendation,
ImbalanceReport, ImbalanceSeverity, ResampleStrategy, sqrt_inverse_weights,
};
// `resample` is re-exported separately from the rest of `imbalance` because
// this re-export is only compiled with the `shuffle` feature.
#[cfg(feature = "shuffle")]
pub use imbalance::resample;
// Same `mmap` gate as the `mmap` module declaration.
#[cfg(feature = "mmap")]
pub use mmap::{MmapDataset, MmapDatasetBuilder};
pub use parallel::{ParallelDataLoader, ParallelDataLoaderBuilder};
pub use quality::{ColumnQuality, QualityChecker, QualityIssue, QualityProfile, QualityReport, TextColumnStats};
pub use sketch::{
Centroid, DDSketch, DataSketch, DistributedDriftDetector, SketchDriftResult, SketchType,
TDigest,
};
pub use split::DatasetSplit;
// Items from `transform` that are re-exported in every build.
pub use transform::{
Cast, Chain, Drop, FillNull, FillStrategy, Filter, Map, NormMethod, Normalize, Rename, Select,
Skip, Sort, SortOrder, Take, Transform, Unique,
};
// Additional `transform` items re-exported only with the `shuffle` feature.
#[cfg(feature = "shuffle")]
pub use transform::{Fim, FimFormat, FimTokens, Sample, Shuffle};
pub use tui::{DatasetAdapter, DatasetViewer, RowDetailView, SchemaInspector, TuiError, TuiResult};
// Same `shuffle` gate as the `weighted` module declaration.
#[cfg(feature = "shuffle")]
pub use weighted::WeightedDataLoader;