// Crate-wide lint configuration.
// NOTE(review): the reason for allowing `deprecated` across the whole crate is not visible
// here — confirm which deprecated items are still used and whether the allowance can be
// narrowed to the items that need it.
1#![allow(deprecated)]
// Emit a warning for every public item that has no documentation.
2#![warn(missing_docs)]
121
// Public submodules of the crate, declared in alphabetical order.
// Items from most of them are re-exported at the crate root by the `pub use` declarations
// further down; `error` and `time_series` have no re-export in the visible part of this
// file and are reached through their module paths.
122pub mod advanced_generators;
123pub mod benchmarks;
124pub mod cache;
125pub mod cloud;
126pub mod distributed;
127pub mod domain_specific;
128pub mod error;
129pub mod explore;
130pub mod external;
131pub mod generators;
132pub mod gpu;
133pub mod gpu_optimization;
134pub mod loaders;
135pub mod ml_integration;
136pub mod real_world;
137pub mod registry;
138pub mod sample;
139pub mod streaming;
140pub mod time_series;
141pub mod toy;
142pub mod utils;
147
// Public module; none of its items are re-exported in the visible part of this file.
148pub mod stability;
153
// Private module (declared without `pub`), so it is not part of the crate's public API.
// NOTE(review): no `#[cfg(test)]` gate is visible on this declaration even though the name
// suggests test code — confirm whether it is meant to be compiled in non-test builds.
154mod method_resolution_test;
156
// Further public modules, declared separately from the alphabetical list above.
// Each of them has selected items re-exported at the crate root by the `pub use`
// declarations below.
157pub mod adaptive_streaming_engine;
158pub mod neuromorphic_data_processor;
159pub mod quantum_enhanced_generators;
160pub mod quantum_neuromorphic_fusion;
161
162pub use adaptive_streaming_engine::{
164 create_adaptive_engine, create_adaptive_engine_with_config, AdaptiveStreamConfig,
165 AdaptiveStreamingEngine, AlertSeverity, AlertType, ChunkMetadata, DataCharacteristics,
166 MemoryStrategy, PatternType, PerformanceMetrics, QualityAlert, QualityMetrics,
167 StatisticalMoments, StreamChunk, TrendDirection, TrendIndicators,
168};
169pub use advanced_generators::{
170 make_adversarial_examples, make_anomaly_dataset, make_continual_learning_dataset,
171 make_domain_adaptation_dataset, make_few_shot_dataset, make_multitask_dataset,
172 AdversarialConfig, AnomalyConfig, AnomalyType, AttackMethod, ContinualLearningDataset,
173 DomainAdaptationConfig, DomainAdaptationDataset, FewShotDataset, MultiTaskConfig,
174 MultiTaskDataset, TaskType,
175};
176pub use benchmarks::{BenchmarkResult, BenchmarkRunner, BenchmarkSuite, PerformanceComparison};
177pub use cloud::{
178 presets::{azure_client, gcs_client, public_s3_client, s3_client, s3_compatible_client},
179 public_datasets::{AWSOpenData, AzureOpenData, GCPPublicData},
180 CloudClient, CloudConfig, CloudCredentials, CloudProvider,
181};
182pub use distributed::{DistributedConfig, DistributedProcessor, ScalingMethod, ScalingParameters};
183pub use domain_specific::{
184 astronomy::StellarDatasets,
185 climate::ClimateDatasets,
186 convenience::{
187 list_domain_datasets, load_atmospheric_chemistry, load_climate_data, load_exoplanets,
188 load_gene_expression, load_stellar_classification,
189 },
190 genomics::GenomicsDatasets,
191 DomainConfig, QualityFilters,
192};
193pub use explore::{
194 convenience::{explore, export_summary, info, quick_summary},
195 DatasetExplorer, DatasetSummary, ExploreConfig, FeatureStatistics, InferredDataType,
196 OutputFormat, QualityAssessment,
197};
// These two `_sync` loaders are re-exported only when the `download` feature is disabled.
198#[cfg(not(feature = "download"))]
199pub use external::convenience::{load_github_dataset_sync, load_uci_dataset_sync};
// The following `external` items are re-exported regardless of the `download` feature.
200pub use external::{
201 convenience::{list_uci_datasets, load_from_url_sync},
202 repositories::{GitHubRepository, KaggleRepository, UCIRepository},
203 ExternalClient, ExternalConfig, ProgressCallback,
204};
// Crate-root re-exports from `ml_integration`.
// `ScalingMethod` is exposed under the alias `MLScalingMethod` because the crate root also
// re-exports a `ScalingMethod` from `distributed`; the alias keeps the two names distinct.
205pub use ml_integration::{
206 convenience::{create_experiment, cv_split, prepare_for_ml, train_test_split},
207 CrossValidationResults, DataSplit, MLExperiment, MLPipeline, MLPipelineConfig,
208 ScalingMethod as MLScalingMethod,
209};
210
211pub use cache::{
212 get_cachedir, BatchOperations, BatchResult, CacheFileInfo, CacheManager, CacheStats,
213 DatasetCache, DetailedCacheStats,
214};
// Re-exported only when the `download` feature is enabled. The complementary
// `not(feature = "download")` gate earlier in this file exposes the `_sync`-suffixed
// GitHub/UCI loaders instead.
215#[cfg(feature = "download")]
216pub use external::convenience::{load_from_url, load_github_dataset, load_uci_dataset};
217pub use generators::{
218 add_time_series_noise, benchmark_gpu_vs_cpu, get_gpu_info, gpu_is_available,
219 inject_missing_data, inject_outliers, make_anisotropic_blobs, make_blobs, make_blobs_gpu,
220 make_circles, make_classification, make_classification_gpu, make_corrupted_dataset, make_helix,
221 make_hierarchical_clusters, make_intersecting_manifolds, make_manifold, make_moons,
222 make_regression, make_regression_gpu, make_s_curve, make_severed_sphere, make_spirals,
223 make_swiss_roll, make_swiss_roll_advanced, make_time_series, make_torus, make_twin_peaks,
224 ManifoldConfig, ManifoldType, MissingPattern, OutlierType,
225};
226pub use gpu::{
227 get_optimal_gpu_config, is_cuda_available, is_opencl_available, list_gpu_devices,
228 make_blobs_auto_gpu, make_classification_auto_gpu, make_regression_auto_gpu, GpuBackend,
229 GpuBenchmark, GpuBenchmarkResults, GpuConfig, GpuContext, GpuDeviceInfo, GpuMemoryConfig,
230};
// Crate-root re-exports from `gpu_optimization`.
// `BenchmarkResult` is exposed under the alias `AdvancedBenchmarkResult` because the crate
// root already re-exports a `BenchmarkResult` from `benchmarks`.
231pub use gpu_optimization::{
232 benchmark_advanced_performance, generate_advanced_matrix, AdvancedGpuOptimizer,
233 AdvancedKernelConfig, BenchmarkResult as AdvancedBenchmarkResult, DataLayout,
234 LoadBalancingMethod, MemoryAccessPattern, PerformanceBenchmarkResults, SpecializationLevel,
235 VectorizationStrategy,
236};
237pub use loaders::{
238 load_csv, load_csv_legacy, load_csv_parallel, load_csv_streaming, load_json, load_raw,
239 save_json, CsvConfig, DatasetChunkIterator, StreamingConfig,
240};
241pub use neuromorphic_data_processor::{
242 create_neuromorphic_processor, create_neuromorphic_processor_with_topology, NetworkTopology,
243 NeuromorphicProcessor, NeuromorphicTransform, SynapticPlasticity,
244};
245pub use quantum_enhanced_generators::{
246 make_quantum_blobs, make_quantum_classification, make_quantum_regression,
247 QuantumDatasetGenerator,
248};
249pub use quantum_neuromorphic_fusion::{
250 create_fusion_with_params, create_quantum_neuromorphic_fusion, QuantumBioFusionResult,
251 QuantumInterference, QuantumNeuromorphicFusion,
252};
253pub use real_world::{
254 list_real_world_datasets, load_adult, load_california_housing, load_heart_disease,
255 load_red_wine_quality, load_titanic, RealWorldConfig, RealWorldDatasets,
256};
257pub use registry::{get_registry, load_dataset_byname, DatasetMetadata, DatasetRegistry};
// Glob re-export: every public item of `sample` is made available at the crate root.
258pub use sample::*;
259pub use streaming::{
260 stream_classification, stream_csv, stream_regression, DataChunk, StreamConfig, StreamProcessor,
261 StreamStats, StreamTransformer, StreamingIterator,
262};
// Glob re-export: every public item of `toy` is made available at the crate root.
263pub use toy::*;
264pub use utils::{
265 analyze_dataset_advanced, create_balanced_dataset, create_binned_features,
266 generate_synthetic_samples, importance_sample, k_fold_split, min_max_scale,
267 polynomial_features, quick_quality_assessment, random_oversample, random_sample,
268 random_undersample, robust_scale, statistical_features, stratified_k_fold_split,
269 stratified_sample, time_series_split, AdvancedDatasetAnalyzer, AdvancedQualityMetrics,
270 BalancingStrategy, BinningStrategy, CorrelationInsights, CrossValidationFolds, Dataset,
271 NormalityAssessment,
272};