Re-exports§
pub use caption::caption_file_exists_and_not_empty;
pub use caption::format_text_content;
pub use caption::json_to_text;
pub use caption::process_file;
pub use caption::replace_special_chars;
pub use caption::replace_string;
pub use core::TrainingFormat;
pub use core::TrainingSample;
pub use core::TrainingDataset;
pub use core::DatasetStats;
pub use core::BCOSample;
pub use core::BCODataset;
pub use core::DPOSample;
pub use core::DPODataset;
pub use core::PPOSample;
pub use core::PPODataset;
pub use core::SFTSample;
pub use core::SFTDataset;
pub use core::DatasetQualityReport;
pub use core::GenericJSONDataset;
Modules§
Structs§
- HfDatasetConfig - Configuration for HuggingFace dataset processing
- HfProcessor - Main processor for HuggingFace datasets
- HuggingFaceDataset - Real HuggingFace dataset loader with Hub API integration