use rclean::{PatternType, WalkOptions};
/// Example entry point: analyses the current directory (`"."`) with `rclean`,
/// prints the number of rows in the returned frame plus its statistics,
/// validates the result, and then runs a second pass through
/// `rclean::run_with_similarity`.
///
/// # Errors
///
/// Propagates the error from `rclean::run_with_advanced_options` or
/// `rclean::run_with_similarity` if either call fails. Failures of
/// `rclean::generate_statistics` and `rclean::validate_duplicates` are
/// reported on stderr and do not abort the example.
fn main() -> Result<(), Box<dyn std::error::Error>> {
    // NOTE(review): the banner says "RDedupe" while the crate is imported as
    // `rclean` — confirm which name is intended.
    println!("RDedupe DataFrame Analysis Example\n");

    // Empty literal pattern — presumably matches every file; confirm against
    // the `PatternType` documentation.
    let pattern = PatternType::Literal(String::new());
    let walk_options = WalkOptions {
        include_hidden: false,
        respect_gitignore: true,
        respect_ignore: true,
        max_depth: None,
    };

    println!("Analyzing current directory for duplicates...\n");
    // The trailing `None` leaves the last optional argument unset; its meaning
    // is defined by `rclean` and is not visible from this file.
    let df = rclean::run_with_advanced_options(".", &pattern, &walk_options, None)?;

    println!("Analysis complete!");
    println!("Total files analyzed: {}", df.height());

    // Statistics are best-effort: a failure is reported but does not stop the
    // example, mirroring how validation errors are handled below.
    match rclean::generate_statistics(&df) {
        Ok(stats_df) => {
            println!("\n=== Statistics ===");
            println!("{}", stats_df);
        }
        Err(e) => eprintln!("Statistics error: {}", e),
    }

    if let Err(e) = rclean::validate_duplicates(&df) {
        eprintln!("Validation error: {}", e);
    }

    println!("\n=== Similarity Analysis ===");
    println!("Running similarity analysis with 70% threshold...");
    // Only success or failure matters here; the returned value is intentionally
    // discarded. `70` is the threshold announced in the message above.
    let _similar_df = rclean::run_with_similarity(".", &pattern, &walk_options, 70, None)?;
    println!("Similarity analysis complete!");

    Ok(())
}