pub struct DataProfiler { /* private fields */ }
Expand description
Data profiler
Implementations§
Source§impl DataProfiler
impl DataProfiler
Sourcepub fn infer_data_type(&self, data: &[String]) -> DataType
pub fn infer_data_type(&self, data: &[String]) -> DataType
Infer data type from sample values
Sourcepub fn get_value_frequencies(&self, data: &[String]) -> Vec<ValueFrequency>
pub fn get_value_frequencies(&self, data: &[String]) -> Vec<ValueFrequency>
Get value frequencies
Sourcepub fn calculate_length_stats(&self, data: &[String]) -> LengthStats
pub fn calculate_length_stats(&self, data: &[String]) -> LengthStats
Calculate length statistics
Sourcepub fn calculate_numeric_stats(&self, data: &[String]) -> Option<NumericStats>
pub fn calculate_numeric_stats(&self, data: &[String]) -> Option<NumericStats>
Calculate numeric statistics
Sourcepub fn calculate_date_stats(&self, data: &[String]) -> Option<DateStats>
pub fn calculate_date_stats(&self, data: &[String]) -> Option<DateStats>
Calculate date statistics
Sourcepub fn calculate_text_stats(&self, data: &[String]) -> TextStats
pub fn calculate_text_stats(&self, data: &[String]) -> TextStats
Calculate text statistics
Source§impl DataProfiler
impl DataProfiler
Sourcepub fn with_max_distinct_values(self, max: usize) -> Self
pub fn with_max_distinct_values(self, max: usize) -> Self
Set maximum distinct values to track
Sourcepub fn with_sample_size(self, size: usize) -> Self
pub fn with_sample_size(self, size: usize) -> Self
Set sample size for large datasets
Source§impl DataProfiler
impl DataProfiler
Sourcepub fn calculate_column_quality_score(
&self,
null_percentage: f64,
unique_percentage: f64,
data_type: &DataType,
length_stats: Option<&LengthStats>,
numeric_stats: Option<&NumericStats>,
) -> f64
pub fn calculate_column_quality_score( &self, null_percentage: f64, unique_percentage: f64, data_type: &DataType, length_stats: Option<&LengthStats>, numeric_stats: Option<&NumericStats>, ) -> f64
Calculate column quality score
Sourcepub fn calculate_overall_quality_score(
&self,
columns: &[ColumnProfile],
null_percentage: f64,
duplicate_percentage: f64,
) -> f64
pub fn calculate_overall_quality_score( &self, columns: &[ColumnProfile], null_percentage: f64, duplicate_percentage: f64, ) -> f64
Calculate overall quality score
Sourcepub fn generate_recommendations(
&self,
columns: &[ColumnProfile],
null_percentage: f64,
duplicate_percentage: f64,
) -> Vec<String>
pub fn generate_recommendations( &self, columns: &[ColumnProfile], null_percentage: f64, duplicate_percentage: f64, ) -> Vec<String>
Generate data quality recommendations
Sourcepub fn generate_report(&self, profile: &DataProfile) -> String
pub fn generate_report(&self, profile: &DataProfile) -> String
Generate a human-readable profile report
Trait Implementations§
Auto Trait Implementations§
impl Freeze for DataProfiler
impl RefUnwindSafe for DataProfiler
impl Send for DataProfiler
impl Sync for DataProfiler
impl Unpin for DataProfiler
impl UnsafeUnpin for DataProfiler
impl UnwindSafe for DataProfiler
Blanket Implementations§
Source§impl<T> BorrowMut<T> for T
where
    T: ?Sized,
impl<T> BorrowMut<T> for T
where
    T: ?Sized,
Source§fn borrow_mut(&mut self) -> &mut T
fn borrow_mut(&mut self) -> &mut T
Mutably borrows from an owned value. Read more
Source§impl<T> Instrument for T
impl<T> Instrument for T
Source§fn instrument(self, span: Span) -> Instrumented<Self>
fn instrument(self, span: Span) -> Instrumented<Self>
Source§fn in_current_span(self) -> Instrumented<Self>
fn in_current_span(self) -> Instrumented<Self>
Source§impl<T> IntoEither for T
impl<T> IntoEither for T
Source§fn into_either(self, into_left: bool) -> Either<Self, Self>
fn into_either(self, into_left: bool) -> Either<Self, Self>
Converts `self` into a `Left` variant of `Either<Self, Self>` if `into_left` is `true`. Converts `self` into a `Right` variant of `Either<Self, Self>` otherwise. Read more
Source§fn into_either_with<F>(self, into_left: F) -> Either<Self, Self>
fn into_either_with<F>(self, into_left: F) -> Either<Self, Self>
Converts `self` into a `Left` variant of `Either<Self, Self>` if `into_left(&self)` returns `true`. Converts `self` into a `Right` variant of `Either<Self, Self>` otherwise. Read more