#[cfg(not(feature = "std"))]
use alloc::vec::Vec;
#[cfg(feature = "std")]
use std::vec::Vec;
use core::fmt::Debug;
use crate::algorithms::regression::{PolynomialDegree, SolverLinalg, ZeroWeightFallback};
use crate::algorithms::robustness::RobustnessMethod;
use crate::engine::executor::{
CVPassFn, FitPassFn, IntervalPassFn, KDTreeBuilderFn, LoessConfig, LoessExecutor, SmoothPassFn,
SurfaceMode, VertexPassFn,
};
use crate::engine::output::LoessResult;
use crate::engine::validator::Validator;
use crate::evaluation::cv::CVKind;
use crate::evaluation::diagnostics::Diagnostics;
use crate::evaluation::intervals::IntervalMethod;
use crate::math::boundary::BoundaryPolicy;
use crate::math::distance::{DistanceLinalg, DistanceMetric};
use crate::math::hat_matrix::HatMatrixStats;
use crate::math::kernel::WeightFunction;
use crate::math::linalg::FloatLinalg;
use crate::math::scaling::ScalingMethod;
use crate::primitives::backend::Backend;
use crate::primitives::errors::LoessError;
#[derive(Debug, Clone)]
pub struct BatchLoessBuilder<T: FloatLinalg + DistanceLinalg + SolverLinalg> {
pub fraction: T,
pub iterations: usize,
pub weight_function: WeightFunction,
pub robustness_method: RobustnessMethod,
pub scaling_method: ScalingMethod,
pub interval_type: Option<IntervalMethod<T>>,
pub cv_fractions: Option<Vec<T>>,
pub cv_kind: Option<CVKind>,
pub cv_seed: Option<u64>,
pub deferred_error: Option<LoessError>,
pub auto_converge: Option<T>,
pub return_diagnostics: bool,
pub compute_residuals: bool,
pub return_robustness_weights: bool,
pub zero_weight_fallback: ZeroWeightFallback,
pub boundary_policy: BoundaryPolicy,
pub polynomial_degree: PolynomialDegree,
pub dimensions: usize,
pub distance_metric: DistanceMetric<T>,
pub cell: Option<f64>,
pub interpolation_vertices: Option<usize>,
pub surface_mode: SurfaceMode,
pub boundary_degree_fallback: bool,
#[doc(hidden)]
pub(crate) duplicate_param: Option<&'static str>,
#[doc(hidden)]
pub custom_smooth_pass: Option<SmoothPassFn<T>>,
#[doc(hidden)]
pub custom_cv_pass: Option<CVPassFn<T>>,
#[doc(hidden)]
pub custom_interval_pass: Option<IntervalPassFn<T>>,
#[doc(hidden)]
pub custom_fit_pass: Option<FitPassFn<T>>,
#[doc(hidden)]
pub custom_vertex_pass: Option<VertexPassFn<T>>,
#[doc(hidden)]
pub custom_kdtree_builder: Option<KDTreeBuilderFn<T>>,
#[doc(hidden)]
pub backend: Option<Backend>,
#[doc(hidden)]
pub parallel: Option<bool>,
}
impl<T: FloatLinalg + DistanceLinalg + Debug + Send + Sync + SolverLinalg> Default
for BatchLoessBuilder<T>
{
fn default() -> Self {
Self::new()
}
}
impl<T: FloatLinalg + DistanceLinalg + Debug + Send + Sync + SolverLinalg> BatchLoessBuilder<T> {
fn new() -> Self {
Self {
fraction: T::from(0.67).unwrap(),
iterations: 3,
weight_function: WeightFunction::default(),
robustness_method: RobustnessMethod::default(),
scaling_method: ScalingMethod::default(),
interval_type: None,
cv_fractions: None,
cv_kind: None,
cv_seed: None,
deferred_error: None,
auto_converge: None,
return_diagnostics: false,
compute_residuals: false,
return_robustness_weights: false,
zero_weight_fallback: ZeroWeightFallback::default(),
boundary_policy: BoundaryPolicy::default(),
polynomial_degree: PolynomialDegree::default(),
dimensions: 1,
distance_metric: DistanceMetric::default(),
cell: None,
interpolation_vertices: None,
surface_mode: SurfaceMode::default(),
boundary_degree_fallback: true,
duplicate_param: None,
custom_smooth_pass: None,
custom_cv_pass: None,
custom_interval_pass: None,
custom_fit_pass: None,
custom_vertex_pass: None,
custom_kdtree_builder: None,
parallel: None,
backend: None,
}
}
pub fn fraction(mut self, fraction: T) -> Self {
self.fraction = fraction;
self
}
pub fn iterations(mut self, iterations: usize) -> Self {
self.iterations = iterations;
self
}
pub fn weight_function(mut self, wf: WeightFunction) -> Self {
self.weight_function = wf;
self
}
pub fn robustness_method(mut self, method: RobustnessMethod) -> Self {
self.robustness_method = method;
self
}
pub fn scaling_method(mut self, method: ScalingMethod) -> Self {
self.scaling_method = method;
self
}
pub fn zero_weight_fallback(mut self, fallback: ZeroWeightFallback) -> Self {
self.zero_weight_fallback = fallback;
self
}
pub fn boundary_policy(mut self, policy: BoundaryPolicy) -> Self {
self.boundary_policy = policy;
self
}
pub fn polynomial_degree(mut self, degree: PolynomialDegree) -> Self {
self.polynomial_degree = degree;
self
}
pub fn dimensions(mut self, dims: usize) -> Self {
self.dimensions = dims;
self
}
pub fn distance_metric(mut self, metric: DistanceMetric<T>) -> Self {
self.distance_metric = metric;
self
}
pub fn surface_mode(mut self, mode: SurfaceMode) -> Self {
self.surface_mode = mode;
self
}
pub fn cell(mut self, cell: f64) -> Self {
self.cell = Some(cell);
self
}
pub fn interpolation_vertices(mut self, vertices: usize) -> Self {
self.interpolation_vertices = Some(vertices);
self
}
pub fn boundary_degree_fallback(mut self, enabled: bool) -> Self {
self.boundary_degree_fallback = enabled;
self
}
pub fn auto_converge(mut self, tolerance: T) -> Self {
self.auto_converge = Some(tolerance);
self
}
pub fn compute_residuals(mut self, enabled: bool) -> Self {
self.compute_residuals = enabled;
self
}
pub fn return_robustness_weights(mut self, enabled: bool) -> Self {
self.return_robustness_weights = enabled;
self
}
pub fn return_diagnostics(mut self, enabled: bool) -> Self {
self.return_diagnostics = enabled;
self
}
pub fn confidence_intervals(mut self, level: T) -> Self {
self.interval_type = Some(IntervalMethod::confidence(level));
self
}
pub fn prediction_intervals(mut self, level: T) -> Self {
self.interval_type = Some(IntervalMethod::prediction(level));
self
}
pub fn cross_validate(mut self, fractions: Vec<T>) -> Self {
self.cv_fractions = Some(fractions);
self
}
pub fn cv_kind(mut self, kind: CVKind) -> Self {
self.cv_kind = Some(kind);
self
}
pub fn cv_seed(mut self, seed: u64) -> Self {
self.cv_seed = Some(seed);
self
}
pub fn return_se(mut self, enabled: bool) -> Self {
if enabled {
self.interval_type = Some(IntervalMethod::se());
} else if let Some(method) = self.interval_type {
if method.se && !method.confidence && !method.prediction {
self.interval_type = None;
}
}
self
}
#[doc(hidden)]
pub fn custom_smooth_pass(mut self, pass: SmoothPassFn<T>) -> Self {
self.custom_smooth_pass = Some(pass);
self
}
#[doc(hidden)]
pub fn custom_cv_pass(mut self, pass: CVPassFn<T>) -> Self {
self.custom_cv_pass = Some(pass);
self
}
#[doc(hidden)]
pub fn custom_interval_pass(mut self, pass: IntervalPassFn<T>) -> Self {
self.custom_interval_pass = Some(pass);
self
}
#[doc(hidden)]
pub fn backend(mut self, backend: Backend) -> Self {
self.backend = Some(backend);
self
}
#[doc(hidden)]
pub fn custom_kdtree_builder(mut self, kdtree_builder_fn: Option<KDTreeBuilderFn<T>>) -> Self {
self.custom_kdtree_builder = kdtree_builder_fn;
self
}
#[doc(hidden)]
pub fn parallel(mut self, parallel: bool) -> Self {
self.parallel = Some(parallel);
self
}
pub fn build(self) -> Result<BatchLoess<T>, LoessError> {
if let Some(err) = self.deferred_error {
return Err(err);
}
Validator::validate_no_duplicates(self.duplicate_param)?;
Validator::validate_fraction(self.fraction)?;
Validator::validate_iterations(self.iterations)?;
if let Some(ref method) = self.interval_type {
Validator::validate_interval_level(method.level)?;
}
if let Some(ref fracs) = self.cv_fractions {
Validator::validate_cv_fractions(fracs)?;
}
if let Some(CVKind::KFold(k)) = self.cv_kind {
Validator::validate_kfold(k)?;
}
if let Some(tol) = self.auto_converge {
Validator::validate_tolerance(tol)?;
}
Ok(BatchLoess { config: self })
}
}
#[derive(Clone)]
pub struct BatchLoess<T: FloatLinalg + DistanceLinalg + SolverLinalg> {
config: BatchLoessBuilder<T>,
}
impl<T: FloatLinalg + DistanceLinalg + Debug + Send + Sync + 'static + SolverLinalg> BatchLoess<T> {
pub fn fit(self, x: &[T], y: &[T]) -> Result<LoessResult<T>, LoessError> {
Validator::validate_inputs(x, y, self.config.dimensions)?;
if self.config.surface_mode == SurfaceMode::Interpolation {
let n = y.len();
let cell_to_use = self.config.cell.unwrap_or(0.2);
let limit = self.config.interpolation_vertices.unwrap_or(n);
let cell_provided = self.config.cell.is_some();
let limit_provided = self.config.interpolation_vertices.is_some();
Validator::validate_interpolation_grid(
T::from(cell_to_use).unwrap_or_else(|| T::from(0.2).unwrap()),
self.config.fraction,
self.config.dimensions,
limit,
cell_provided,
limit_provided,
)?;
}
let config = LoessConfig {
fraction: Some(self.config.fraction),
iterations: self.config.iterations,
weight_function: self.config.weight_function,
zero_weight_fallback: self.config.zero_weight_fallback,
robustness_method: self.config.robustness_method,
scaling_method: self.config.scaling_method,
cv_fractions: self.config.cv_fractions,
cv_kind: self.config.cv_kind,
auto_converge: self.config.auto_converge,
return_variance: self.config.interval_type,
boundary_policy: self.config.boundary_policy,
polynomial_degree: self.config.polynomial_degree,
dimensions: self.config.dimensions,
distance_metric: self.config.distance_metric.clone(),
cv_seed: self.config.cv_seed,
surface_mode: self.config.surface_mode,
interpolation_vertices: self.config.interpolation_vertices,
cell: self.config.cell,
boundary_degree_fallback: self.config.boundary_degree_fallback,
custom_smooth_pass: self.config.custom_smooth_pass,
custom_cv_pass: self.config.custom_cv_pass,
custom_interval_pass: self.config.custom_interval_pass,
custom_fit_pass: self.config.custom_fit_pass,
custom_vertex_pass: self.config.custom_vertex_pass,
custom_kdtree_builder: self.config.custom_kdtree_builder,
parallel: self.config.parallel.unwrap_or(false),
backend: self.config.backend,
};
let result = LoessExecutor::run_with_config(x, y, config);
let y_smooth = result.smoothed;
let std_errors = result.std_errors;
let iterations_used = result.iterations;
let fraction_used = result.used_fraction;
let cv_scores = result.cv_scores;
let residuals: Vec<T> = y
.iter()
.zip(y_smooth.iter())
.map(|(&orig, &smoothed_val)| orig - smoothed_val)
.collect();
let rob_weights = if self.config.return_robustness_weights {
result.robustness_weights
} else {
Vec::new()
};
let diagnostics = if self.config.return_diagnostics {
Some(Diagnostics::compute(
y,
&y_smooth,
&residuals,
std_errors.as_deref(),
))
} else {
None
};
let (enp, trace_hat, delta1, delta2, residual_scale, leverage_out) =
if let Some(lev) = result.leverage {
let stats = HatMatrixStats::from_leverage(lev);
let rss = residuals.iter().fold(T::zero(), |acc, &r| acc + r * r);
let res_scale = stats.compute_residual_scale(rss);
(
Some(stats.trace),
Some(stats.trace),
Some(stats.delta1),
Some(stats.delta2),
Some(res_scale),
Some(stats.leverage),
)
} else {
(None, None, None, None, None, None)
};
let (conf_lower, conf_upper, pred_lower, pred_upper) =
if let Some(method) = &self.config.interval_type {
if let Some(se) = &std_errors {
method.compute_intervals(&y_smooth, se, &residuals, delta1, delta2)?
} else {
(None, None, None, None)
}
} else {
(None, None, None, None)
};
let residuals_out = if self.config.compute_residuals {
Some(residuals)
} else {
None
};
let rob_weights_out = if self.config.return_robustness_weights {
Some(rob_weights)
} else {
None
};
Ok(LoessResult {
x: x.to_vec(),
dimensions: self.config.dimensions,
distance_metric: self.config.distance_metric.clone(),
polynomial_degree: self.config.polynomial_degree,
y: y_smooth,
standard_errors: std_errors,
confidence_lower: conf_lower,
confidence_upper: conf_upper,
prediction_lower: pred_lower,
prediction_upper: pred_upper,
residuals: residuals_out,
robustness_weights: rob_weights_out,
fraction_used,
iterations_used,
cv_scores,
diagnostics,
enp,
trace_hat,
delta1,
delta2,
residual_scale,
leverage: leverage_out,
})
}
}