Skip to main content

scirs2_optimize/global/
bayesian.rs

1//! Bayesian optimization for global optimization of expensive-to-evaluate functions
2//!
3//! Bayesian optimization uses a surrogate model (usually Gaussian Process) to
4//! model the underlying objective function, and acquisition functions to determine
5//! the next points to evaluate, balancing exploration and exploitation.
6//!
7//! # Example
8//!
9//! ```
10//! use scirs2_core::ndarray::{array, ArrayView1};
11//! use scirs2_optimize::global::{bayesian_optimization, BayesianOptimizationOptions};
12//!
13//! // Define objective function (simple sphere)
14//! fn objective(x: &ArrayView1<f64>) -> f64 {
15//!     x[0].powi(2) + x[1].powi(2)
16//! }
17//!
18//! // Define search space
19//! let bounds = vec![(-2.0, 2.0), (-2.0, 2.0)];
20//!
21//! // Create optimizer options with more evaluations
22//! let mut options = BayesianOptimizationOptions::default();
23//! options.n_initial_points = 5;
24//!
25//! // Run optimization with more iterations
26//! let result = bayesian_optimization(objective, bounds, 30, Some(options)).expect("Operation failed");
27//!
28//! // Check result - should find a good solution
29//! assert!(result.success);
30//! println!("Best value found: {}", result.fun);
31//! # Ok::<(), scirs2_optimize::error::OptimizeError>(())
32//! ```
33
34use std::fmt;
35
36use scirs2_core::ndarray::{Array1, Array2, ArrayView1};
37use scirs2_core::random::rngs::StdRng;
38use scirs2_core::random::SeedableRng;
39use scirs2_core::random::{Rng, RngExt};
40use scirs2_stats::gaussian_process::{GaussianProcessRegressor, SquaredExponential};
41
42use crate::error::OptimizeError;
43use crate::parallel::ParallelOptions;
44use crate::unconstrained::{minimize, Method, OptimizeResult, Options};
45
/// Wrapper for GaussianProcessRegressor to provide friedrich-compatible API
struct GaussianProcess {
    // Fitted regressor backing all predictions (squared-exponential kernel).
    regressor: GaussianProcessRegressor<SquaredExponential>,
    // Number of input features; used to reshape flat query points into (1, n_features).
    n_features: usize,
}
51
52impl GaussianProcess {
53    /// Create a new GP from training data (friedrich-compatible API)
54    fn default(x_data: Vec<Vec<f64>>, y_data: Vec<f64>) -> Self {
55        let n_samples = x_data.len();
56        let n_features = if n_samples > 0 { x_data[0].len() } else { 0 };
57
58        // Convert Vec<Vec<f64>> to Array2
59        let mut x_flat = Vec::with_capacity(n_samples * n_features);
60        for row in &x_data {
61            x_flat.extend_from_slice(row);
62        }
63        let x_array =
64            Array2::from_shape_vec((n_samples, n_features), x_flat).expect("Operation failed");
65        let y_array = Array1::from_vec(y_data);
66
67        // Create and fit the regressor
68        let kernel = SquaredExponential::default();
69        let mut regressor = GaussianProcessRegressor::new(kernel);
70        regressor.fit(&x_array, &y_array).expect("Operation failed");
71
72        Self {
73            regressor,
74            n_features,
75        }
76    }
77
78    /// Predict mean at a single point (friedrich-compatible API)
79    fn predict(&self, x: &Vec<f64>) -> f64 {
80        let x_array =
81            Array2::from_shape_vec((1, self.n_features), x.clone()).expect("Operation failed");
82        let predictions = self.regressor.predict(&x_array).expect("Operation failed");
83        predictions[0]
84    }
85
86    /// Predict variance at a single point (friedrich-compatible API)
87    fn predict_variance(&self, x: &Vec<f64>) -> f64 {
88        let x_array =
89            Array2::from_shape_vec((1, self.n_features), x.clone()).expect("Operation failed");
90        let (_mean, std) = self
91            .regressor
92            .predict_with_std(&x_array)
93            .expect("Operation failed");
94        std[0] * std[0] // return variance (std²)
95    }
96}
97
/// Parameter types for search space
#[derive(Debug, Clone)]
pub enum Parameter {
    /// Continuous parameter with lower and upper bounds
    Real(f64, f64),
    /// Integer parameter with inclusive lower and upper bounds
    Integer(i64, i64),
    /// Categorical parameter with the list of possible values
    Categorical(Vec<String>),
}
108
/// Search space for parameters
#[derive(Debug, Clone)]
pub struct Space {
    /// Parameters with names, in insertion order
    parameters: Vec<(String, Parameter)>,
    /// Dimensionality after transformation (categoricals expand to one-hot)
    transformed_n_dims: usize,
    /// Per-parameter (lower, upper) bounds in the original space; categoricals use (0.0, 1.0)
    bounds: Vec<(f64, f64)>,
}
119
120impl Space {
121    /// Create a new search space
122    pub fn new() -> Self {
123        Self {
124            parameters: Vec::new(),
125            transformed_n_dims: 0,
126            bounds: Vec::new(),
127        }
128    }
129
130    /// Add a parameter to the search space
131    pub fn add<S: Into<String>>(mut self, name: S, parameter: Parameter) -> Self {
132        let name = name.into();
133
134        // Update transformed dimensionality
135        self.transformed_n_dims += match &parameter {
136            Parameter::Real(_, _) => 1,
137            Parameter::Integer(_, _) => 1,
138            Parameter::Categorical(values) => values.len(),
139        };
140
141        // Add bounds for this parameter
142        let bounds = match &parameter {
143            Parameter::Real(lower, upper) => (*lower, *upper),
144            Parameter::Integer(lower, upper) => (*lower as f64, *upper as f64),
145            Parameter::Categorical(_) => (0.0, 1.0),
146        };
147        self.bounds.push(bounds);
148
149        self.parameters.push((name, parameter));
150        self
151    }
152
153    /// Get number of dimensions in the original space
154    pub fn n_dims(&self) -> usize {
155        self.parameters.len()
156    }
157
158    /// Get number of dimensions in the transformed space
159    pub fn transformed_n_dims(&self) -> usize {
160        self.transformed_n_dims
161    }
162
163    /// Return dimension types for use with `BayesianOptimizer::set_dimension_types`.
164    pub fn dimension_types(&self) -> Vec<crate::bayesian::optimizer::DimensionType> {
165        use crate::bayesian::optimizer::DimensionType;
166        self.parameters
167            .iter()
168            .map(|(_, param)| match param {
169                Parameter::Integer(_, _) => DimensionType::Integer,
170                _ => DimensionType::Continuous,
171            })
172            .collect()
173    }
174
175    /// Sample random points from the space
176    pub fn sample(&self, n_samples: usize, rng: &mut StdRng) -> Vec<Array1<f64>> {
177        let n_dims = self.n_dims();
178        let mut samples = Vec::with_capacity(n_samples);
179
180        for _ in 0..n_samples {
181            let mut sample = Array1::zeros(n_dims);
182
183            for (i, (_, param)) in self.parameters.iter().enumerate() {
184                match param {
185                    Parameter::Real(lower, upper) => {
186                        // Use gen_range directly instead of Uniform distribution
187                        sample[i] = rng.random_range(*lower..*upper);
188                    }
189                    Parameter::Integer(lower, upper) => {
190                        let range = rng.random_range(*lower..=*upper);
191                        sample[i] = range as f64;
192                    }
193                    Parameter::Categorical(values) => {
194                        let index = rng.random_range(0..values.len());
195                        sample[i] = index as f64;
196                    }
197                }
198            }
199
200            samples.push(sample);
201        }
202
203        samples
204    }
205
206    /// Transform a point from the original space to the model space
207    pub fn transform(&self, x: &ArrayView1<f64>) -> Array1<f64> {
208        let mut transformed = Array1::zeros(self.transformed_n_dims);
209        let mut idx = 0;
210
211        for (i, (_, param)) in self.parameters.iter().enumerate() {
212            match param {
213                Parameter::Real(lower, upper) => {
214                    // Scale to [0, 1]
215                    transformed[idx] = (x[i] - lower) / (upper - lower);
216                    idx += 1;
217                }
218                Parameter::Integer(lower, upper) => {
219                    // Scale to [0, 1]
220                    transformed[idx] = (x[i] - *lower as f64) / (*upper as f64 - *lower as f64);
221                    idx += 1;
222                }
223                Parameter::Categorical(values) => {
224                    // One-hot encoding
225                    let index = x[i] as usize;
226                    for j in 0..values.len() {
227                        transformed[idx + j] = if j == index { 1.0 } else { 0.0 };
228                    }
229                    idx += values.len();
230                }
231            }
232        }
233
234        transformed
235    }
236
237    /// Transform a point from the model space back to the original space
238    pub fn inverse_transform(&self, x: &ArrayView1<f64>) -> Array1<f64> {
239        let mut inverse = Array1::zeros(self.n_dims());
240        let mut idx = 0;
241
242        for (i, (_, param)) in self.parameters.iter().enumerate() {
243            match param {
244                Parameter::Real(lower, upper) => {
245                    // Scale from [0, 1] to [lower, upper]
246                    inverse[i] = lower + x[idx] * (upper - lower);
247                    idx += 1;
248                }
249                Parameter::Integer(lower, upper) => {
250                    // Scale from [0, 1] to [lower, upper] and round
251                    let value = lower + (x[idx] * (*upper - *lower) as f64).round() as i64;
252                    inverse[i] = value as f64;
253                    idx += 1;
254                }
255                Parameter::Categorical(values) => {
256                    // Find index of maximum value in one-hot encoding
257                    let mut max_idx = 0;
258                    let mut max_val = x[idx];
259                    for j in 1..values.len() {
260                        if x[idx + j] > max_val {
261                            max_val = x[idx + j];
262                            max_idx = j;
263                        }
264                    }
265                    inverse[i] = max_idx as f64;
266                    idx += values.len();
267                }
268            }
269        }
270
271        inverse
272    }
273
274    /// Convert bounds to format used by the optimizer
275    pub fn bounds_to_vec(&self) -> Vec<(f64, f64)> {
276        self.parameters
277            .iter()
278            .map(|(_, param)| match param {
279                Parameter::Real(lower, upper) => (*lower, *upper),
280                Parameter::Integer(lower, upper) => (*lower as f64, *upper as f64),
281                Parameter::Categorical(_) => (0.0, 1.0), // Will be handled specially
282            })
283            .collect()
284    }
285}
286
impl Default for Space {
    /// An empty search space, equivalent to `Space::new()`.
    fn default() -> Self {
        Self::new()
    }
}
292
293/// Acquisition function trait for Bayesian optimization
294pub trait AcquisitionFunction: Send + Sync {
295    /// Evaluate acquisition function at a point
296    fn evaluate(&self, x: &ArrayView1<f64>) -> f64;
297
298    /// Compute gradient of acquisition function (if available)
299    fn gradient(&self, x: &ArrayView1<f64>) -> Option<Array1<f64>> {
300        None
301    }
302}
303
/// Expected Improvement acquisition function
///
/// Favours points that are likely to improve on the incumbent best value
/// under the GP posterior (minimization form).
pub struct ExpectedImprovement {
    // Surrogate model used for mean/variance predictions
    model: GaussianProcess,
    // Best (lowest) observed objective value so far
    y_best: f64,
    // Exploration parameter; larger values encourage more exploration
    xi: f64,
}
310
impl ExpectedImprovement {
    /// Create a new Expected Improvement acquisition function
    ///
    /// * `model` - fitted GP surrogate
    /// * `y_best` - best (lowest) observed objective value
    /// * `xi` - exploration parameter (larger favours exploration)
    pub fn new(model: GaussianProcess, y_best: f64, xi: f64) -> Self {
        Self { model, y_best, xi }
    }
}
317
318impl AcquisitionFunction for ExpectedImprovement {
319    fn evaluate(&self, x: &ArrayView1<f64>) -> f64 {
320        let mean = self.model.predict(&x.to_vec());
321        let std = (self.model.predict_variance(&x.to_vec())).sqrt();
322
323        if std <= 0.0 {
324            return 0.0;
325        }
326
327        let z = (self.y_best - mean - self.xi) / std;
328        // Use approximation for normal CDF and PDF since erf is unstable
329        let norm_cdf = 0.5 * (1.0 + approx_erf(z * std::f64::consts::SQRT_2 / 2.0));
330        let norm_pdf = (-0.5 * z.powi(2)).exp() / (2.0 * std::f64::consts::PI).sqrt();
331
332        let ei = (self.y_best - mean - self.xi) * norm_cdf + std * norm_pdf;
333
334        if ei < 0.0 {
335            0.0
336        } else {
337            ei
338        }
339    }
340
341    fn gradient(&self, x: &ArrayView1<f64>) -> Option<Array1<f64>> {
342        // For now, use numerical approximation
343        None
344    }
345}
346
/// Lower Confidence Bound acquisition function
pub struct LowerConfidenceBound {
    // Surrogate model used for mean/variance predictions
    model: GaussianProcess,
    // Exploration weight on the predictive standard deviation
    kappa: f64,
}
352
impl LowerConfidenceBound {
    /// Create a new Lower Confidence Bound acquisition function
    ///
    /// * `model` - fitted GP surrogate
    /// * `kappa` - exploration weight on the predictive standard deviation
    pub fn new(model: GaussianProcess, kappa: f64) -> Self {
        Self { model, kappa }
    }
}
359
360impl AcquisitionFunction for LowerConfidenceBound {
361    fn evaluate(&self, x: &ArrayView1<f64>) -> f64 {
362        let mean = self.model.predict(&x.to_vec());
363        let std = (self.model.predict_variance(&x.to_vec())).sqrt();
364
365        mean - self.kappa * std
366    }
367
368    fn gradient(&self, x: &ArrayView1<f64>) -> Option<Array1<f64>> {
369        // For now, use numerical approximation
370        None
371    }
372}
373
/// Probability of Improvement acquisition function
pub struct ProbabilityOfImprovement {
    // Surrogate model used for mean/variance predictions
    model: GaussianProcess,
    // Best (lowest) observed objective value so far
    y_best: f64,
    // Minimum improvement margin; larger values demand bigger gains
    xi: f64,
}
380
impl ProbabilityOfImprovement {
    /// Create a new Probability of Improvement acquisition function
    ///
    /// * `model` - fitted GP surrogate
    /// * `y_best` - best (lowest) observed objective value
    /// * `xi` - minimum improvement margin
    pub fn new(model: GaussianProcess, y_best: f64, xi: f64) -> Self {
        Self { model, y_best, xi }
    }
}
387
388impl AcquisitionFunction for ProbabilityOfImprovement {
389    fn evaluate(&self, x: &ArrayView1<f64>) -> f64 {
390        let mean = self.model.predict(&x.to_vec());
391        let std = (self.model.predict_variance(&x.to_vec())).sqrt();
392
393        if std <= 0.0 {
394            return 0.0;
395        }
396
397        let z = (self.y_best - mean - self.xi) / std;
398        // Use approximation for normal CDF since erf is unstable
399        0.5 * (1.0 + approx_erf(z * std::f64::consts::SQRT_2 / 2.0))
400    }
401
402    fn gradient(&self, x: &ArrayView1<f64>) -> Option<Array1<f64>> {
403        // For now, use numerical approximation
404        None
405    }
406}
407
/// Polynomial approximation of the error function (erf),
/// Abramowitz & Stegun formula 7.1.26 (max absolute error ~1.5e-7).
#[allow(dead_code)]
fn approx_erf(x: f64) -> f64 {
    // A&S 7.1.26 polynomial coefficients, highest degree first.
    const COEFFS: [f64; 5] = [
        1.061405429,
        -1.453152027,
        1.421413741,
        -0.284496736,
        0.254829592,
    ];
    const P: f64 = 0.3275911;

    // The formula is only valid for non-negative arguments; erf is odd,
    // so evaluate at |x| and restore the sign afterwards.
    let sign = if x < 0.0 { -1.0 } else { 1.0 };
    let x = x.abs();

    let t = 1.0 / (1.0 + P * x);
    // Horner evaluation of the degree-5 polynomial in t.
    let poly = COEFFS.iter().fold(0.0, |acc, &c| acc * t + c);
    let y = 1.0 - poly * t * (-x * x).exp();

    sign * y
}
430
/// Acquisition function type enum for option selection
#[derive(Debug, Clone, Copy, Default)]
pub enum AcquisitionFunctionType {
    /// Expected Improvement (default)
    #[default]
    ExpectedImprovement,
    /// Lower Confidence Bound (uses the `kappa` option)
    LowerConfidenceBound,
    /// Probability of Improvement (uses the `xi` option)
    ProbabilityOfImprovement,
}
442
443impl fmt::Display for AcquisitionFunctionType {
444    fn fmt(&self, f: &mut fmt::Formatter) -> fmt::Result {
445        match self {
446            AcquisitionFunctionType::ExpectedImprovement => write!(f, "EI"),
447            AcquisitionFunctionType::LowerConfidenceBound => write!(f, "LCB"),
448            AcquisitionFunctionType::ProbabilityOfImprovement => write!(f, "PI"),
449        }
450    }
451}
452
/// Kernel type enum for option selection
///
/// NOTE(review): `build_model` currently always fits a squared-exponential
/// kernel regardless of this setting — confirm before relying on it.
#[derive(Debug, Clone, Copy, Default)]
pub enum KernelType {
    /// Squared Exponential (default)
    #[default]
    SquaredExponential,
    /// Matérn 5/2
    Matern52,
    /// Matérn 3/2
    Matern32,
}
464
465impl fmt::Display for KernelType {
466    fn fmt(&self, f: &mut fmt::Formatter) -> fmt::Result {
467        match self {
468            KernelType::SquaredExponential => write!(f, "SquaredExponential"),
469            KernelType::Matern52 => write!(f, "Matern52"),
470            KernelType::Matern32 => write!(f, "Matern32"),
471        }
472    }
473}
474
/// Initial point generator type
///
/// Selects how the first `n_initial_points` design points are produced
/// before the surrogate-model-guided search takes over.
#[derive(Debug, Clone, Copy, Default)]
pub enum InitialPointGenerator {
    /// Uniform random sampling (default)
    #[default]
    Random,
    /// Latin Hypercube Sampling
    LatinHypercube,
    /// Sobol sequence
    Sobol,
    /// Halton sequence
    Halton,
}
488
489impl fmt::Display for InitialPointGenerator {
490    fn fmt(&self, f: &mut fmt::Formatter) -> fmt::Result {
491        match self {
492            InitialPointGenerator::Random => write!(f, "Random"),
493            InitialPointGenerator::LatinHypercube => write!(f, "LatinHypercube"),
494            InitialPointGenerator::Sobol => write!(f, "Sobol"),
495            InitialPointGenerator::Halton => write!(f, "Halton"),
496        }
497    }
498}
499
/// Options for Bayesian optimization
#[derive(Clone, Debug)]
pub struct BayesianOptimizationOptions {
    /// Number of initial design points evaluated before model-based search
    pub n_initial_points: usize,
    /// Generator used for the initial design points
    pub initial_point_generator: InitialPointGenerator,
    /// Acquisition function type
    pub acq_func: AcquisitionFunctionType,
    /// Kernel type for Gaussian Process
    /// (NOTE(review): `build_model` currently always uses squared exponential)
    pub kernel: KernelType,
    /// Exploration-exploitation trade-off for LCB (larger explores more)
    pub kappa: f64,
    /// Exploration parameter for EI and PI
    pub xi: f64,
    /// Random seed for reproducibility (a random seed is drawn when `None`)
    pub seed: Option<u64>,
    /// Parallel computation options
    /// (NOTE(review): not consumed in this file — confirm use elsewhere)
    pub parallel: Option<ParallelOptions>,
    /// Number of restarts for acquisition optimization
    pub n_restarts: usize,
}
522
523impl Default for BayesianOptimizationOptions {
524    fn default() -> Self {
525        Self {
526            n_initial_points: 10,
527            initial_point_generator: InitialPointGenerator::default(),
528            acq_func: AcquisitionFunctionType::default(),
529            kernel: KernelType::default(),
530            kappa: 1.96,
531            xi: 0.01,
532            seed: None,
533            parallel: None,
534            n_restarts: 5,
535        }
536    }
537}
538
/// Observation with input and output
#[derive(Debug, Clone)]
struct Observation {
    /// Input point (in the original, untransformed space)
    x: Array1<f64>,
    /// Objective function value at `x`
    y: f64,
}
547
/// The Bayesian optimization algorithm (ask/tell interface)
pub struct BayesianOptimizer {
    /// Search space
    space: Space,
    /// Optimization options
    options: BayesianOptimizationOptions,
    /// All observations recorded so far
    observations: Vec<Observation>,
    /// Best (lowest-valued) observation so far, if any
    best_observation: Option<Observation>,
    /// Random number generator (seeded for reproducibility when requested)
    rng: StdRng,
    /// Current iteration number (counts `ask` calls)
    iteration: usize,
}
563
564impl BayesianOptimizer {
565    /// Create a new Bayesian optimizer
566    pub fn new(space: Space, options: Option<BayesianOptimizationOptions>) -> Self {
567        let options = options.unwrap_or_default();
568        let seed = options
569            .seed
570            .unwrap_or_else(|| scirs2_core::random::rng().random());
571        let rng = StdRng::seed_from_u64(seed);
572
573        Self {
574            space,
575            options,
576            observations: Vec::new(),
577            best_observation: None,
578            rng,
579            iteration: 0,
580        }
581    }
582
583    /// Enforce integer dimension constraints by rounding and clamping
584    fn enforce_integer_dims(&self, x: &mut Array1<f64>) {
585        for (i, (_, param)) in self.space.parameters.iter().enumerate() {
586            if let Parameter::Integer(lo, hi) = param {
587                x[i] = x[i].round().clamp(*lo as f64, *hi as f64);
588            }
589        }
590    }
591
592    /// Ask for the next point to evaluate
593    pub fn ask(&mut self) -> Array1<f64> {
594        // If we don't have enough points, sample randomly
595        if self.observations.len() < self.options.n_initial_points {
596            let samples = match self.options.initial_point_generator {
597                InitialPointGenerator::Random => {
598                    // Simple random sampling
599                    self.space.sample(1, &mut self.rng)
600                }
601                InitialPointGenerator::LatinHypercube => {
602                    // Implement Latin Hypercube Sampling
603                    let dim = self.space.bounds.len();
604                    let n_samples = 1;
605
606                    // Create intervals for each dimension
607                    let mut sample = Array1::zeros(dim);
608
609                    for (i, (low, high)) in self.space.bounds.iter().enumerate() {
610                        // For single sample, pick random position in interval
611                        let interval_size = (high - low) / n_samples as f64;
612                        let offset = self.rng.random_range(0.0..1.0) * interval_size;
613                        sample[i] = low + offset;
614                    }
615
616                    vec![sample]
617                }
618                InitialPointGenerator::Sobol => {
619                    // Implement basic Sobol sequence
620                    let dim = self.space.bounds.len();
621                    let mut sample = Array1::zeros(dim);
622
623                    // Use iteration count as seed for Sobol sequence
624                    let seed = self.iteration as u32 + 1;
625
626                    for (i, (low, high)) in self.space.bounds.iter().enumerate() {
627                        // Simple digital scrambling based on Van der Corput sequence
628                        let mut n = seed;
629                        let mut denom = 1.0;
630                        let mut result = 0.0;
631                        let base = 2u32;
632
633                        while n > 0 {
634                            denom *= base as f64;
635                            result += (n % base) as f64 / denom;
636                            n /= base;
637                        }
638
639                        // Scale to bounds with dimension-specific offset
640                        let offset = ((i + 1) as f64 * 0.5).fract();
641                        let value = (result + offset).fract();
642                        sample[i] = low + value * (high - low);
643                    }
644
645                    vec![sample]
646                }
647                InitialPointGenerator::Halton => {
648                    // Implement Halton sequence
649                    let dim = self.space.bounds.len();
650                    let mut sample = Array1::zeros(dim);
651
652                    // First few prime numbers for Halton bases
653                    let primes = [2u32, 3, 5, 7, 11, 13, 17, 19, 23, 29, 31, 37, 41, 43, 47];
654                    let seed = self.iteration as u32 + 1;
655
656                    for (i, (low, high)) in self.space.bounds.iter().enumerate() {
657                        // Use different prime base for each dimension
658                        let base = if i < primes.len() {
659                            primes[i]
660                        } else {
661                            primes[i % primes.len()]
662                        };
663
664                        // Compute Halton value using radical inverse
665                        let mut n = seed;
666                        let mut denom = 1.0;
667                        let mut result = 0.0;
668
669                        while n > 0 {
670                            denom *= base as f64;
671                            result += (n % base) as f64 / denom;
672                            n /= base;
673                        }
674
675                        // Scale to bounds
676                        sample[i] = low + result * (high - low);
677                    }
678
679                    vec![sample]
680                }
681            };
682
683            self.iteration += 1;
684            let mut point = samples[0].clone();
685            self.enforce_integer_dims(&mut point);
686            return point;
687        }
688
689        // Otherwise, optimize the acquisition function
690        self.iteration += 1;
691        let mut point = self.optimize_acquisition_function();
692        self.enforce_integer_dims(&mut point);
693        point
694    }
695
696    /// Update with an observation
697    pub fn tell(&mut self, x: Array1<f64>, y: f64) {
698        let observation = Observation { x, y };
699
700        // Update best observation
701        if let Some(best) = &self.best_observation {
702            if y < best.y {
703                self.best_observation = Some(observation.clone());
704            }
705        } else {
706            self.best_observation = Some(observation.clone());
707        }
708
709        // Add to observations
710        self.observations.push(observation);
711    }
712
713    /// Build a Gaussian Process model from observations
714    fn build_model(&self) -> GaussianProcess {
715        // Prepare data
716        let mut x_data = Vec::with_capacity(self.observations.len());
717        let mut y_data = Vec::with_capacity(self.observations.len());
718
719        for obs in &self.observations {
720            let x_transformed = self.space.transform(&obs.x.view()).to_vec();
721            x_data.push(x_transformed);
722            y_data.push(obs.y);
723        }
724
725        // Build model using default settings (which uses squared exponential kernel)
726        // In a future implementation we could expose more kernel options
727        GaussianProcess::default(x_data, y_data)
728    }
729
730    /// Create an acquisition function
731    fn create_acquisition_function(&self) -> Box<dyn AcquisitionFunction> {
732        let model = self.build_model();
733        let y_best = self.best_observation.as_ref().expect("Operation failed").y;
734
735        match self.options.acq_func {
736            AcquisitionFunctionType::ExpectedImprovement => {
737                Box::new(ExpectedImprovement::new(model, y_best, self.options.xi))
738            }
739            AcquisitionFunctionType::LowerConfidenceBound => {
740                Box::new(LowerConfidenceBound::new(model, self.options.kappa))
741            }
742            AcquisitionFunctionType::ProbabilityOfImprovement => Box::new(
743                ProbabilityOfImprovement::new(model, y_best, self.options.xi),
744            ),
745        }
746    }
747
748    /// Optimize the acquisition function
749    fn optimize_acquisition_function(&mut self) -> Array1<f64> {
750        let acq_func = self.create_acquisition_function();
751        let bounds = self.space.bounds_to_vec();
752        let n_restarts = self.options.n_restarts;
753
754        // We want to minimize the negative acquisition function
755        let f = |x: &ArrayView1<f64>| -acq_func.evaluate(x);
756
757        // Starting points for optimization
758        let mut x_starts = self.space.sample(n_restarts, &mut self.rng);
759
760        // Add the current best point as one of the starting points
761        if let Some(best) = &self.best_observation {
762            if !x_starts.is_empty() {
763                x_starts[0] = best.x.clone();
764            } else {
765                x_starts.push(best.x.clone());
766            }
767        }
768
769        // Optimize from each starting point
770        let mut best_x = None;
771        let mut best_value = f64::INFINITY;
772
773        for x_start in x_starts {
774            let result = minimize(
775                f,
776                &x_start.to_vec(),
777                Method::LBFGS,
778                Some(Options {
779                    bounds: Some(
780                        crate::unconstrained::Bounds::from_vecs(
781                            bounds.iter().map(|b| Some(b.0)).collect(),
782                            bounds.iter().map(|b| Some(b.1)).collect(),
783                        )
784                        .expect("Operation failed"),
785                    ),
786                    ..Default::default()
787                }),
788            );
789
790            if let Ok(res) = result {
791                if res.fun < best_value {
792                    best_value = res.fun;
793                    best_x = Some(res.x);
794                }
795            }
796        }
797
798        // Return the best point found
799        let mut result = best_x.unwrap_or_else(|| {
800            // If optimization fails, return a random point
801            self.space.sample(1, &mut self.rng)[0].clone()
802        });
803        self.enforce_integer_dims(&mut result);
804        result
805    }
806
807    /// Run the full optimization process
808    pub fn optimize<F>(&mut self, func: F, n_calls: usize) -> OptimizeResult<f64>
809    where
810        F: Fn(&ArrayView1<f64>) -> f64,
811    {
812        let mut n_calls_remaining = n_calls;
813
814        // Initial random sampling
815        let n_initial = self.options.n_initial_points.min(n_calls);
816        let initial_points = self.space.sample(n_initial, &mut self.rng);
817
818        for point in initial_points {
819            let value = func(&point.view());
820            self.tell(point, value);
821            n_calls_remaining -= 1;
822
823            if n_calls_remaining == 0 {
824                break;
825            }
826        }
827
828        // Main optimization loop
829        let mut iterations = 0;
830
831        while n_calls_remaining > 0 {
832            // Get next point
833            let next_point = self.ask();
834
835            // Evaluate function
836            let value = func(&next_point.view());
837
838            // Update model
839            self.tell(next_point, value);
840
841            // Update counters
842            n_calls_remaining -= 1;
843            iterations += 1;
844        }
845
846        // Return final result
847        let best = self.best_observation.as_ref().expect("Operation failed");
848        OptimizeResult {
849            x: best.x.clone(),
850            fun: best.y,
851            nfev: self.observations.len(),
852            func_evals: self.observations.len(),
853            nit: iterations,
854            success: true,
855            message: "Optimization terminated successfully".to_string(),
856            ..Default::default()
857        }
858    }
859}
860
861/// Perform Bayesian optimization on a function
862#[allow(dead_code)]
863pub fn bayesian_optimization<F>(
864    func: F,
865    bounds: Vec<(f64, f64)>,
866    n_calls: usize,
867    options: Option<BayesianOptimizationOptions>,
868) -> Result<OptimizeResult<f64>, OptimizeError>
869where
870    F: Fn(&ArrayView1<f64>) -> f64,
871{
872    // Create space from bounds
873    let space = bounds
874        .into_iter()
875        .enumerate()
876        .fold(Space::new(), |space, (i, (lower, upper))| {
877            space.add(format!("x{}", i), Parameter::Real(lower, upper))
878        });
879
880    // Create optimizer
881    let mut optimizer = BayesianOptimizer::new(space, options);
882
883    // Run optimization
884    let result = optimizer.optimize(func, n_calls);
885
886    Ok(result)
887}
888
#[cfg(test)]
mod tests {
    use super::*;
    use scirs2_core::ndarray::array;

    // Mixed parameter kinds: the transformed dimensionality must account for
    // one-hot encoding of categorical parameters.
    #[test]
    fn test_space_creation() {
        let space = Space::new()
            .add("x1", Parameter::Real(-5.0, 5.0))
            .add("x2", Parameter::Integer(0, 10))
            .add(
                "x3",
                Parameter::Categorical(vec!["a".into(), "b".into(), "c".into()]),
            );

        assert_eq!(space.n_dims(), 3);
        assert_eq!(space.transformed_n_dims(), 5); // 1 (real) + 1 (integer) + 3 (categorical)
    }

    // Numeric dimensions are rescaled into [0, 1] by `transform`.
    #[test]
    fn test_space_transform() {
        let space = Space::new()
            .add("x1", Parameter::Real(-5.0, 5.0))
            .add("x2", Parameter::Integer(0, 10));

        let x = array![0.0, 5.0];
        let transformed = space.transform(&x.view());

        assert_eq!(transformed.len(), 2);
        assert!((transformed[0] - 0.5).abs() < 1e-6); // (0.0 - (-5.0)) / (5.0 - (-5.0)) = 0.5
        assert!((transformed[1] - 0.5).abs() < 1e-6); // (5.0 - 0.0) / (10.0 - 0.0) = 0.5
    }

    // End-to-end run on a convex objective: with a small seeded budget the
    // optimizer should land close to the global minimum at the origin.
    #[test]
    fn test_bayesian_optimization() {
        // Simple quadratic function
        let f = |x: &ArrayView1<f64>| x[0].powi(2) + x[1].powi(2);
        let bounds = vec![(-5.0, 5.0), (-5.0, 5.0)];

        let options = BayesianOptimizationOptions {
            n_initial_points: 5,
            seed: Some(42),
            ..Default::default()
        };

        let result = bayesian_optimization(f, bounds, 15, Some(options)).expect("Operation failed");

        // Should find minimum near (0, 0)
        assert!(result.fun < 0.5);
        assert!(result.x[0].abs() < 0.5);
        assert!(result.x[1].abs() < 0.5);
    }

    // Every proposed point for an Integer parameter must be an in-bounds
    // integer, and the optimum (x = 2) must be identified exactly.
    #[test]
    fn test_integer_dimension_enforcement() {
        let space = Space::new().add("rating", Parameter::Integer(0, 3));
        let options = BayesianOptimizationOptions {
            n_initial_points: 2,
            seed: Some(42),
            ..Default::default()
        };
        let mut opt = BayesianOptimizer::new(space, Some(options));
        let result = opt.optimize(
            |x| {
                let v = x[0];
                (v - 2.0).abs()
            },
            6,
        );
        // All evaluated points must be integers in [0, 3]
        for obs in &opt.observations {
            let v = obs.x[0];
            assert!(v >= 0.0 && v <= 3.0, "Out of bounds: {v}");
            assert!((v - v.round()).abs() < 1e-12, "Not integer: {v}");
        }
        // Best should be x=2
        assert!(
            (result.x[0] - 2.0).abs() < 1e-12,
            "Best x should be 2, got {}",
            result.x[0]
        );
    }
}