// numdiff 0.7.3 - Docs.rs

use crate::constants::CBRT_EPS;
use linalg_traits::Vector;

/// Gradient of a multivariate, scalar-valued function using the central difference approximation.
///
/// # Arguments
///
/// * `f` - Multivariate, scalar-valued function, $f:\mathbb{R}^{n}\to\mathbb{R}$.
/// * `x0` - Evaluation point, $\mathbf{x}_{0}\in\mathbb{R}^{n}$.
/// * `h` - Relative step size, $h\in\mathbb{R}$. Defaults to [`CBRT_EPS`].
///
/// # Returns
///
/// Gradient of $f$ with respect to $\mathbf{x}$, evaluated at $\mathbf{x}=\mathbf{x}_{0}$.
///
/// $$\nabla f(\mathbf{x}_{0})\in\mathbb{R}^{n}$$
///
/// # Note
///
/// This function performs $2n$ evaluations of $f(\mathbf{x})$.
///
/// # Examples
///
/// ## Basic Example
///
/// Approximate the gradient of
///
/// $$f(\mathbf{x})=x_{0}^{5}+\sin^{3}{x_{1}}$$
///
/// at $\mathbf{x}=(5,8)^{T}$, and compare the result to the true result of
///
/// $$
/// \nabla f\left((5,8)^{T}\right)=
/// \begin{bmatrix}
///     3125 \\\\
///     3\sin^{2}{(8)}\cos{(8)}
/// \end{bmatrix}
/// $$
///
/// #### Using standard vectors
///
/// ```
/// use numtest::*;
///
/// use numdiff::central_difference::gradient;
///
/// // Define the function, f(x).
/// let f = |x: &Vec<f64>| x[0].powi(5) + x[1].sin().powi(3);
///
/// // Define the evaluation point.
/// let x0 = vec![5.0, 8.0];
///
/// // Approximate the gradient of f(x) at the evaluation point.
/// let grad: Vec<f64> = gradient(&f, &x0, None);
///
/// // True gradient of f(x) at the evaluation point.
/// let grad_true: Vec<f64> = vec![3125.0, 3.0 * 8.0_f64.sin().powi(2) * 8.0_f64.cos()];
///
/// // Check the accuracy of the gradient approximation.
/// assert_arrays_equal_to_decimal!(grad, grad_true, 6);
/// ```
///
/// #### Using other vector types
///
/// We can also use other types of vectors, such as `nalgebra::SVector`, `nalgebra::DVector`,
/// `ndarray::Array1`, `faer::Mat`, or any other type of vector that implements the
/// `linalg_traits::Vector` trait.
///
/// ```
/// use faer::Mat;
/// use linalg_traits::Vector;  // to provide from_slice method for faer::Mat
/// use nalgebra::{dvector, DVector, SVector};
/// use ndarray::{array, Array1};
/// use numtest::*;
///
/// use numdiff::central_difference::gradient;
///
/// let grad_true: Vec<f64> = vec![3125.0, 3.0 * 8.0_f64.sin().powi(2) * 8.0_f64.cos()];
///
/// // nalgebra::DVector
/// let f_dvector = |x: &DVector<f64>| x[0].powi(5) + x[1].sin().powi(3);
/// let x0_dvector: DVector<f64> = dvector![5.0, 8.0];
/// let grad_dvector: DVector<f64> = gradient(&f_dvector, &x0_dvector, None);
/// assert_arrays_equal_to_decimal!(grad_dvector, grad_true, 6);
///
/// // nalgebra::SVector
/// let f_svector = |x: &SVector<f64,2>| x[0].powi(5) + x[1].sin().powi(3);
/// let x0_svector: SVector<f64, 2> = SVector::from_row_slice(&[5.0, 8.0]);
/// let grad_svector: SVector<f64, 2> = gradient(&f_svector, &x0_svector, None);
/// assert_arrays_equal_to_decimal!(grad_svector, grad_true, 6);
///
/// // ndarray::Array1
/// let f_array1 = |x: &Array1<f64>| x[0].powi(5) + x[1].sin().powi(3);
/// let x0_array1: Array1<f64> = array![5.0, 8.0];
/// let grad_array1: Array1<f64> = gradient(&f_array1, &x0_array1, None);
/// assert_arrays_equal_to_decimal!(grad_array1, grad_true, 6);
///
/// // faer::Mat
/// let f_mat = |x: &Mat<f64>| x[(0, 0)].powi(5) + x[(1, 0)].sin().powi(3);
/// let x0_mat: Mat<f64> = Mat::from_slice(&[5.0, 8.0]);
/// let grad_mat: Mat<f64> = gradient(&f_mat, &x0_mat, None);
/// assert_arrays_equal_to_decimal!(grad_mat.as_slice(), grad_true, 6);
/// ```
///
/// #### Modifying the relative step size
///
/// We can also modify the relative step size. Choosing a coarser relative step size, we get a worse
/// approximation.
///
/// ```
/// use numtest::*;
///
/// use numdiff::central_difference::gradient;
///
/// let f = |x: &Vec<f64>| x[0].powi(5) + x[1].sin().powi(3);
/// let x0 = vec![5.0, 8.0];
///
/// let grad: Vec<f64> = gradient(&f, &x0, Some(0.001));
/// let grad_true: Vec<f64> = vec![3125.0, 3.0 * 8.0_f64.sin().powi(2) * 8.0_f64.cos()];
///
/// assert_arrays_equal_to_decimal!(grad, grad_true, 2);
/// ```
///
/// ## Example Passing Runtime Parameters
///
/// Approximate the gradient of a parameterized function
///
/// $$f(\mathbf{x})=ax_{0}^{2}+bx_{1}^{2}+cx_{0}x_{1}+d$$
///
/// where $a$, $b$, $c$, and $d$ are runtime parameters. Compare the result against the true
/// gradient of
///
/// $$\nabla f=\begin{bmatrix}2ax_{0}+cx_{1}\\\\2bx_{1}+cx_{0}\end{bmatrix}$$
///
/// ```
/// use numtest::*;
///
/// use numdiff::central_difference::gradient;
///
/// // Runtime parameters.
/// let a = 2.0;
/// let b = 1.5;
/// let c = 0.8;
/// let d = -3.0;
///
/// // Define the parameterized function.
/// fn f_param(x: &Vec<f64>, a: f64, b: f64, c: f64, d: f64) -> f64 {
///     a * x[0].powi(2) + b * x[1].powi(2) + c * x[0] * x[1] + d
/// }
///
/// // Wrap the parameterized function with a closure that captures the parameters.
/// let f = |x: &Vec<f64>| f_param(x, a, b, c, d);
///
/// // Evaluation point.
/// let x0 = vec![1.0, -2.0];
///
/// // True gradient function.
/// let grad_true = |x: &Vec<f64>| vec![2.0 * a * x[0] + c * x[1], 2.0 * b * x[1] + c * x[0]];
///
/// // Approximate the gradient and compare with true gradient.
/// let grad_eval: Vec<f64> = gradient(&f, &x0, None);
/// let grad_eval_true: Vec<f64> = grad_true(&x0);
/// assert_arrays_equal_to_decimal!(grad_eval, grad_eval_true, 9);
/// ```
pub fn gradient<V>(f: &impl Fn(&V) -> f64, x0: &V, h: Option<f64>) -> V
where
    V: Vector<f64>,
{
    // Fall back to the default relative step size, h = ε¹ᐟ³, when the caller supplies none.
    let rel_step = h.unwrap_or_else(|| *CBRT_EPS);

    // Work on a private copy of the evaluation point: a single coordinate is perturbed and then
    // restored on each pass, so the caller's vector is never modified.
    let mut point = x0.clone();

    // Dimension of x, which is also the number of partial derivatives to compute.
    let dim = point.len();

    // Storage for the gradient.
    let mut grad = V::new_with_length(dim);

    // Approximate one partial derivative per coordinate direction.
    for idx in 0..dim {
        // Unperturbed value of the current coordinate.
        let center = point.vget(idx);

        // Absolute step size for this coordinate, scaled by the coordinate's magnitude.
        let step = rel_step * (1.0 + center.abs());

        // Evaluate f one step ahead of the evaluation point.
        point.vset(idx, center + step);
        let f_fwd = f(&point);

        // Evaluate f one step behind the evaluation point.
        point.vset(idx, center - step);
        let f_bwd = f(&point);

        // Restore the coordinate so the next direction starts from the original point.
        point.vset(idx, center);

        // Central difference quotient: ∂f/∂xₖ ≈ (f(x + Δxₖ) − f(x − Δxₖ)) / (2Δxₖ).
        grad.vset(idx, (f_fwd - f_bwd) / (2.0 * step));
    }

    grad
}

#[cfg(test)]
mod tests {
    use super::*;
    use nalgebra::SVector;
    use ndarray::{Array1, array};
    use numtest::*;

    /// Univariate quadratic on a `Vec<f64>`: f(x) = x₀², with ∇f = [2x₀].
    #[test]
    fn test_gradient_1() {
        let func = |v: &Vec<f64>| v[0].powi(2);
        let exact_grad = |v: &Vec<f64>| vec![2.0 * v[0]];
        let point = vec![2.0];

        let approx = gradient(&func, &point, None);
        let expected = exact_grad(&point);
        assert_arrays_equal_to_decimal!(approx, expected, 11);
    }

    /// Bivariate polynomial on an `SVector`: f(x) = x₀² + x₁³, with ∇f = [2x₀, 3x₁²].
    #[test]
    fn test_gradient_2() {
        let func = |v: &SVector<f64, 2>| v[0].powi(2) + v[1].powi(3);
        let exact_grad = |v: &SVector<f64, 2>| {
            SVector::<f64, 2>::from_slice(&[2.0 * v[0], 3.0 * v[1].powi(2)])
        };
        let point: SVector<f64, 2> = SVector::from_slice(&[1.0, 2.0]);

        let approx = gradient(&func, &point, None);
        let expected = exact_grad(&point);
        assert_arrays_equal_to_decimal!(approx, expected, 9);
    }

    /// Mixed polynomial/trigonometric function on an `Array1`: f(x) = x₀⁵ + sin³(x₁), with
    /// ∇f = [5x₀⁴, 3sin²(x₁)cos(x₁)].
    #[test]
    fn test_gradient_3() {
        let func = |v: &Array1<f64>| v[0].powi(5) + v[1].sin().powi(3);
        let exact_grad =
            |v: &Array1<f64>| array![5.0 * v[0].powi(4), 3.0 * v[1].sin().powi(2) * v[1].cos()];
        let point = array![5.0, 8.0];

        let approx = gradient(&func, &point, None);
        let expected = exact_grad(&point);
        assert_arrays_equal_to_decimal!(approx, expected, 6);
    }
}