neuralib 0.0.3 - Docs.rs

//! Activation functions for neuralib
//!
//! This module provides many different activation functions for a neural network.

#[cfg(feature = "serde")]
use serde::{Deserialize, Serialize};

/// The activation functions this library supports
///
/// Every variant is a plain unit variant, so values are cheap to copy and compare.
// `Serialize`/`Deserialize` are only imported when the `serde` feature is enabled, so the
// derive must be gated on the same feature; otherwise the crate does not build without it.
#[derive(Clone, Copy, Debug, Default, PartialEq, Eq)]
#[cfg_attr(feature = "serde", derive(Serialize, Deserialize))]
pub enum Activation {
    /// A linear activation function. The output is the same as the input
    #[default]
    Linear,
    /// The step activation function. The output is 0 if x < 0, otherwise it's 1
    Step,
    /// The sigmoid activation function: <https://en.wikipedia.org/wiki/Sigmoid_function>
    Sigmoid,
    /// The Hyperbolic Tangent activation function.
    HyperTan,
    /// The SiLU (Swish) activation function: <https://en.wikipedia.org/wiki/Rectified_linear_unit#SiLU>
    SiLU,
    /// The ReLU activation function: <https://en.wikipedia.org/wiki/Rectified_linear_unit>
    ReLU,
    /// The Leaky ReLU activation function: <https://en.wikipedia.org/wiki/Rectified_linear_unit#Piecewise-linear_variants>
    LeakyReLU,
}

impl Activation {
    /// Slope applied to negative inputs by Leaky ReLU (shared by the function and its derivative)
    const LEAKY_SLOPE: f64 = 0.15;

    /// Call the selected activation function
    ///
    /// Returns the value of the activation function at `x`.
    pub fn call(&self, x: f64) -> f64 {
        match self {
            Self::Linear => Self::linear(x),
            Self::Step => Self::step(x),
            Self::Sigmoid => Self::sigmoid(x),
            Self::HyperTan => Self::hypertan(x),
            Self::SiLU => Self::si_lu(x),
            Self::ReLU => Self::re_lu(x),
            Self::LeakyReLU => Self::leaky_re_lu(x),
        }
    }

    /// Evaluate the derivative of the selected activation function
    ///
    /// `x` is the *input* of the activation function, not its output. Where the function is
    /// not differentiable a fixed convention is used: the step function reports 0 everywhere,
    /// and ReLU / Leaky ReLU report 1 at `x == 0`.
    pub fn derivative(&self, x: f64) -> f64 {
        match self {
            Self::Linear => Self::deriv_linear(x),
            Self::Step => Self::deriv_step(x),
            Self::Sigmoid => Self::deriv_sigmoid(x),
            Self::HyperTan => Self::deriv_hypertan(x),
            Self::SiLU => Self::deriv_si_lu(x),
            Self::ReLU => Self::deriv_re_lu(x),
            Self::LeakyReLU => Self::deriv_leaky_re_lu(x),
        }
    }

    /// Derivative of the identity: constant 1
    fn deriv_linear(_x: f64) -> f64 {
        1.0
    }

    /// Identity function
    fn linear(x: f64) -> f64 {
        x
    }

    /// Derivative of the step function
    fn deriv_step(_x: f64) -> f64 {
        // 0 everywhere except at the jump itself, where it is undefined; report 0 there as well
        0.0
    }

    /// Step function: 0 for negative inputs, 1 otherwise
    fn step(x: f64) -> f64 {
        // `>=` so that an input of exactly 0 yields 1, matching the documentation of
        // `Activation::Step`. NaN compares false and therefore maps to 0.
        if x >= 0.0 { 1.0 } else { 0.0 }
    }

    /// Derivative of the sigmoid: s(x) * (1 - s(x))
    fn deriv_sigmoid(x: f64) -> f64 {
        let s = Self::sigmoid(x);
        s * (1.0 - s)
    }

    /// Logistic sigmoid: 1 / (1 + e^-x)
    fn sigmoid(x: f64) -> f64 {
        (1.0 + (-x).exp()).recip()
    }

    /// Derivative of tanh: 1 - tanh(x)^2
    fn deriv_hypertan(x: f64) -> f64 {
        1.0 - x.tanh().powi(2)
    }

    /// Hyperbolic tangent
    fn hypertan(x: f64) -> f64 {
        x.tanh()
    }

    /// Derivative of SiLU: x * s'(x) + s(x), where s is the sigmoid
    fn deriv_si_lu(x: f64) -> f64 {
        // Evaluate the sigmoid once and reuse it for both terms
        let s = Self::sigmoid(x);
        // mul_add performs a single rounding, which reduces the error
        x.mul_add(s * (1.0 - s), s)
    }

    /// SiLU (Swish with beta = 1): x * sigmoid(x)
    fn si_lu(x: f64) -> f64 {
        x * Self::sigmoid(x)
    }

    /// Derivative of ReLU: 0 for negative inputs, 1 otherwise
    fn deriv_re_lu(x: f64) -> f64 {
        // The derivative at 0 is chosen to be 1 so ReLU and Leaky ReLU share the same shape
        if x < 0.0 { 0.0 } else { 1.0 }
    }

    /// ReLU: max(x, 0)
    fn re_lu(x: f64) -> f64 {
        x.max(0.0)
    }

    /// Derivative of Leaky ReLU: `LEAKY_SLOPE` for negative inputs, 1 otherwise
    fn deriv_leaky_re_lu(x: f64) -> f64 {
        if x < 0.0 { Self::LEAKY_SLOPE } else { 1.0 }
    }

    /// Leaky ReLU: max(x, LEAKY_SLOPE * x)
    fn leaky_re_lu(x: f64) -> f64 {
        // For x >= 0 the first operand wins, for x < 0 the scaled one does
        x.max(x * Self::LEAKY_SLOPE)
    }
}

#[cfg(test)]
mod tests {
    use super::*;

    /// Approximate float comparison with an absolute tolerance of 1e-4
    fn floating_equal(a: f64, b: f64) -> bool {
        let tolerance = 0.0001;
        (a - b).abs() < tolerance
    }

    /// Central-difference estimate of the slope of `act` at `x`
    fn numeric_slope(act: &Activation, x: f64) -> f64 {
        let h = 1e-5;
        (act.call(x + h) - act.call(x - h)) / (2.0 * h)
    }

    #[test]
    fn linear() {
        let act = Activation::Linear;

        for i in -100_i32..=100 {
            assert_eq!(act.call(f64::from(i)), f64::from(i));
        }
    }

    #[test]
    fn step() {
        // Only strictly negative and strictly positive inputs are checked here;
        // the jump at x = 0 is not exercised by this test.
        let act = Activation::Step;

        for i in -100_i32..0 {
            assert_eq!(act.call(f64::from(i)), 0.0);
        }

        for i in 1_i32..=100 {
            assert_eq!(act.call(f64::from(i)), 1.0);
        }
    }

    #[test]
    fn sigmoid() {
        let act = Activation::Sigmoid;
        assert_eq!(act.call(0.0), 0.5);
        // Assert that the S shape is there
        assert!(act.call(9999.0) > 0.999);
        assert!(act.call(-9999.0) < 0.001);
    }

    #[test]
    fn hypertan() {
        let act = Activation::HyperTan;
        assert_eq!(act.call(0.0), 0.0);

        assert!(act.call(9999.0) > 0.999);
        assert!(act.call(-9999.0) < -0.999);
    }

    #[test]
    fn si_lu() {
        let act = Activation::SiLU;
        // This is the low point in the dip.
        let si_lu_point = (-1.278465, -0.278465);

        // Test the beginning of ReLU
        assert!(floating_equal(act.call(-15.0), 0.0));
        // Test the end of ReLU
        assert!(floating_equal(act.call(100.0), 100.0));
        // Test the swish/SiLU point
        assert!(floating_equal(act.call(si_lu_point.0), si_lu_point.1));
    }

    #[test]
    fn re_lu() {
        let act = Activation::ReLU;

        for i in -100_i32..=0 {
            assert_eq!(act.call(f64::from(i)), 0.0);
        }
        for i in 0_i32..=100 {
            assert_eq!(act.call(f64::from(i)), f64::from(i));
        }
    }

    #[test]
    fn leaky_re_lu() {
        let act = Activation::LeakyReLU;

        for i in -100_i32..=0 {
            assert_eq!(act.call(f64::from(i)), f64::from(i) * 0.15);
        }
        for i in 0_i32..=100 {
            assert_eq!(act.call(f64::from(i)), f64::from(i));
        }
    }

    #[test]
    fn derivative_fixed_points() {
        // Constant derivatives
        for i in -10_i32..=10 {
            assert_eq!(Activation::Linear.derivative(f64::from(i)), 1.0);
            assert_eq!(Activation::Step.derivative(f64::from(i)), 0.0);
        }

        // Known closed-form values at the origin
        assert!(floating_equal(Activation::Sigmoid.derivative(0.0), 0.25));
        assert!(floating_equal(Activation::HyperTan.derivative(0.0), 1.0));
        assert!(floating_equal(Activation::SiLU.derivative(0.0), 0.5));

        // Saturating functions flatten out far away from the origin
        assert!(floating_equal(Activation::Sigmoid.derivative(9999.0), 0.0));
        assert!(floating_equal(Activation::HyperTan.derivative(-9999.0), 0.0));

        // The slope vanishes at the low point of the SiLU dip
        assert!(floating_equal(Activation::SiLU.derivative(-1.278465), 0.0));
    }

    #[test]
    fn derivative_piecewise_linear() {
        let re_lu = Activation::ReLU;
        assert_eq!(re_lu.derivative(-1.0), 0.0);
        assert_eq!(re_lu.derivative(0.0), 1.0);
        assert_eq!(re_lu.derivative(1.0), 1.0);

        let leaky = Activation::LeakyReLU;
        assert_eq!(leaky.derivative(-1.0), 0.15);
        assert_eq!(leaky.derivative(0.0), 1.0);
        assert_eq!(leaky.derivative(1.0), 1.0);
    }

    #[test]
    fn derivative_matches_numeric_slope() {
        // Smooth functions: compare against a central difference at several points
        let smooth = [Activation::Sigmoid, Activation::HyperTan, Activation::SiLU];
        let points = [-3.0, -1.0, -0.25, 0.0, 0.5, 2.0];
        for act in &smooth {
            for &x in &points {
                assert!(
                    floating_equal(act.derivative(x), numeric_slope(act, x)),
                    "{:?} derivative mismatch at x = {}",
                    act,
                    x
                );
            }
        }

        // Piecewise-linear functions: only compare away from the kink at 0
        let piecewise = [Activation::Linear, Activation::ReLU, Activation::LeakyReLU];
        for act in &piecewise {
            for &x in &[-2.0, 3.0] {
                assert!(
                    floating_equal(act.derivative(x), numeric_slope(act, x)),
                    "{:?} derivative mismatch at x = {}",
                    act,
                    x
                );
            }
        }
    }
}