DeepIron 0.1.4 - Docs.rs

//! A set of structs and functions for support vector machines.

use crate::data_loader::DataFrameTransformer;
use crate::model::activation_functions::{ActivationFunction, ActivationFunctionType};
use crate::model::kernel_functions::{KernelFunction, KernelFunctionType};
use crate::model::loss_functions::{LossFunction, LossFunctionType};
use crate::model::*;
use polars::prelude::*;
use polars::series::Series;

/// A struct that defines a support vector machine.
///
/// # Example
///
/// ```
/// let model = Model::SVM::new();
///
/// model.fit(&x, &y, num_epochs, learning_rate);
///
/// let y_pred = model.predict(&x);
///
/// ```
pub struct SVM {
    // Fields for training
    pub loss_function: LossFunctionType,
    pub activation_function: ActivationFunctionType,
    pub kernel_function: KernelFunctionType,

    // Fields to store results
    pub intercept: f64,
    pub coefficients: Vec<f64>,
}

impl SVM {
    /// Create a new SVM model.
    ///
    /// # Example
    ///
    /// ```
    /// let model = Model::SVM::new();
    /// ```
    pub fn new() -> SVM {
        SVM {
            loss_function: LossFunctionType::Hinge,
            activation_function: ActivationFunctionType::Identity,
            kernel_function: KernelFunctionType::Identity,
            intercept: 0.0,
            coefficients: Vec::new(),
        }
    }

    /// Compute the gradients for the model.
    /// 
    /// # Arguments
    /// 
    /// * `x` - The Series of input data.
    /// 
    /// * `y` - The Series of true values.
    /// 
    /// * `predictions` - The Series of predictions.
    /// 
    /// # Returns
    /// 
    /// A tuple containing the bias gradient and the weight gradients.
    /// 
    /// # Example
    /// 
    /// ```
    /// let (bias_gradient, weight_gradients) = model.compute_gradients(&x, &y, &predictions);
    /// 
    /// ```
    fn compute_gradients(
        &self,
        x: &DataFrame,
        y: &Series,
        predictions: &Series,
    ) -> (f64, Vec<f64>) {
        let mut weight_gradients: Vec<f64> = Vec::with_capacity(self.coefficients.len());
        let bias_gradient: f64 = self.loss_function.intercept_gradient(y, predictions);

        for (i, _) in self.coefficients.iter().enumerate() {
            let x_column: Series = x.get_col_by_index(i).unwrap();
            let x_column: &ChunkedArray<Float64Type> = x_column.f64().unwrap();

            // Calculate kernel values for each data point and prediction
            let kernel_values: Series = self
                .kernel_function
                .kernel(&x_column.clone().into_series(), predictions);

            // Convert kernel values to dataframe
            let kernel_values: DataFrame = DataFrame::new(vec![kernel_values]).unwrap();

            // Use kernel values directly in gradient calculation
            let gradient: f64 = self
                .loss_function
                .gradient(&kernel_values, y, predictions)
                .mean()
                .unwrap();
            weight_gradients.push(gradient);
        }

        (bias_gradient, weight_gradients)
    }
}

impl model::SupervisedModeller for SVM {
    /// Fit the model to the data.
    ///
    /// # Example
    ///
    /// ```
    /// let model = SVM::new();
    ///
    /// model.fit(&x, &y, num_epochs, learning_rate);
    /// ```
    fn fit(
        &mut self,
        x: &DataFrame,
        y: &Series,
        num_epochs: u32,
        learning_rate: f64,
    ) -> Result<(), PolarsError> {
        // Check if data are valid
        if x.shape().0 != y.len() {
            return Err(PolarsError::ShapeMismatch(
                "Shape mismatch between X and y".into(),
            ));
        }

        // Initialise coefficients
        for _ in 0..x.width() {
            self.coefficients.push(0.0);
        }

        for _ in 0..num_epochs {
            let predictions: Series = self.predict(x)?;
            let gradients: (f64, Vec<f64>) = self.compute_gradients(x, y, &predictions);

            self.intercept -= learning_rate * gradients.0;

            for (i, coefficient) in self.coefficients.iter_mut().enumerate() {
                *coefficient -= learning_rate * gradients.1[i];
            }
        }

        Ok(())
    }


    /// Predict the output of the model.
    /// 
    /// # Arguments
    /// 
    /// * `x` - The DataFrame of input data.
    /// 
    /// # Returns
    /// 
    /// The Series of predictions.
    /// 
    /// # Example
    /// 
    /// ```
    /// 
    /// let predictions = model.predict(&x);
    /// 
    /// ```
    fn predict(&self, x: &DataFrame) -> Result<Series, PolarsError> {
        let mut predictions: Series = Series::new("prediction", vec![self.intercept; x.height()]);

        for (i, coefficient) in self.coefficients.iter().enumerate() {
            let x_column: Series = x.get_col_by_index(i).unwrap();
            let x_column: &ChunkedArray<Float64Type> = x_column.f64().unwrap();
            let prediction: Series = (x_column * *coefficient).into_series();
            predictions = predictions + prediction;
        }

        // Run activation function
        predictions = self.activation_function.activate(&predictions);

        Ok(predictions)
    }

    fn accuracy(&self, x: &DataFrame, y: &Series) -> Result<f64, PolarsError> {
        let predictions: Series = self.predict(x)?;
        let predictions: Series = self.activation_function.activate(&predictions);
        let predictions: Series = predictions.gt_eq(y).unwrap().into_series();
        let accuracy: f64 = predictions.sum::<u32>().unwrap() as f64 / predictions.len() as f64;

        Ok(accuracy)
    }

    fn loss(&self, x: &DataFrame, y: &Series) -> Result<f64, PolarsError> {
        let predictions: Series = self.predict(x)?;
        let loss: f64 = self.loss_function.loss(&predictions, y);

        Ok(loss)
    }
}