Struct forust_ml::gradientbooster::GradientBooster
pub struct GradientBooster {
pub objective_type: ObjectiveType,
pub iterations: usize,
pub learning_rate: f32,
pub max_depth: usize,
pub max_leaves: usize,
pub l2: f32,
pub gamma: f32,
pub min_leaf_weight: f32,
pub base_score: f64,
pub nbins: u16,
pub parallel: bool,
pub allow_missing_splits: bool,
pub monotone_constraints: Option<ConstraintMap>,
pub subsample: f32,
pub top_rate: f64,
pub other_rate: f64,
pub seed: u64,
pub missing: f64,
pub create_missing_branch: bool,
pub sample_method: SampleMethod,
pub grow_policy: GrowPolicy,
pub evaluation_metric: Option<Metric>,
pub early_stopping_rounds: Option<usize>,
pub initialize_base_score: bool,
pub evaluation_history: Option<RowMajorMatrix<f64>>,
pub best_iteration: Option<usize>,
pub prediction_iteration: Option<usize>,
pub trees: Vec<Tree>,
/* private fields */
}
Gradient Booster object.
objective_type - The name of the objective function to optimize. Valid options are "LogLoss", to use logistic loss, or "SquaredLoss", to use squared error as the objective function.
iterations - Total number of trees to train in the ensemble.
learning_rate - Step size to use at each iteration. Each leaf weight is multiplied by this number; the smaller the value, the more conservative the weights will be.
max_depth - Maximum depth of an individual tree. Valid values are 0 to infinity.
max_leaves - Maximum number of leaves allowed on a tree, i.e. the total number of final nodes. Valid values are 0 to infinity.
l2 - L2 regularization term applied to the weights of the tree. Valid values are 0 to infinity.
gamma - The minimum amount of loss required to further split a node. Valid values are 0 to infinity.
min_leaf_weight - Minimum sum of the hessian values of the loss function required to be in a node.
base_score - The initial prediction value of the model.
nbins - Number of bins used to partition the data. A smaller number results in faster training, while potentially sacrificing accuracy. If there are more bins than unique values in a column, all unique values will be used.
parallel - Should the algorithm be run in parallel?
allow_missing_splits - Should the algorithm allow splits that completely separate missing and non-missing values, in the case where create_missing_branch is false? When create_missing_branch is true, setting this to true will result in the missing branch being further split.
monotone_constraints - Constraints used to enforce a specific relationship between the training features and the target variable.
subsample - Percent of records to randomly sample at each iteration when training a tree.
top_rate - Used only in GOSS; the retain ratio of large gradient data.
other_rate - Used only in GOSS; the retain ratio of small gradient data.
seed - Integer value used to seed any randomness used in the algorithm.
missing - Value to consider missing.
create_missing_branch - Should missing values be split out into their own separate branch?
sample_method - The method by which records should be sampled when training.
evaluation_metric - The evaluation metric to record at each iteration.
early_stopping_rounds - Number of rounds in which the evaluation metric value must improve to keep training.
initialize_base_score - If true, the base_score will be calculated using the sample_weight and y data in accordance with the requested objective_type.
Fields§
objective_type: ObjectiveType
iterations: usize
learning_rate: f32
max_depth: usize
max_leaves: usize
l2: f32
gamma: f32
min_leaf_weight: f32
base_score: f64
nbins: u16
parallel: bool
allow_missing_splits: bool
monotone_constraints: Option<ConstraintMap>
subsample: f32
top_rate: f64
other_rate: f64
seed: u64
missing: f64
create_missing_branch: bool
sample_method: SampleMethod
grow_policy: GrowPolicy
evaluation_metric: Option<Metric>
early_stopping_rounds: Option<usize>
initialize_base_score: bool
evaluation_history: Option<RowMajorMatrix<f64>>
best_iteration: Option<usize>
prediction_iteration: Option<usize> - Number of trees to use when predicting; defaults to best_iteration if that is defined.
trees: Vec<Tree>
Implementations§
impl GradientBooster
pub fn new(
objective_type: ObjectiveType,
iterations: usize,
learning_rate: f32,
max_depth: usize,
max_leaves: usize,
l2: f32,
gamma: f32,
min_leaf_weight: f32,
base_score: Option<f64>,
nbins: u16,
parallel: bool,
allow_missing_splits: bool,
monotone_constraints: Option<ConstraintMap>,
subsample: f32,
top_rate: f64,
other_rate: f64,
seed: u64,
missing: f64,
create_missing_branch: bool,
sample_method: SampleMethod,
grow_policy: GrowPolicy,
evaluation_metric: Option<Metric>,
early_stopping_rounds: Option<usize>,
initialize_base_score: bool
) -> Result<Self, ForustError>
Create a new GradientBooster object.
objective_type - The name of the objective function to optimize. Valid options are "LogLoss", to use logistic loss, or "SquaredLoss", to use squared error as the objective function.
iterations - Total number of trees to train in the ensemble.
learning_rate - Step size to use at each iteration. Each leaf weight is multiplied by this number; the smaller the value, the more conservative the weights will be.
max_depth - Maximum depth of an individual tree. Valid values are 0 to infinity.
max_leaves - Maximum number of leaves allowed on a tree, i.e. the total number of final nodes. Valid values are 0 to infinity.
l2 - L2 regularization term applied to the weights of the tree. Valid values are 0 to infinity.
gamma - The minimum amount of loss required to further split a node. Valid values are 0 to infinity.
min_leaf_weight - Minimum sum of the hessian values of the loss function required to be in a node.
base_score - The initial prediction value of the model. If set to None, the parameter initialize_base_score will automatically be set to true, in which case the base score will be chosen based on the objective function at fit time.
nbins - Number of bins used to partition the data. A smaller number results in faster training, while potentially sacrificing accuracy. If there are more bins than unique values in a column, all unique values will be used.
parallel - Should the algorithm be run in parallel?
allow_missing_splits - Should the algorithm allow splits that completely separate missing and non-missing values, in the case where create_missing_branch is false? When create_missing_branch is true, setting this to true will result in the missing branch being further split.
monotone_constraints - Constraints used to enforce a specific relationship between the training features and the target variable.
subsample - Percent of records to randomly sample at each iteration when training a tree.
top_rate - Used only in GOSS; the retain ratio of large gradient data.
other_rate - Used only in GOSS; the retain ratio of small gradient data.
seed - Integer value used to seed any randomness used in the algorithm.
missing - Value to consider missing.
create_missing_branch - Should missing values be split out into their own separate branch?
sample_method - The method by which records should be sampled when training.
evaluation_metric - The evaluation metric to record at each iteration.
early_stopping_rounds - Number of rounds in which the evaluation metric value must improve to keep training.
initialize_base_score - If true, the base_score will be calculated using the sample_weight and y data in accordance with the requested objective_type.
pub fn fit(
    &mut self,
    data: &Matrix<'_, f64>,
    y: &[f64],
    sample_weight: &[f64],
    evaluation_data: Option<Vec<EvaluationData<'_>>>
) -> Result<(), ForustError>
Fit the gradient booster on a provided dataset.
data - The training data, as a Matrix of f64 values.
y - The target values, as a slice of f64.
sample_weight - Instance weights to use when training the model. To weight every record equally, pass a weight of 1 for each record.
evaluation_data - Optional evaluation datasets on which the evaluation metric is recorded at each iteration.
pub fn fit_unweighted(
    &mut self,
    data: &Matrix<'_, f64>,
    y: &[f64],
    evaluation_data: Option<Vec<EvaluationData<'_>>>
) -> Result<(), ForustError>
Fit the gradient booster on a provided dataset without any weights; a weight of 1 is used for every record.
data - The training data, as a Matrix of f64 values.
y - The target values, as a slice of f64.
pub fn predict(&self, data: &Matrix<'_, f64>, parallel: bool) -> Vec<f64>
Generate predictions on data using the gradient booster.
data - The data to predict on, as a Matrix of f64 values.
parallel - Should the predictions be generated in parallel?
pub fn predict_contributions(
    &self,
    data: &Matrix<'_, f64>,
    method: ContributionsMethod,
    parallel: bool
) -> Vec<f64>
pub fn value_partial_dependence(&self, feature: usize, value: f64) -> f64
Calculate the partial dependence of the model for a given feature at a given value.
feature - The index of the feature.
value - The value for which to calculate the partial dependence.
pub fn save_booster(&self, path: &str) -> Result<(), ForustError>
Save a booster as a JSON object to a file.
path - Path to save the booster to.
pub fn json_dump(&self) -> Result<String, ForustError>
Dump a booster as a JSON object.
pub fn from_json(json_str: &str) -> Result<Self, ForustError>
Load a booster from a JSON string.
json_str - A JSON string representing a serialized booster.
pub fn load_booster(path: &str) -> Result<Self, ForustError>
Load a booster from a path to a JSON booster object.
path - Path to load the booster from.
pub fn set_objective_type(self, objective_type: ObjectiveType) -> Self
Set the objective_type on the booster.
objective_type - The objective type of the booster.
pub fn set_iterations(self, iterations: usize) -> Self
Set the iterations on the booster.
iterations - The number of iterations of the booster.
pub fn set_learning_rate(self, learning_rate: f32) -> Self
Set the learning_rate on the booster.
learning_rate - The learning rate of the booster.
pub fn set_max_depth(self, max_depth: usize) -> Self
Set the max_depth on the booster.
max_depth - The maximum tree depth of the booster.
pub fn set_max_leaves(self, max_leaves: usize) -> Self
Set the max_leaves on the booster.
max_leaves - The maximum number of leaves of the booster.
pub fn set_nbins(self, nbins: u16) -> Self
Set nbins on the booster.
nbins - Number of bins used to partition the data. A smaller number results in faster training, while potentially sacrificing accuracy. If there are more bins than unique values in a column, all unique values will be used.
pub fn set_l2(self, l2: f32) -> Self
Set the l2 on the booster.
l2 - The l2 regularization term of the booster.
pub fn set_gamma(self, gamma: f32) -> Self
Set the gamma on the booster.
gamma - The gamma value of the booster.
pub fn set_min_leaf_weight(self, min_leaf_weight: f32) -> Self
Set the min_leaf_weight on the booster.
min_leaf_weight - The minimum sum of the hessian values allowed in a node of a tree of the booster.
pub fn set_base_score(self, base_score: f64) -> Self
Set the base_score on the booster.
base_score - The base score of the booster.
pub fn set_initialize_base_score(self, initialize_base_score: bool) -> Self
Set initialize_base_score on the booster.
initialize_base_score - Whether the base_score should be calculated at fit time in accordance with the objective_type.
pub fn set_parallel(self, parallel: bool) -> Self
Set parallel on the booster.
parallel - Set whether the booster should be trained in parallel.
pub fn set_allow_missing_splits(self, allow_missing_splits: bool) -> Self
Set allow_missing_splits on the booster.
allow_missing_splits - Set whether missing splits are allowed for the booster.
pub fn set_monotone_constraints(
    self,
    monotone_constraints: Option<ConstraintMap>
) -> Self
Set the monotone_constraints on the booster.
monotone_constraints - The monotone constraints of the booster.
pub fn set_subsample(self, subsample: f32) -> Self
Set the subsample on the booster.
subsample - Percent of the data to randomly sample when training each tree.
pub fn set_seed(self, seed: u64) -> Self
Set the seed on the booster.
seed - Integer value used to seed any randomness used in the algorithm.
pub fn set_missing(self, missing: f64) -> Self
Set the missing value of the booster.
missing - Float value to consider as missing.
pub fn set_create_missing_branch(self, create_missing_branch: bool) -> Self
Set create_missing_branch on the booster.
create_missing_branch - Bool specifying whether missing values should get their own branch.
pub fn set_sample_method(self, sample_method: SampleMethod) -> Self
Set the sample method on the booster.
sample_method - The sample method to use when training.
pub fn set_evaluation_metric(self, evaluation_metric: Option<Metric>) -> Self
Set the evaluation metric on the booster.
evaluation_metric - The evaluation metric to record at each iteration.
pub fn set_early_stopping_rounds(
    self,
    early_stopping_rounds: Option<usize>
) -> Self
Set early stopping rounds.
early_stopping_rounds - Number of rounds in which the evaluation metric value must improve to keep training.
pub fn set_prediction_iteration(
    self,
    prediction_iteration: Option<usize>
) -> Self
Set the prediction iteration.
prediction_iteration - Number of trees to use when predicting; defaults to best_iteration if that is defined.
pub fn insert_metadata(&mut self, key: String, value: String)
Insert metadata.
key - String value for the metadata key.
value - Value to assign to the metadata key.
pub fn get_metadata(&self, key: &String) -> Option<String>
Get metadata.
key - The metadata key whose associated value to retrieve.