Struct forust_ml::gradientbooster::GradientBooster

source ·

pub struct GradientBooster {
    pub objective_type: ObjectiveType,
    pub iterations: usize,
    pub learning_rate: f32,
    pub max_depth: usize,
    pub max_leaves: usize,
    pub l1: f32,
    pub l2: f32,
    pub gamma: f32,
    pub max_delta_step: f32,
    pub min_leaf_weight: f32,
    pub base_score: f64,
    pub nbins: u16,
    pub parallel: bool,
    pub allow_missing_splits: bool,
    pub monotone_constraints: Option<ConstraintMap>,
    pub subsample: f32,
    pub top_rate: f64,
    pub other_rate: f64,
    pub colsample_bytree: f64,
    pub seed: u64,
    pub missing: f64,
    pub create_missing_branch: bool,
    pub sample_method: SampleMethod,
    pub grow_policy: GrowPolicy,
    pub evaluation_metric: Option<Metric>,
    pub early_stopping_rounds: Option<usize>,
    pub initialize_base_score: bool,
    pub terminate_missing_features: HashSet<usize>,
    pub evaluation_history: Option<RowMajorMatrix<f64>>,
    pub best_iteration: Option<usize>,
    pub prediction_iteration: Option<usize>,
    pub missing_node_treatment: MissingNodeTreatment,
    pub log_iterations: usize,
    pub force_children_to_bound_parent: bool,
    pub trees: Vec<Tree>,
    /* private fields */
}

Expand description

Gradient Booster object

Fields§

§objective_type: ObjectiveType

The name of the objective function to optimize. Valid options include “LogLoss” to use logistic loss as the objective function, or “SquaredLoss” to use Squared Error as the objective function.

§iterations: usize

Total number of trees to train in the ensemble.

§learning_rate: f32

Step size to use at each iteration. Each leaf weight is multiplied by this number. The smaller the value, the more conservative the weights will be.

§max_depth: usize

Maximum depth of an individual tree. Valid values are 0 to infinity.

§max_leaves: usize

Maximum number of leaves allowed on a tree. Valid values are 0 to infinity. This is the total number of final nodes.

§l1: f32

L1 regularization term applied to the weights of the tree. Valid values are 0 to infinity. 0 means no regularization is applied.

§l2: f32

L2 regularization term applied to the weights of the tree. Valid values are 0 to infinity.

§gamma: f32

The minimum amount of loss required to further split a node. Valid values are 0 to infinity.

§max_delta_step: f32

Maximum delta step allowed at each leaf. This is the maximum magnitude a leaf can take. Setting to 0 results in no constraint.

§min_leaf_weight: f32

Minimum sum of the hessian values of the loss function required to be in a node.

§base_score: f64

The initial prediction value of the model.

§nbins: u16

Number of bins to calculate to partition the data. Setting this to a smaller number will result in faster training time, while potentially sacrificing accuracy. If there are more bins than unique values in a column, all unique values will be used.

§parallel: bool

§allow_missing_splits: bool

Should the algorithm allow splits that completely separate out missing and non-missing values, in the case where create_missing_branch is false? When create_missing_branch is true, setting this to true will result in the missing branch being further split.

§monotone_constraints: Option<ConstraintMap>

Constraints that are used to enforce a specific relationship between the training features and the target variable.

§subsample: f32

Percent of records to randomly sample at each iteration when training a tree.

§top_rate: f64

Used only in goss. The retain ratio of large gradient data.

§other_rate: f64

Used only in goss. The retain ratio of small gradient data.

§colsample_bytree: f64

Specify the fraction of columns that should be sampled at each iteration, valid values are in the range (0.0,1.0].

§seed: u64

Integer value used to seed any randomness used in the algorithm.

§missing: f64

Value to consider missing.

§create_missing_branch: bool

Should missing values be split out into their own separate branch?

§sample_method: SampleMethod

Specify the method by which records should be sampled when training.

§grow_policy: GrowPolicy

Growth policy to use when training a tree, this is how the next node is selected.

§evaluation_metric: Option<Metric>

Define the evaluation metric to record at each iteration.

§early_stopping_rounds: Option<usize>

Number of rounds within which the evaluation metric value must improve in order to keep training.

§initialize_base_score: bool

If this is specified, the base_score will be calculated using the sample_weight and y data in accordance with the requested objective_type.

§terminate_missing_features: HashSet<usize>

A set of features for which the missing node will always be terminated, even if allow_missing_splits is set to true. This value is only valid if create_missing_branch is also true.

§evaluation_history: Option<RowMajorMatrix<f64>>

A matrix of the evaluation history on the evaluation datasets.

§best_iteration: Option<usize>

§prediction_iteration: Option<usize>

Number of trees to use when predicting, defaults to best_iteration if this is defined.

§missing_node_treatment: MissingNodeTreatment

How the missing nodes weights should be treated at training time.

§log_iterations: usize

Should the model be trained showing output.

§force_children_to_bound_parent: bool

Should the children nodes contain the parent node in their bounds? Setting this to true will result in no children being created where the higher and lower child values are both greater than, or both less than, the parent weight.

§trees: Vec<Tree>

Struct forust_ml::gradientbooster::GradientBooster

Fields§

Implementations§

impl GradientBooster

pub fn fit( &mut self, data: &Matrix<'_, f64>, y: &[f64], sample_weight: &[f64], evaluation_data: Option<Vec<EvaluationData<'_>>> ) -> Result<(), ForustError>

pub fn fit_unweighted( &mut self, data: &Matrix<'_, f64>, y: &[f64], evaluation_data: Option<Vec<EvaluationData<'_>>> ) -> Result<(), ForustError>

pub fn predict(&self, data: &Matrix<'_, f64>, parallel: bool) -> Vec<f64>

pub fn predict_leaf_indices(&self, data: &Matrix<'_, f64>) -> Vec<usize>

pub fn predict_contributions( &self, data: &Matrix<'_, f64>, method: ContributionsMethod, parallel: bool ) -> Vec<f64>

pub fn value_partial_dependence(&self, feature: usize, value: f64) -> f64

pub fn calculate_feature_importance( &self, method: ImportanceMethod, normalize: bool ) -> HashMap<usize, f32>

pub fn save_booster(&self, path: &str) -> Result<(), ForustError>

pub fn json_dump(&self) -> Result<String, ForustError>

pub fn from_json(json_str: &str) -> Result<Self, ForustError>

pub fn load_booster(path: &str) -> Result<Self, ForustError>

pub fn set_objective_type(self, objective_type: ObjectiveType) -> Self

pub fn set_iterations(self, iterations: usize) -> Self

pub fn set_learning_rate(self, learning_rate: f32) -> Self

pub fn set_max_depth(self, max_depth: usize) -> Self

pub fn set_max_leaves(self, max_leaves: usize) -> Self

pub fn set_nbins(self, nbins: u16) -> Self

pub fn set_l1(self, l1: f32) -> Self

pub fn set_l2(self, l2: f32) -> Self

pub fn set_gamma(self, gamma: f32) -> Self

pub fn set_max_delta_step(self, max_delta_step: f32) -> Self

pub fn set_min_leaf_weight(self, min_leaf_weight: f32) -> Self

pub fn set_base_score(self, base_score: f64) -> Self

pub fn set_initialize_base_score(self, initialize_base_score: bool) -> Self

pub fn set_parallel(self, parallel: bool) -> Self

pub fn set_allow_missing_splits(self, allow_missing_splits: bool) -> Self

pub fn set_monotone_constraints( self, monotone_constraints: Option<ConstraintMap> ) -> Self

pub fn set_subsample(self, subsample: f32) -> Self

pub fn set_colsample_bytree(self, colsample_bytree: f64) -> Self

pub fn set_seed(self, seed: u64) -> Self

pub fn set_missing(self, missing: f64) -> Self

pub fn set_create_missing_branch(self, create_missing_branch: bool) -> Self

pub fn set_sample_method(self, sample_method: SampleMethod) -> Self

pub fn set_evaluation_metric(self, evaluation_metric: Option<Metric>) -> Self

pub fn set_early_stopping_rounds( self, early_stopping_rounds: Option<usize> ) -> Self

pub fn set_prediction_iteration( self, prediction_iteration: Option<usize> ) -> Self

pub fn set_terminate_missing_features( self, terminate_missing_features: HashSet<usize> ) -> Self

pub fn insert_metadata(&mut self, key: String, value: String)

pub fn get_metadata(&self, key: &String) -> Option<String>

Trait Implementations§

impl Default for GradientBooster

fn default() -> Self

impl<'de> Deserialize<'de> for GradientBooster

fn deserialize<__D>(__deserializer: __D) -> Result<Self, __D::Error> where __D: Deserializer<'de>,

impl Serialize for GradientBooster

fn serialize<__S>(&self, __serializer: __S) -> Result<__S::Ok, __S::Error> where __S: Serializer,

Auto Trait Implementations§

impl Freeze for GradientBooster

impl RefUnwindSafe for GradientBooster

impl Send for GradientBooster

impl Sync for GradientBooster

impl Unpin for GradientBooster

impl UnwindSafe for GradientBooster

Blanket Implementations§

impl<T> Any for T where T: 'static + ?Sized,

fn type_id(&self) -> TypeId

impl<T> Borrow<T> for T where T: ?Sized,

fn borrow(&self) -> &T

impl<T> BorrowMut<T> for T where T: ?Sized,

fn borrow_mut(&mut self) -> &mut T

impl<T> From<T> for T

fn from(t: T) -> T

impl<T, U> Into<U> for T where U: From<T>,

fn into(self) -> U

impl<T> IntoEither for T

fn into_either(self, into_left: bool) -> Either<Self, Self>

fn into_either_with<F>(self, into_left: F) -> Either<Self, Self> where F: FnOnce(&Self) -> bool,

impl<T> Pointable for T

const ALIGN: usize = _

type Init = T

unsafe fn init(init: <T as Pointable>::Init) -> usize

unsafe fn deref<'a>(ptr: usize) -> &'a T

unsafe fn deref_mut<'a>(ptr: usize) -> &'a mut T

unsafe fn drop(ptr: usize)

impl<T, U> TryFrom<U> for T where U: Into<T>,

type Error = Infallible

Struct forust_ml::gradientbooster::GradientBooster

fn deserialize<D>(deserializer: D) -> Result<Self, D::Error>
where D: Deserializer<'de>,

fn serialize<S>(&self, serializer: S) -> Result<S::Ok, S::Error>
where S: Serializer,

impl<T> Any for T
where T: 'static + ?Sized,

impl<T> Borrow<T> for T
where T: ?Sized,

impl<T> BorrowMut<T> for T
where T: ?Sized,

impl<T, U> Into<U> for T
where U: From<T>,

fn into_either_with<F>(self, into_left: F) -> Either<Self, Self>
where F: FnOnce(&Self) -> bool,

impl<T, U> TryFrom<U> for T
where U: Into<T>,

impl<T, U> TryInto<U> for T
where U: TryFrom<T>,

impl<V, T> VZip<V> for T
where V: MultiLane<T>,

impl<T> DeserializeOwned for T
where T: for<'de> Deserialize<'de>,