[][src]Struct gbdt::gradient_boost::GBDT

pub struct GBDT { /* fields omitted */ }

The gradient boosting decision tree.

Methods

impl GBDT[src]

pub fn new(conf: &Config) -> GBDT[src]

Return a new GBDT with a manually set config.

Example

use gbdt::config::Config;
use gbdt::gradient_boost::GBDT;

// set config for algorithm
let mut cfg = Config::new();
cfg.set_feature_size(3);
cfg.set_max_depth(2);
cfg.set_min_leaf_size(1);
cfg.set_loss("SquaredError");
cfg.set_iterations(2);

// initialize GBDT algorithm
let mut gbdt = GBDT::new(&cfg);

pub fn fit(&mut self, train_data: &mut DataVec)[src]

Fit the train data.

First, initialize and configure decision trees. Then train the model with certain iterations set by config.

Example

use gbdt::config::Config;
use gbdt::gradient_boost::GBDT;
use gbdt::decision_tree::{Data, DataVec, PredVec, ValueType};

// set config for algorithm
let mut cfg = Config::new();
cfg.set_feature_size(3);
cfg.set_max_depth(2);
cfg.set_min_leaf_size(1);
cfg.set_loss("SquaredError");
cfg.set_iterations(2);

// initialize GBDT algorithm
let mut gbdt = GBDT::new(&cfg);

// setup training data
let data1 = Data::new_training_data (
    vec![1.0, 2.0, 3.0],
    1.0,
    1.0,
    None
);
let data2 = Data::new_training_data (
    vec![1.1, 2.1, 3.1],
    1.0,
    1.0,
    None
);
let data3 = Data::new_training_data (
    vec![2.0, 2.0, 1.0],
    1.0,
    2.0,
    None
);
let data4 = Data::new_training_data (
    vec![2.0, 2.3, 1.2],
    1.0,
    0.0,
    None
);

let mut training_data: DataVec = Vec::new();
training_data.push(data1.clone());
training_data.push(data2.clone());
training_data.push(data3.clone());
training_data.push(data4.clone());

// train the decision trees.
gbdt.fit(&mut training_data);

pub fn predict(&self, test_data: &DataVec) -> PredVec[src]

Predict the given data.

Note that for the log likelihood loss type, the predicted value will be normalized between 0 and 1, which is the probability of label 1.

Example

use gbdt::config::Config;
use gbdt::gradient_boost::GBDT;
use gbdt::decision_tree::{Data, DataVec, PredVec, ValueType};

// set config for algorithm
let mut cfg = Config::new();
cfg.set_feature_size(3);
cfg.set_max_depth(2);
cfg.set_min_leaf_size(1);
cfg.set_loss("SquaredError");
cfg.set_iterations(2);

// initialize GBDT algorithm
let mut gbdt = GBDT::new(&cfg);

// setup training data
let data1 = Data::new_training_data (
    vec![1.0, 2.0, 3.0],
    1.0,
    1.0,
    None
);
let data2 = Data::new_training_data (
    vec![1.1, 2.1, 3.1],
    1.0,
    1.0,
    None
);
let data3 = Data::new_training_data (
    vec![2.0, 2.0, 1.0],
    1.0,
    2.0,
    None
);
let data4 = Data::new_training_data (
    vec![2.0, 2.3, 1.2],
    1.0,
    0.0,
    None
);

let mut training_data: DataVec = Vec::new();
training_data.push(data1.clone());
training_data.push(data2.clone());
training_data.push(data3.clone());
training_data.push(data4.clone());

// train the decision trees.
gbdt.fit(&mut training_data);

// setup the test data

let mut test_data: DataVec = Vec::new();
test_data.push(data1.clone());
test_data.push(data2.clone());
test_data.push(data3.clone());
test_data.push(data4.clone());

println!("{:?}", gbdt.predict(&test_data));

Panic

If the training process is not completed — that is, the number of trees that have been trained is less than the number of iterations configured in self.conf — it will panic.

pub fn predict_multiclass(
    &self,
    test_data: &DataVec,
    class_num: usize
) -> (Vec<usize>, Vec<Vec<ValueType>>)
[src]

Predict multi class data and return the probabilities for each class. The loss type should be "multi:softmax" or "multi:softprob"

test_data: the test set

class_num: the number of classes

output: the predicted class labels and the predicted probability for each class

Example

use gbdt::gradient_boost::GBDT;
use gbdt::input::{load, InputFormat};
use gbdt::decision_tree::DataVec;
let gbdt =
    GBDT::from_xgoost_dump("xgb-data/xgb_multi_softmax/gbdt.model", "multi:softmax").unwrap();
let test_file = "xgb-data/xgb_multi_softmax/dermatology.data.test";
let mut fmt = InputFormat::csv_format();
fmt.set_label_index(34);
let test_data: DataVec = load(test_file, fmt).unwrap();
let (labels, probs) = gbdt.predict_multiclass(&test_data, 6);

pub fn print_trees(&self)[src]

Print the trees for debugging.

Example

use gbdt::config::Config;
use gbdt::gradient_boost::GBDT;
use gbdt::decision_tree::{Data, DataVec, PredVec, ValueType};

// set config for algorithm
let mut cfg = Config::new();
cfg.set_feature_size(3);
cfg.set_max_depth(2);
cfg.set_min_leaf_size(1);
cfg.set_loss("SquaredError");
cfg.set_iterations(2);

// initialize GBDT algorithm
let mut gbdt = GBDT::new(&cfg);

// setup training data
let data1 = Data::new_training_data (
    vec![1.0, 2.0, 3.0],
    1.0,
    1.0,
    None
);
let data2 = Data::new_training_data (
    vec![1.1, 2.1, 3.1],
    1.0,
    1.0,
    None
);
let data3 = Data::new_training_data (
    vec![2.0, 2.0, 1.0],
    1.0,
    2.0,
    None
);
let data4 = Data::new_training_data (
    vec![2.0, 2.3, 1.2],
    1.0,
    0.0,
    None
);

let mut dv: DataVec = Vec::new();
dv.push(data1.clone());
dv.push(data2.clone());
dv.push(data3.clone());
dv.push(data4.clone());

// train the decision trees.
gbdt.fit(&mut dv);

// print the tree.
gbdt.print_trees();

pub fn save_model(&self, filename: &str) -> Result<(), Box<dyn Error>>[src]

Save the model to a file using serde.

Example

use gbdt::config::Config;
use gbdt::gradient_boost::GBDT;
use gbdt::decision_tree::{Data, DataVec, PredVec, ValueType};

// set config for algorithm
let mut cfg = Config::new();
cfg.set_feature_size(3);
cfg.set_max_depth(2);
cfg.set_min_leaf_size(1);
cfg.set_loss("SquaredError");
cfg.set_iterations(2);

// initialize GBDT algorithm
let mut gbdt = GBDT::new(&cfg);

// setup training data
let data1 = Data::new_training_data (
    vec![1.0, 2.0, 3.0],
    1.0,
    1.0,
    None
);
let data2 = Data::new_training_data (
    vec![1.1, 2.1, 3.1],
    1.0,
    1.0,
    None
);
let data3 = Data::new_training_data (
    vec![2.0, 2.0, 1.0],
    1.0,
    2.0,
    None
);
let data4 = Data::new_training_data (
    vec![2.0, 2.3, 1.2],
    1.0,
    0.0,
    None
);

let mut dv: DataVec = Vec::new();
dv.push(data1.clone());
dv.push(data2.clone());
dv.push(data3.clone());
dv.push(data4.clone());

// train the decision trees.
gbdt.fit(&mut dv);

// Save model.
// gbdt.save_model("gbdt.model");

pub fn load_model(filename: &str) -> Result<Self, Box<dyn Error>>[src]

Load the model from the file.

Example

use gbdt::gradient_boost::GBDT;
//let gbdt = GBDT::load_model("./gbdt-rs.model").unwrap();

Error

Returns an error if an exception occurs during model file parsing or deserialization.

pub fn from_xgoost_dump(
    model_file: &str,
    objective: &str
) -> Result<Self, Box<dyn Error>>
[src]

Load the model from an xgboost model dump. The xgboost model should first be converted with "convert_xgboost.py".

Example

use gbdt::gradient_boost::GBDT;
let gbdt =
    GBDT::from_xgoost_dump("xgb-data/xgb_binary_logistic/gbdt.model", "binary:logistic").unwrap();

Error

Returns an error if an exception occurs during model file parsing.

Trait Implementations

impl Default for GBDT[src]

impl Serialize for GBDT[src]

impl<'de> Deserialize<'de> for GBDT[src]

Auto Trait Implementations

impl Send for GBDT

impl Sync for GBDT

Blanket Implementations

impl<T> From<T> for T[src]

impl<T, U> Into<U> for T where
    U: From<T>, 
[src]

impl<T, U> TryFrom<U> for T where
    U: Into<T>, 
[src]

type Error = Infallible

The type returned in the event of a conversion error.

impl<T, U> TryInto<U> for T where
    U: TryFrom<T>, 
[src]

type Error = <U as TryFrom<T>>::Error

The type returned in the event of a conversion error.

impl<T> BorrowMut<T> for T where
    T: ?Sized
[src]

impl<T> Borrow<T> for T where
    T: ?Sized
[src]

impl<T> Any for T where
    T: 'static + ?Sized
[src]

impl<T> DeserializeOwned for T where
    T: Deserialize<'de>, 
[src]