Struct linfa_trees::DecisionTree

source · [−]

pub struct DecisionTree<F: Float, L: Label> { /* private fields */ }

Expand description

A fitted decision tree model for classification.

Structure

A decision tree structure is a binary tree where:

Each internal node specifies a decision, represented by a choice of a feature and a “split value” such that all observations for which feature <= split_value is true fall in the left subtree, while the others fall in the right subtree.
Each leaf node makes a prediction, which is the most common label among the observations in that node.

Algorithm

Starting with a single root node, decision trees are trained recursively by applying the following rule to every node considered:

Find the best split value for each feature of the observations belonging in the node;
Select the feature (and its best split value) that maximizes the quality of the split;
If the score of the split is sufficiently larger than the score of the unsplit node, then two child nodes are generated, the left one containing all observations with feature <= split_value and the right one containing the rest;
If no suitable split is found, the node is marked as a leaf and its prediction is set to be the most common label in the node.

The quality score used can be specified in the parameters.

To predict the label of a sample, the tree is traversed from the root to a leaf, choosing between left and right children according to the values of the features of the sample. The final prediction for the sample is the prediction of the reached leaf.

Additional constraints

In order to avoid overfitting the training data, some additional constraints on the quality/quantity of splits can be added to the tree. A description of these additional rules is provided in the parameters page.

Example

Here is an example of how to train a decision tree from its parameters:


use linfa_trees::DecisionTree;
use linfa::prelude::*;
use linfa_datasets;

// Load the dataset
let dataset = linfa_datasets::iris();
// Fit the tree
let tree = DecisionTree::params().fit(&dataset).unwrap();
// Get accuracy on training set
let accuracy = tree.predict(&dataset).confusion_matrix(&dataset).unwrap().accuracy();

assert!(accuracy > 0.9);

Struct linfa_trees::DecisionTree

Implementations

impl<F: Float, L: Label> DecisionTree<F, L>

pub fn iter_nodes(&self) -> NodeIter<'_, F, L>

Notable traits for NodeIter<'a, F, L>:
impl<'a, F: Float, L: Debug + Label> Iterator for NodeIter<'a, F, L>
type Item = &'a TreeNode<F, L>;

pub fn features(&self) -> Vec<usize>

pub fn mean_impurity_decrease(&self) -> Vec<F>

pub fn relative_impurity_decrease(&self) -> Vec<F>

pub fn feature_importance(&self) -> Vec<F>

pub fn root_node(&self) -> &TreeNode<F, L>

pub fn max_depth(&self) -> usize

pub fn num_leaves(&self) -> usize

pub fn export_to_tikz(&self) -> Tikz<'_, F, L>

impl<F: Float, L: Label> DecisionTree<F, L>

pub fn params() -> DecisionTreeParams<F, L>

Trait Implementations

impl<F: Clone + Float, L: Clone + Label> Clone for DecisionTree<F, L>

fn clone(&self) -> DecisionTree<F, L>

fn clone_from(&mut self, source: &Self)

impl<F: Debug + Float, L: Debug + Label> Debug for DecisionTree<F, L>

fn fmt(&self, f: &mut Formatter<'_>) -> Result

impl<F: PartialEq + Float, L: PartialEq + Label> PartialEq<DecisionTree<F, L>> for DecisionTree<F, L>

fn eq(&self, other: &DecisionTree<F, L>) -> bool

fn ne(&self, other: &DecisionTree<F, L>) -> bool

impl<F: Float, L: Label + Default, D: Data<Elem = F>> PredictInplace<ArrayBase<D, Dim<[usize; 2]>>, ArrayBase<OwnedRepr<L>, Dim<[usize; 1]>>> for DecisionTree<F, L>

fn predict_inplace(&self, x: &ArrayBase<D, Ix2>, y: &mut Array1<L>)

fn default_target(&self, x: &ArrayBase<D, Ix2>) -> Array1<L>

impl<F: Float, L: Label> StructuralPartialEq for DecisionTree<F, L>

Auto Trait Implementations

impl<F, L> RefUnwindSafe for DecisionTree<F, L> where F: RefUnwindSafe, L: RefUnwindSafe,

impl<F, L> Send for DecisionTree<F, L> where L: Send,

impl<F, L> Sync for DecisionTree<F, L> where L: Sync,

impl<F, L> Unpin for DecisionTree<F, L> where L: Unpin,

impl<F, L> UnwindSafe for DecisionTree<F, L> where F: UnwindSafe, L: UnwindSafe,

Blanket Implementations

impl<T> Any for T where T: 'static + ?Sized,

fn type_id(&self) -> TypeId

impl<T> Borrow<T> for T where T: ?Sized,

fn borrow(&self) -> &T

impl<T> BorrowMut<T> for T where T: ?Sized,

fn borrow_mut(&mut self) -> &mut T

impl<T> From<T> for T

fn from(t: T) -> T

impl<T, U> Into<U> for T where U: From<T>,

fn into(self) -> U

impl<T> Pointable for T

const ALIGN: usize = mem::align_of::<T>()

type Init = T

unsafe fn init(init: <T as Pointable>::Init) -> usize

unsafe fn deref<'a>(ptr: usize) -> &'a T

unsafe fn deref_mut<'a>(ptr: usize) -> &'a mut T

unsafe fn drop(ptr: usize)

impl<'a, F, D, DM, T, O> Predict<&'a ArrayBase<D, DM>, T> for O where D: Data<Elem = F>, DM: Dimension, O: PredictInplace<ArrayBase<D, DM>, T>,

fn predict(&self, records: &'a ArrayBase<D, DM>) -> T

impl<'a, F, R, T, S, O> Predict<&'a DatasetBase<R, T>, S> for O where R: Records<Elem = F>, O: PredictInplace<R, S>,

fn predict(&self, ds: &'a DatasetBase<R, T>) -> S

impl<F, D, E, T, O> Predict<ArrayBase<D, Dim<[usize; 2]>>, DatasetBase<ArrayBase<D, Dim<[usize; 2]>>, T>> for O where D: Data<Elem = F>, T: AsTargets<Elem = E>, O: PredictInplace<ArrayBase<D, Dim<[usize; 2]>>, T>,

fn predict(&self, records: ArrayBase<D, Dim<[usize; 2]>>) -> DatasetBase<ArrayBase<D, Dim<[usize; 2]>>, T>

impl<F, R, T, E, S, O> Predict<DatasetBase<R, T>, DatasetBase<R, S>> for O where R: Records<Elem = F>, S: AsTargets<Elem = E>, O: PredictInplace<R, S>,

fn predict(&self, ds: DatasetBase<R, T>) -> DatasetBase<R, S>

impl<T> ToOwned for T where T: Clone,

type Owned = T

fn to_owned(&self) -> T

fn clone_into(&self, target: &mut T)

impl<T, U> TryFrom<U> for T where U: Into<T>,

type Error = Infallible

fn try_from(value: U) -> Result<T, <T as TryFrom<U>>::Error>

impl<T, U> TryInto<U> for T where U: TryFrom<T>,

type Error = <U as TryFrom<T>>::Error

fn try_into(self) -> Result<U, <U as TryFrom<T>>::Error>

impl<V, T> VZip<V> for T where V: MultiLane<T>,

fn vzip(self) -> V

pub fn iter_nodes(&self) -> NodeIter<'_, F, L>

Notable traits for NodeIter<'a, F, L>:
impl<'a, F: Float, L: Debug + Label> Iterator for NodeIter<'a, F, L>
type Item = &'a TreeNode<F, L>;

impl<F: Float, L: Label + Default, D: Data<Elem = F>> PredictInplace<ArrayBase<D, Dim<[usize ; 2]>>, ArrayBase<OwnedRepr<L>, Dim<[usize ; 1]>>> for DecisionTree<F, L>

impl<F, L> RefUnwindSafe for DecisionTree<F, L> where
F: RefUnwindSafe,
L: RefUnwindSafe,

impl<F, L> Send for DecisionTree<F, L> where
L: Send,

impl<F, L> Sync for DecisionTree<F, L> where
L: Sync,

impl<F, L> Unpin for DecisionTree<F, L> where
L: Unpin,

impl<F, L> UnwindSafe for DecisionTree<F, L> where
F: UnwindSafe,
L: UnwindSafe,

impl<T> Any for T where
T: 'static + ?Sized,

impl<T> Borrow<T> for T where
T: ?Sized,

impl<T> BorrowMut<T> for T where
T: ?Sized,

impl<T, U> Into<U> for T where
U: From<T>,

impl<'a, F, D, DM, T, O> Predict<&'a ArrayBase<D, DM>, T> for O where
D: Data<Elem = F>,
DM: Dimension,
O: PredictInplace<ArrayBase<D, DM>, T>,

impl<'a, F, R, T, S, O> Predict<&'a DatasetBase<R, T>, S> for O where
R: Records<Elem = F>,
O: PredictInplace<R, S>,

impl<F, D, E, T, O> Predict<ArrayBase<D, Dim<[usize ; 2]>>, DatasetBase<ArrayBase<D, Dim<[usize ; 2]>>, T>> for O where
D: Data<Elem = F>,
T: AsTargets<Elem = E>,
O: PredictInplace<ArrayBase<D, Dim<[usize ; 2]>>, T>,

fn predict(
&self,
records: ArrayBase<D, Dim<[usize ; 2]>>
) -> DatasetBase<ArrayBase<D, Dim<[usize ; 2]>>, T>

impl<F, R, T, E, S, O> Predict<DatasetBase<R, T>, DatasetBase<R, S>> for O where
R: Records<Elem = F>,
S: AsTargets<Elem = E>,
O: PredictInplace<R, S>,

impl<T> ToOwned for T where
T: Clone,

impl<T, U> TryFrom<U> for T where
U: Into<T>,

impl<T, U> TryInto<U> for T where
U: TryFrom<T>,

impl<V, T> VZip<V> for T where
V: MultiLane<T>,