Struct linfa::dataset::DatasetBase

source · [−]

pub struct DatasetBase<R, T> where
    R: Records,  {
    pub records: R,
    pub targets: T,
    pub weights: Array1<f32>,
    /* private fields */
}

Expand description

DatasetBase

This is the fundamental structure of a dataset. It contains a number of records about the data and may contain targets, weights and feature names. To keep the type complexity low, the dataset base is generic only over the records and targets, and introduces a trait bound on the records. The weights and feature_names, on the other hand, are always assumed to be owned and are copied when views are created.

Fields

records: a two-dimensional matrix with dimensionality (nsamples, nfeatures); in the case of kernel methods, a square matrix with dimensionality (nsamples, nsamples), which may be sparse
targets: a one- or two-dimensional matrix with dimensionality (nsamples, ntargets)
weights: optional weights for each sample with dimensionality (nsamples)
feature_names: optional descriptive feature names with dimensionality (nfeatures)

Trait bounds

R: Records: generic over feature matrices or kernel matrices
T: generic over any ndarray matrix which can be used as targets. The AsTargets trait bound is omitted here to avoid repetition in the implementation (src/dataset/impl_dataset.rs)

Fields

records: R
targets: T
weights: Array1<f32>

Struct linfa::dataset::DatasetBase

Fields

Implementations

impl<F: Float, D: Data<Elem = F>, T> DatasetBase<ArrayBase<D, Ix2>, T>

pub fn pearson_correlation(&self) -> PearsonCorrelation<F>

pub fn pearson_correlation_with_p_value( &self, num_iter: usize) -> PearsonCorrelation<F>

impl<R: Records, S> DatasetBase<R, S>

pub fn new(records: R, targets: S) -> DatasetBase<R, S>

pub fn targets(&self) -> &S

pub fn weights(&self) -> Option<&[f32]>

pub fn weight_for(&self, idx: usize) -> f32

pub fn feature_names(&self) -> Vec<String>

pub fn records(&self) -> &R

pub fn with_records<T: Records>(self, records: T) -> DatasetBase<T, S>

pub fn with_targets<T>(self, targets: T) -> DatasetBase<R, T>

pub fn with_weights(self, weights: Array1<f32>) -> DatasetBase<R, S>

pub fn with_feature_names<I: Into<String>>( self, names: Vec<I>) -> DatasetBase<R, S>

impl<L, R: Records, T: AsTargets<Elem = L>> DatasetBase<R, T>

pub fn map_targets<S, G: FnMut(&L) -> S>( self, fnc: G) -> DatasetBase<R, Array<S, T::Ix>>

pub fn ntargets(&self) -> usize

impl<'a, F, L, D, T> DatasetBase<ArrayBase<D, Ix2>, T> where D: Data<Elem = F>, T: AsTargets<Elem = L>,

pub fn sample_iter(&'a self) -> Iter<'a, '_, F, T::Elem, T::Ix>

impl<'a, F: 'a, L: 'a, D, T> DatasetBase<ArrayBase<D, Ix2>, T> where D: Data<Elem = F>, T: AsTargets<Elem = L> + FromTargetArray<'a>,

pub fn view(&'a self) -> DatasetBase<ArrayView2<'a, F>, T::View>

pub fn feature_iter(&'a self) -> DatasetIter<'a, '_, ArrayBase<D, Ix2>, T>

pub fn target_iter(&'a self) -> DatasetIter<'a, '_, ArrayBase<D, Ix2>, T>

impl<'a, L: 'a, F, T> DatasetBase<ArrayView2<'a, F>, T> where T: AsTargets<Elem = L> + FromTargetArray<'a>,

pub fn split_with_ratio( &'a self, ratio: f32) -> (DatasetBase<ArrayView2<'a, F>, T::View>, DatasetBase<ArrayView2<'a, F>, T::View>)

impl<'a, 'b: 'a, F, L: Label, T, D> DatasetBase<ArrayBase<D, Ix2>, T> where D: Data<Elem = F>, T: AsSingleTargets<Elem = L> + Labels<Elem = L>,

pub fn one_vs_all( &self) -> Result<Vec<(L, DatasetBase<ArrayView2<'_, F>, CountedTargets<bool, Array1<bool>>>)>>

impl<L: Label, R: Records, S: AsTargets<Elem = L>> DatasetBase<R, S>

pub fn label_frequencies_with_mask(&self, mask: &[bool]) -> HashMap<L, f32>

pub fn label_frequencies(&self) -> HashMap<L, f32>

impl<'b, F: Clone, E: Copy + 'b, D, T> DatasetBase<ArrayBase<D, Ix2>, T> where D: Data<Elem = F>, T: FromTargetArray<'b, Elem = E>, T::Owned: AsTargets,

pub fn bootstrap<R: Rng>( &'b self, sample_feature_size: (usize, usize), rng: &'b mut R) -> impl Iterator<Item = DatasetBase<Array2<F>, <T as FromTargetArray<'b>>::Owned>> + 'b

pub fn bootstrap_samples<R: Rng>( &'b self, num_samples: usize, rng: &'b mut R) -> impl Iterator<Item = DatasetBase<Array2<F>, <T as FromTargetArray<'b>>::Owned>> + 'b

pub fn bootstrap_features<R: Rng>( &'b self, num_features: usize, rng: &'b mut R) -> impl Iterator<Item = DatasetBase<Array2<F>, <T as FromTargetArray<'b>>::Owned>> + 'b

pub fn shuffle<R: Rng>(&self, rng: &mut R) -> DatasetBase<Array2<F>, T::Owned>

pub fn fold( &self, k: usize) -> Vec<(DatasetBase<Array2<F>, T::Owned>, DatasetBase<Array2<F>, T::Owned>)>

pub fn sample_chunks<'a: 'b>( &'b self, chunk_size: usize) -> ChunksIter<'b, 'a, F, T>

pub fn to_owned(&self) -> DatasetBase<Array2<F>, T::Owned>

impl<'a, F: 'a + Clone, E: Copy + 'a, D, S, I: TargetDim> DatasetBase<ArrayBase<D, Ix2>, ArrayBase<S, I>> where D: DataMut<Elem = F>, S: DataMut<Elem = E>,

pub fn iter_fold<O, C: Fn(&DatasetView<'_, F, E, I>) -> O>( &'a mut self, k: usize, fit_closure: C) -> impl Iterator<Item = (O, DatasetBase<ArrayView2<'_, F>, ArrayView<'_, E, I>>)>

impl<'a, F: 'a + Clone, E: Copy + 'a, D, S> DatasetBase<ArrayBase<D, Ix2>, ArrayBase<S, Ix1>> where D: DataMut<Elem = F>, S: DataMut<Elem = E>,

impl<F, E, I: TargetDim> DatasetBase<ArrayBase<OwnedRepr<F>, Dim<[usize; 2]>>, ArrayBase<OwnedRepr<E>, I>>

pub fn split_with_ratio(self, ratio: f32) -> (Self, Self)

impl<F: Copy, L: Copy + Label, D, T> DatasetBase<ArrayBase<D, Ix2>, T> where D: Data<Elem = F>, T: AsTargets<Elem = L>,

pub fn with_labels( &self, labels: &[L]) -> DatasetBase<Array2<F>, CountedTargets<L, Array<L, T::Ix>>>

Trait Implementations

impl<L, R: Records, T: AsTargets<Elem = L>> AsTargets for DatasetBase<R, T>

type Elem = L

type Ix = <T as AsTargets>::Ix

fn as_targets(&self) -> ArrayView<'_, Self::Elem, Self::Ix>

impl<L, R: Records, T: AsTargetsMut<Elem = L>> AsTargetsMut for DatasetBase<R, T>

type Elem = L

type Ix = <T as AsTargetsMut>::Ix

fn as_targets_mut(&mut self) -> ArrayViewMut<'_, Self::Elem, Self::Ix>

impl<R: Records, R2: Records, T: AsSingleTargets<Elem = bool>, T2: AsSingleTargets<Elem = Pr>> BinaryClassification<&'_ DatasetBase<R, T>> for DatasetBase<R2, T2>

fn log_loss(&self, y: &DatasetBase<R, T>) -> Result<f32>

fn roc(&self, y: &DatasetBase<R, T>) -> Result<ReceiverOperatingCharacteristic>

impl<R: Clone, T: Clone> Clone for DatasetBase<R, T> where R: Records,

fn clone(&self) -> DatasetBase<R, T>

fn clone_from(&mut self, source: &Self)

impl<R: Debug, T: Debug> Debug for DatasetBase<R, T> where R: Records,

fn fmt(&self, f: &mut Formatter<'_>) -> Result

impl<F, E, D, S, I: TargetDim> From<(ArrayBase<D, Dim<[usize; 2]>>, ArrayBase<S, I>)> for DatasetBase<ArrayBase<D, Ix2>, ArrayBase<S, I>> where D: Data<Elem = F>, S: Data<Elem = E>,

fn from(rec_tar: (ArrayBase<D, Ix2>, ArrayBase<S, I>)) -> Self

impl<F, D: Data<Elem = F>, I: Dimension> From<ArrayBase<D, I>> for DatasetBase<ArrayBase<D, I>, Array1<()>>

fn from(records: ArrayBase<D, I>) -> Self

impl<L: Label, T: Labels<Elem = L>, R: Records> Labels for DatasetBase<R, T>

type Elem = L

fn label_count(&self) -> Vec<HashMap<L, usize>>

fn label_set(&self) -> Vec<HashSet<Self::Elem>>

fn labels(&self) -> Vec<Self::Elem>

impl<F: Float, T: AsMultiTargets<Elem = F>, T2: AsMultiTargets<Elem = F>, D: Data<Elem = F>> MultiTargetRegression<F, T2> for DatasetBase<ArrayBase<D, Ix2>, T>

fn max_error(&self, other: &T) -> Result<Array1<F>>

fn mean_absolute_error(&self, other: &T) -> Result<Array1<F>>

fn mean_squared_error(&self, other: &T) -> Result<Array1<F>>

fn mean_squared_log_error(&self, other: &T) -> Result<Array1<F>>

fn median_absolute_error(&self, other: &T) -> Result<Array1<F>>

pub fn pearson_correlation_with_p_value(
&self,
num_iter: usize
) -> PearsonCorrelation<F>

pub fn with_feature_names<I: Into<String>>(
self,
names: Vec<I>
) -> DatasetBase<R, S>

pub fn map_targets<S, G: FnMut(&L) -> S>(
self,
fnc: G
) -> DatasetBase<R, Array<S, T::Ix>>

impl<'a, F, L, D, T> DatasetBase<ArrayBase<D, Ix2>, T> where
D: Data<Elem = F>,
T: AsTargets<Elem = L>,

impl<'a, F: 'a, L: 'a, D, T> DatasetBase<ArrayBase<D, Ix2>, T> where
D: Data<Elem = F>,
T: AsTargets<Elem = L> + FromTargetArray<'a>,

impl<'a, L: 'a, F, T> DatasetBase<ArrayView2<'a, F>, T> where
T: AsTargets<Elem = L> + FromTargetArray<'a>,

pub fn split_with_ratio(
&'a self,
ratio: f32
) -> (DatasetBase<ArrayView2<'a, F>, T::View>, DatasetBase<ArrayView2<'a, F>, T::View>)

impl<'a, 'b: 'a, F, L: Label, T, D> DatasetBase<ArrayBase<D, Ix2>, T> where
D: Data<Elem = F>,
T: AsSingleTargets<Elem = L> + Labels<Elem = L>,

pub fn one_vs_all(
&self
) -> Result<Vec<(L, DatasetBase<ArrayView2<'_, F>, CountedTargets<bool, Array1<bool>>>)>>

impl<'b, F: Clone, E: Copy + 'b, D, T> DatasetBase<ArrayBase<D, Ix2>, T> where
D: Data<Elem = F>,
T: FromTargetArray<'b, Elem = E>,
T::Owned: AsTargets,

pub fn bootstrap<R: Rng>(
&'b self,
sample_feature_size: (usize, usize),
rng: &'b mut R
) -> impl Iterator<Item = DatasetBase<Array2<F>, <T as FromTargetArray<'b>>::Owned>> + 'b

pub fn bootstrap_samples<R: Rng>(
&'b self,
num_samples: usize,
rng: &'b mut R
) -> impl Iterator<Item = DatasetBase<Array2<F>, <T as FromTargetArray<'b>>::Owned>> + 'b

pub fn bootstrap_features<R: Rng>(
&'b self,
num_features: usize,
rng: &'b mut R
) -> impl Iterator<Item = DatasetBase<Array2<F>, <T as FromTargetArray<'b>>::Owned>> + 'b

pub fn fold(
&self,
k: usize
) -> Vec<(DatasetBase<Array2<F>, T::Owned>, DatasetBase<Array2<F>, T::Owned>)>

pub fn sample_chunks<'a: 'b>(
&'b self,
chunk_size: usize
) -> ChunksIter<'b, 'a, F, T>

impl<'a, F: 'a + Clone, E: Copy + 'a, D, S, I: TargetDim> DatasetBase<ArrayBase<D, Ix2>, ArrayBase<S, I>> where
D: DataMut<Elem = F>,
S: DataMut<Elem = E>,

pub fn iter_fold<O, C: Fn(&DatasetView<'_, F, E, I>) -> O>(
&'a mut self,
k: usize,
fit_closure: C
) -> impl Iterator<Item = (O, DatasetBase<ArrayView2<'_, F>, ArrayView<'_, E, I>>)>

impl<'a, F: 'a + Clone, E: Copy + 'a, D, S> DatasetBase<ArrayBase<D, Ix2>, ArrayBase<S, Ix1>> where
D: DataMut<Elem = F>,
S: DataMut<Elem = E>,

impl<F, E, I: TargetDim> DatasetBase<ArrayBase<OwnedRepr<F>, Dim<[usize; 2]>>, ArrayBase<OwnedRepr<E>, I>>

impl<F: Copy, L: Copy + Label, D, T> DatasetBase<ArrayBase<D, Ix2>, T> where
D: Data<Elem = F>,
T: AsTargets<Elem = L>,

pub fn with_labels(
&self,
labels: &[L]
) -> DatasetBase<Array2<F>, CountedTargets<L, Array<L, T::Ix>>>

impl<R: Clone, T: Clone> Clone for DatasetBase<R, T> where
R: Records,

impl<R: Debug, T: Debug> Debug for DatasetBase<R, T> where
R: Records,

impl<F, E, D, S, I: TargetDim> From<(ArrayBase<D, Dim<[usize; 2]>>, ArrayBase<S, I>)> for DatasetBase<ArrayBase<D, Ix2>, ArrayBase<S, I>> where
D: Data<Elem = F>,
S: Data<Elem = E>,

impl<R: PartialEq, T: PartialEq> PartialEq<DatasetBase<R, T>> for DatasetBase<R, T> where
R: Records,

impl<L: Label, R, R2, T, T2> ToConfusionMatrix<L, &'_ DatasetBase<R, T>> for DatasetBase<R2, T2> where
R: Records,
R2: Records,
T: AsSingleTargets<Elem = L>,
T2: AsSingleTargets<Elem = L> + Labels<Elem = L>,

fn confusion_matrix(
&self,
ground_truth: &DatasetBase<R, T>
) -> Result<ConfusionMatrix<L>>

fn confusion_matrix(
&self,
ground_truth: &DatasetBase<R, T>
) -> Result<ConfusionMatrix<L>>

impl<R, T> StructuralPartialEq for DatasetBase<R, T> where
R: Records,

impl<R, T> RefUnwindSafe for DatasetBase<R, T> where
R: RefUnwindSafe,
T: RefUnwindSafe,

impl<R, T> Send for DatasetBase<R, T> where
R: Send,
T: Send,