Skip to main content

Dataset

Struct Dataset 

Source
pub struct Dataset {
    pub data: Array2<f64>,
    pub target: Option<Array1<f64>>,
    pub targetnames: Option<Vec<String>>,
    pub featurenames: Option<Vec<String>>,
    pub feature_descriptions: Option<Vec<String>>,
    pub description: Option<String>,
    pub metadata: HashMap<String, String>,
}
Expand description

Represents a dataset with features, optional targets, and metadata.

The Dataset struct is the core data structure for managing machine learning datasets. It stores the feature matrix, optional target values, and rich metadata including feature names, descriptions, and arbitrary key-value pairs.

§Examples

use scirs2_core::ndarray::Array2;
use scirs2_datasets::utils::Dataset;

let data = Array2::from_shape_vec((3, 2), vec![1.0, 2.0, 3.0, 4.0, 5.0, 6.0]).expect("Operation failed");
let dataset = Dataset::new(data, None)
    .with_featurenames(vec!["feature1".to_string(), "feature2".to_string()])
    .with_description("Sample dataset".to_string());

assert_eq!(dataset.n_samples(), 3);
assert_eq!(dataset.n_features(), 2);

Fields§

§data: Array2<f64>

Features/data matrix (n_samples, n_features)

§target: Option<Array1<f64>>

Optional target values

§targetnames: Option<Vec<String>>

Optional target names for classification problems

§featurenames: Option<Vec<String>>

Optional feature names

§feature_descriptions: Option<Vec<String>>

Optional descriptions for each feature

§description: Option<String>

Optional dataset description

§metadata: HashMap<String, String>

Dataset metadata as arbitrary key-value pairs (always present; may be empty)

Implementations§

Source§

impl Dataset

Source

pub fn new(data: Array2<f64>, target: Option<Array1<f64>>) -> Self

Create a new dataset with the given data and target

§Arguments
  • data - The feature matrix (n_samples, n_features)
  • target - Optional target values (n_samples,)
§Returns

A new Dataset instance with empty metadata

§Examples
use scirs2_core::ndarray::{Array1, Array2};
use scirs2_datasets::utils::Dataset;

let data = Array2::zeros((100, 5));
let target = Some(Array1::zeros(100));
let dataset = Dataset::new(data, target);
Source

pub fn from_metadata( data: Array2<f64>, target: Option<Array1<f64>>, metadata: DatasetMetadata, ) -> Self

Create a new dataset with the given data, target, and metadata

§Arguments
  • data - The feature matrix (n_samples, n_features)
  • target - Optional target values (n_samples,)
  • metadata - Dataset metadata information
§Returns

A new Dataset instance with metadata applied

Source

pub fn with_targetnames(self, targetnames: Vec<String>) -> Self

Add target names to the dataset (builder pattern)

§Arguments
  • targetnames - Vector of target class names
§Returns

Self for method chaining

Source

pub fn with_featurenames(self, featurenames: Vec<String>) -> Self

Add feature names to the dataset (builder pattern)

§Arguments
  • featurenames - Vector of feature names
§Returns

Self for method chaining

Source

pub fn with_feature_descriptions(self, featuredescriptions: Vec<String>) -> Self

Add feature descriptions to the dataset (builder pattern)

§Arguments
  • featuredescriptions - Vector of feature descriptions
§Returns

Self for method chaining

Source

pub fn with_description(self, description: String) -> Self

Add a description to the dataset (builder pattern)

§Arguments
  • description - Dataset description
§Returns

Self for method chaining

Source

pub fn with_metadata(self, key: &str, value: &str) -> Self

Add metadata to the dataset (builder pattern)

§Arguments
  • key - Metadata key
  • value - Metadata value
§Returns

Self for method chaining

Source

pub fn n_samples(&self) -> usize

Get the number of samples in the dataset

§Returns

Number of samples (rows) in the dataset

Source

pub fn n_features(&self) -> usize

Get the number of features in the dataset

§Returns

Number of features (columns) in the dataset

Source

pub fn shape(&self) -> (usize, usize)

Get dataset shape as (n_samples, n_features)

§Returns

Tuple of (n_samples, n_features)

Source

pub fn has_target(&self) -> bool

Check if the dataset has target values

§Returns

True if target values are present, false otherwise

Source

pub fn featurenames(&self) -> Option<&Vec<String>>

Get a reference to the feature names if available

§Returns

Optional reference to feature names vector

Source

pub fn targetnames(&self) -> Option<&Vec<String>>

Get a reference to the target names if available

§Returns

Optional reference to target names vector

Source

pub fn description(&self) -> Option<&String>

Get a reference to the dataset description if available

§Returns

Optional reference to dataset description

Source

pub fn metadata(&self) -> &HashMap<String, String>

Get a reference to the metadata

§Returns

Reference to metadata HashMap

Source

pub fn set_metadata(&mut self, key: &str, value: &str)

Add or update a metadata entry

§Arguments
  • key - Metadata key
  • value - Metadata value
Source

pub fn get_metadata(&self, key: &str) -> Option<&String>

Get a metadata value by key

§Arguments
  • key - Metadata key to lookup
§Returns

Optional reference to the metadata value

Trait Implementations§

Source§

impl Clone for Dataset

Source§

fn clone(&self) -> Dataset

Returns a duplicate of the value. Read more
1.0.0 · Source§

fn clone_from(&mut self, source: &Self)

Performs copy-assignment from source. Read more
Source§

impl Debug for Dataset

Source§

fn fmt(&self, f: &mut Formatter<'_>) -> Result

Formats the value using the given formatter. Read more
Source§

impl<'de> Deserialize<'de> for Dataset

Source§

fn deserialize<__D>(__deserializer: __D) -> Result<Self, __D::Error>
where __D: Deserializer<'de>,

Deserialize this value from the given Serde deserializer. Read more
Source§

impl Serialize for Dataset

Source§

fn serialize<__S>(&self, __serializer: __S) -> Result<__S::Ok, __S::Error>
where __S: Serializer,

Serialize this value into the given Serde serializer. Read more

Auto Trait Implementations§

Blanket Implementations§

Source§

impl<T> Any for T
where T: 'static + ?Sized,

Source§

fn type_id(&self) -> TypeId

Gets the TypeId of self. Read more
Source§

impl<T> Borrow<T> for T
where T: ?Sized,

Source§

fn borrow(&self) -> &T

Immutably borrows from an owned value. Read more
Source§

impl<T> BorrowMut<T> for T
where T: ?Sized,

Source§

fn borrow_mut(&mut self) -> &mut T

Mutably borrows from an owned value. Read more
Source§

impl<T> CloneToUninit for T
where T: Clone,

Source§

unsafe fn clone_to_uninit(&self, dest: *mut u8)

🔬This is a nightly-only experimental API. (clone_to_uninit)
Performs copy-assignment from self to dest. Read more
Source§

impl<T> From<T> for T

Source§

fn from(t: T) -> T

Returns the argument unchanged.

Source§

impl<T> Instrument for T

Source§

fn instrument(self, span: Span) -> Instrumented<Self>

Instruments this type with the provided Span, returning an Instrumented wrapper. Read more
Source§

fn in_current_span(self) -> Instrumented<Self>

Instruments this type with the current Span, returning an Instrumented wrapper. Read more
Source§

impl<T, U> Into<U> for T
where U: From<T>,

Source§

fn into(self) -> U

Calls U::from(self).

That is, this conversion is whatever the implementation of From<T> for U chooses to do.

Source§

impl<T> IntoEither for T

Source§

fn into_either(self, into_left: bool) -> Either<Self, Self>

Converts self into a Left variant of Either<Self, Self> if into_left is true. Converts self into a Right variant of Either<Self, Self> otherwise. Read more
Source§

fn into_either_with<F>(self, into_left: F) -> Either<Self, Self>
where F: FnOnce(&Self) -> bool,

Converts self into a Left variant of Either<Self, Self> if into_left(&self) returns true. Converts self into a Right variant of Either<Self, Self> otherwise. Read more
Source§

impl<T> Pointable for T

Source§

const ALIGN: usize

The alignment of pointer.
Source§

type Init = T

The type for initializers.
Source§

unsafe fn init(init: <T as Pointable>::Init) -> usize

Initializes a value with the given initializer. Read more
Source§

unsafe fn deref<'a>(ptr: usize) -> &'a T

Dereferences the given pointer. Read more
Source§

unsafe fn deref_mut<'a>(ptr: usize) -> &'a mut T

Mutably dereferences the given pointer. Read more
Source§

unsafe fn drop(ptr: usize)

Drops the object pointed to by the given pointer. Read more
Source§

impl<T> PolicyExt for T
where T: ?Sized,

Source§

fn and<P, B, E>(self, other: P) -> And<T, P>
where T: Policy<B, E>, P: Policy<B, E>,

Create a new Policy that returns Action::Follow only if self and other return Action::Follow. Read more
Source§

fn or<P, B, E>(self, other: P) -> Or<T, P>
where T: Policy<B, E>, P: Policy<B, E>,

Create a new Policy that returns Action::Follow if either self or other returns Action::Follow. Read more
Source§

impl<T> Same for T

Source§

type Output = T

Should always be Self
Source§

impl<SS, SP> SupersetOf<SS> for SP
where SS: SubsetOf<SP>,

Source§

fn to_subset(&self) -> Option<SS>

The inverse inclusion map: attempts to convert self to the equivalent element of its subset SS, returning None if self is not part of that subset. Read more
Source§

fn is_in_subset(&self) -> bool

Checks if self is actually part of its subset SS (and can be converted to it).
Source§

fn to_subset_unchecked(&self) -> SS

Use with care! Same as self.to_subset but without any property checks. Always succeeds.
Source§

fn from_subset(element: &SS) -> SP

The inclusion map: converts element (a member of the subset SS) to the equivalent element of the superset SP.
Source§

impl<T> ToOwned for T
where T: Clone,

Source§

type Owned = T

The resulting type after obtaining ownership.
Source§

fn to_owned(&self) -> T

Creates owned data from borrowed data, usually by cloning. Read more
Source§

fn clone_into(&self, target: &mut T)

Uses borrowed data to replace owned data, usually by cloning. Read more
Source§

impl<T, U> TryFrom<U> for T
where U: Into<T>,

Source§

type Error = Infallible

The type returned in the event of a conversion error.
Source§

fn try_from(value: U) -> Result<T, <T as TryFrom<U>>::Error>

Performs the conversion.
Source§

impl<T, U> TryInto<U> for T
where U: TryFrom<T>,

Source§

type Error = <U as TryFrom<T>>::Error

The type returned in the event of a conversion error.
Source§

fn try_into(self) -> Result<U, <U as TryFrom<T>>::Error>

Performs the conversion.
Source§

impl<V, T> VZip<V> for T
where V: MultiLane<T>,

Source§

fn vzip(self) -> V

Source§

impl<T> WithSubscriber for T

Source§

fn with_subscriber<S>(self, subscriber: S) -> WithDispatch<Self>
where S: Into<Dispatch>,

Attaches the provided Subscriber to this type, returning a WithDispatch wrapper. Read more
Source§

fn with_current_subscriber(self) -> WithDispatch<Self>

Attaches the current default Subscriber to this type, returning a WithDispatch wrapper. Read more
Source§

impl<T> DeserializeOwned for T
where T: for<'de> Deserialize<'de>,