pub struct DataFrame { /* private fields */ }
An eager table backed by one or more Arrow RecordBatch values.
Implementations
impl DataFrame
pub fn new(columns: Vec<Series>) -> Result<DataFrame, DataFrameError>
Construct a DataFrame from a list of Series.
Chunk boundaries do not need to align across series as long as total lengths match.
pub fn from_batches(batches: Vec<RecordBatch>) -> Result<DataFrame, DataFrameError>
Construct a DataFrame from Arrow record batches (all batches must share the same schema).
pub fn from_series(series: Vec<Series>) -> Result<DataFrame, DataFrameError>
Alias for DataFrame::new.
pub fn column(&self, name: &str) -> Result<Series, DataFrameError>
Get a column by name (case-sensitive).
pub fn to_arrow(&self) -> Vec<RecordBatch>
Return the underlying Arrow batches.
pub fn lazy(&self) -> LazyFrame
Convert this eager DataFrame to a LazyFrame for query planning/execution.
pub fn select(&self, exprs: Vec<Expr>) -> Result<DataFrame, DataFrameError>
Eager select, implemented by delegating to LazyFrame.
pub fn filter(&self, predicate: Expr) -> Result<DataFrame, DataFrameError>
Eager filter, implemented by delegating to LazyFrame.
pub fn with_columns(&self, exprs: Vec<Expr>) -> Result<DataFrame, DataFrameError>
Eager with_columns, implemented by delegating to LazyFrame.
pub fn join<K>(&self, other: &DataFrame, keys: K, how: JoinType) -> Result<DataFrame, DataFrameError>
Join with another DataFrame using provided join keys.
pub fn sort(&self, by: Vec<String>, descending: Vec<bool>) -> Result<DataFrame, DataFrameError>
Sort by one or more columns.
pub fn unique(&self, subset: Option<Vec<String>>) -> Result<DataFrame, DataFrameError>
Remove duplicate rows.
pub fn fill_null<T>(&self, fill: T) -> Result<DataFrame, DataFrameError>
Fill null values using a scalar or strategy.
pub fn drop_nulls(&self, subset: Option<Vec<String>>) -> Result<DataFrame, DataFrameError>
Drop rows containing null values.
pub fn null_count(&self) -> Result<DataFrame, DataFrameError>
Count null values per column.