Struct polars_lazy::frame::LazyFrame[−][src]

pub struct LazyFrame { /* fields omitted */ }

Expand description

Lazy abstraction over an eager DataFrame. It really is an abstraction over a logical plan: the methods of this struct incrementally modify the logical plan until output is requested (via collect).

Implementations

impl LazyFrame[src]

pub fn new_from_parquet(
    path: String, 
    stop_after_n_rows: Option<usize>, 
    cache: bool
) -> Self

[src]

Create a LazyFrame directly from a parquet scan.

pub fn to_dot(&self, optimized: bool) -> Result<String>[src]

Get a dot language representation of the LogicalPlan.

pub fn with_projection_pushdown(self, toggle: bool) -> Self[src]

Toggle projection pushdown optimization.

pub fn with_predicate_pushdown(self, toggle: bool) -> Self[src]

Toggle predicate pushdown optimization.

pub fn with_type_coercion(self, toggle: bool) -> Self[src]

Toggle type coercion optimization.

pub fn with_simplify_expr(self, toggle: bool) -> Self[src]

Toggle expression simplification optimization.

pub fn with_aggregate_pushdown(self, toggle: bool) -> Self[src]

Toggle aggregate pushdown.

pub fn with_string_cache(self, toggle: bool) -> Self[src]

Toggle global string cache.

pub fn with_join_pruning(self, toggle: bool) -> Self[src]

Toggle join pruning optimization.

pub fn describe_plan(&self) -> String[src]

Describe the logical plan.

pub fn describe_optimized_plan(&self) -> Result<String>[src]

Describe the optimized logical plan.

pub fn sort(self, by_column: &str, reverse: bool) -> Self[src]

Add a sort operation to the logical plan.

Example

use polars_core::prelude::*;
use polars_lazy::prelude::*;

/// Sort DataFrame by 'sepal.width' column
fn example(df: DataFrame) -> LazyFrame {
      df.lazy()
        .sort("sepal.width", false)
}

pub fn sort_by_exprs(self, by_exprs: Vec<Expr>, reverse: Vec<bool>) -> Self[src]

Add a sort operation to the logical plan, sorting by one or more expressions.

Example

use polars_core::prelude::*;
use polars_lazy::prelude::*;

/// Sort DataFrame by 'sepal.width' column
fn example(df: DataFrame) -> LazyFrame {
      df.lazy()
        .sort_by_exprs(vec![col("sepal.width")], vec![false])
}

pub fn reverse(self) -> Self[src]

Reverse the DataFrame.

Example

use polars_core::prelude::*;
use polars_lazy::prelude::*;

fn example(df: DataFrame) -> LazyFrame {
      df.lazy()
        .reverse()
}

pub fn with_column_renamed(self, existing_name: &str, new_name: &str) -> Self[src]

Rename a column in the DataFrame.

pub fn shift(self, periods: i64) -> Self[src]

Shift the values by a given period and fill the parts that will be empty due to this operation with Nones.

See the method on Series for more info on the shift operation.

pub fn shift_and_fill(self, periods: i64, fill_value: Expr) -> Self[src]

Shift the values by a given period and fill the parts that will be empty due to this operation with the result of the fill_value expression.

See the method on Series for more info on the shift operation.

pub fn fill_none(self, fill_value: Expr) -> LazyFrame[src]

Fill none values in the DataFrame with the given fill_value expression.

pub fn cache(self) -> Self[src]

Cache the result into a new LazyFrame. This should be used to prevent computations from running multiple times.

pub fn fetch(self, n_rows: usize) -> Result<DataFrame>[src]

Fetch is like a collect operation, but it overwrites the number of rows read by every scan operation. This is a utility that helps debug a query on a smaller number of rows.

Note that the fetch does not guarantee the final number of rows in the DataFrame. Filter, join operations and a lower number of rows available in the scanned file influence the final number of rows.

pub fn optimize(
    self, 
    lp_arena: &mut Arena<ALogicalPlan>, 
    expr_arena: &mut Arena<AExpr>
) -> Result<Node>

[src]

pub fn collect(self) -> Result<DataFrame>[src]

Execute all the lazy operations and collect them into a DataFrame. The query is optimized before execution.

Example

use polars_core::prelude::*;
use polars_lazy::prelude::*;

fn example(df: DataFrame) -> Result<DataFrame> {
      df.lazy()
        .groupby(vec![col("foo")])
        .agg(vec!(col("bar").sum(),
                  col("ham").mean().alias("avg_ham")))
        .collect()
}

pub fn filter(self, predicate: Expr) -> Self[src]

Filter by some predicate expression.

Example

use polars_core::prelude::*;
use polars_lazy::prelude::*;

fn example(df: DataFrame) -> LazyFrame {
      df.lazy()
        .filter(col("sepal.width").is_not_null())
        .select(&[col("sepal.width"), col("sepal.length")])
}

pub fn select<E: AsRef<[Expr]>>(self, exprs: E) -> Self[src]

Select (and rename) columns from the query.

Columns can be selected with col; if you want to select all columns, use col("*").

Example

use polars_core::prelude::*;
use polars_lazy::prelude::*;

/// This function selects column "foo" and column "bar".
/// Column "bar" is renamed to "ham".
fn example(df: DataFrame) -> LazyFrame {
      df.lazy()
        .select(&[col("foo"),
                  col("bar").alias("ham")])
}

/// This function selects all columns except "foo"
fn exclude_a_column(df: DataFrame) -> LazyFrame {
      df.lazy()
        .select(&[col("*"),
                  except("foo")])
}

pub fn groupby(self, by: Vec<Expr>) -> LazyGroupBy[src]

Group by and aggregate.

Example

use polars_core::prelude::*;
use polars_lazy::prelude::*;

fn example(df: DataFrame) -> LazyFrame {
      df.lazy()
       .groupby(vec![col("date")])
       .agg(vec![
           col("rain").min(),
           col("rain").sum(),
           col("rain").quantile(0.5).alias("median_rain"),
       ])
       .sort("date", false)
}

pub fn left_join(
    self, 
    other: LazyFrame, 
    left_on: Expr, 
    right_on: Expr
) -> LazyFrame

[src]

Left join this query with another lazy query.

Example

use polars_core::prelude::*;
use polars_lazy::prelude::*;
fn join_dataframes(ldf: LazyFrame, other: LazyFrame) -> LazyFrame {
        ldf
        .left_join(other, col("foo"), col("bar"))
}

pub fn outer_join(
    self, 
    other: LazyFrame, 
    left_on: Expr, 
    right_on: Expr
) -> LazyFrame

[src]

Outer join this query with another lazy query.

Example

use polars_core::prelude::*;
use polars_lazy::prelude::*;
fn join_dataframes(ldf: LazyFrame, other: LazyFrame) -> LazyFrame {
        ldf
        .outer_join(other, col("foo"), col("bar"))
}

pub fn inner_join(
    self, 
    other: LazyFrame, 
    left_on: Expr, 
    right_on: Expr
) -> LazyFrame

[src]

Inner join this query with another lazy query.

Example

use polars_core::prelude::*;
use polars_lazy::prelude::*;
fn join_dataframes(ldf: LazyFrame, other: LazyFrame) -> LazyFrame {
        ldf
        .inner_join(other, col("foo"), col("bar").cast(DataType::Utf8))
}

pub fn join(
    self, 
    other: LazyFrame, 
    left_on: Vec<Expr>, 
    right_on: Vec<Expr>, 
    how: JoinType
) -> LazyFrame

[src]

Generic join function that can join on multiple columns.

Example

use polars_core::prelude::*;
use polars_lazy::prelude::*;

fn example(ldf: LazyFrame, other: LazyFrame) -> LazyFrame {
        ldf
        .join(other, vec![col("foo"), col("bar")], vec![col("foo"), col("bar")], JoinType::Inner)
}

pub fn join_builder(self) -> JoinBuilder[src]

pub fn with_column(self, expr: Expr) -> LazyFrame[src]

Add a column to a DataFrame.

Example

use polars_core::prelude::*;
use polars_lazy::prelude::*;
fn add_column(df: DataFrame) -> LazyFrame {
    df.lazy()
        .with_column(
            when(col("sepal.length").lt(lit(5.0)))
            .then(lit(10))
            .otherwise(lit(1))
            .alias("new_column_name"),
            )
}

pub fn with_columns(self, exprs: Vec<Expr>) -> LazyFrame[src]

Add multiple columns to a DataFrame.

Example

use polars_core::prelude::*;
use polars_lazy::prelude::*;
fn add_columns(df: DataFrame) -> LazyFrame {
    df.lazy()
        .with_columns(
            vec![lit(10).alias("foo"), lit(100).alias("bar")]
         )
}

pub fn max(self) -> LazyFrame[src]

Aggregate all the columns as their maximum values.

pub fn min(self) -> LazyFrame[src]

Aggregate all the columns as their minimum values.

pub fn sum(self) -> LazyFrame[src]

Aggregate all the columns as their sum values.

pub fn mean(self) -> LazyFrame[src]

Aggregate all the columns as their mean values.

pub fn median(self) -> LazyFrame[src]

Aggregate all the columns as their median values.

pub fn quantile(self, quantile: f64) -> LazyFrame[src]

Aggregate all the columns as their quantile values.

pub fn std(self) -> LazyFrame[src]

Aggregate all the columns as their standard deviation values.

pub fn var(self) -> LazyFrame[src]

Aggregate all the columns as their variance values.

pub fn explode(self, columns: &[Expr]) -> LazyFrame[src]

Apply explode operation. See eager explode.

pub fn drop_duplicates(
    self, 
    maintain_order: bool, 
    subset: Option<Vec<String>>
) -> LazyFrame

[src]

Drop duplicate rows. See the eager DataFrame equivalent for details.

pub fn drop_nulls(self, subset: Option<Vec<Expr>>) -> LazyFrame[src]

Drop null rows.

Equal to LazyFrame::filter(col("*").is_not_null())

pub fn slice(self, offset: i64, len: usize) -> LazyFrame[src]

Slice the DataFrame.

pub fn first(self) -> LazyFrame[src]

Get the first row.

pub fn last(self) -> LazyFrame[src]

Get the last row.

pub fn tail(self, n: usize) -> LazyFrame[src]

Get the last n rows.

pub fn melt(self, id_vars: Vec<String>, value_vars: Vec<String>) -> LazyFrame[src]

Melt the DataFrame from wide to long format.

pub fn limit(self, n: usize) -> LazyFrame[src]

Limit the DataFrame to the first n rows. Note that if you don’t want the rows to be scanned, use fetch.

pub fn map<F>(
    self, 
    function: F, 
    optimizations: Option<AllowedOptimizations>, 
    schema: Option<Schema>
) -> LazyFrame where
    F: DataFrameUdf + 'static,

[src]

Apply a function/closure once the logical plan gets executed.

Warning

This can blow up in your face if the schema is changed due to the operation. The optimizer relies on a correct schema.

You can toggle certain optimizations off.

Trait Implementations

impl Clone for LazyFrame[src]

fn clone(&self) -> LazyFrame[src]

Returns a copy of the value. Read more

fn clone_from(&mut self, source: &Self)1.0.0 [src]

Performs copy-assignment from source. Read more

impl Default for LazyFrame[src]

fn default() -> Self[src]

Returns the “default value” for a type. Read more

impl From<LogicalPlan> for LazyFrame[src]

fn from(plan: LogicalPlan) -> Self[src]

Performs the conversion.

Auto Trait Implementations

impl !RefUnwindSafe for LazyFrame

impl Send for LazyFrame

impl Sync for LazyFrame

impl Unpin for LazyFrame

impl !UnwindSafe for LazyFrame

Blanket Implementations

impl<T> Any for T where
    T: 'static + ?Sized,

[src]

pub fn type_id(&self) -> TypeId[src]

Gets the TypeId of self. Read more

impl<T> Borrow<T> for T where
    T: ?Sized,

[src]

pub fn borrow(&self) -> &T[src]

Immutably borrows from an owned value. Read more

impl<T> BorrowMut<T> for T where
    T: ?Sized,

[src]

pub fn borrow_mut(&mut self) -> &mut T[src]

Mutably borrows from an owned value. Read more

impl<T> From<T> for T[src]

pub fn from(t: T) -> T[src]

Performs the conversion.

impl<T, U> Into<U> for T where
    U: From<T>,

[src]

pub fn into(self) -> U[src]

Performs the conversion.

impl<T> Pointable for T

pub const ALIGN: usize

The alignment of pointer.

type Init = T

The type for initializers.

pub unsafe fn init(init: <T as Pointable>::Init) -> usize

Initializes an object with the given initializer. Read more

pub unsafe fn deref<'a>(ptr: usize) -> &'a T

Dereferences the given pointer. Read more

pub unsafe fn deref_mut<'a>(ptr: usize) -> &'a mut T

Mutably dereferences the given pointer. Read more

pub unsafe fn drop(ptr: usize)

Drops the object pointed to by the given pointer. Read more

impl<T> ToOwned for T where
    T: Clone,

[src]

type Owned = T

The resulting type after obtaining ownership.

pub fn to_owned(&self) -> T[src]

Creates owned data from borrowed data, usually by cloning. Read more

pub fn clone_into(&self, target: &mut T)[src]

🔬 This is a nightly-only experimental API. (toowned_clone_into)

recently added

Uses borrowed data to replace owned data, usually by cloning. Read more

impl<T, U> TryFrom<U> for T where
    U: Into<T>,

[src]

type Error = Infallible

The type returned in the event of a conversion error.

pub fn try_from(value: U) -> Result<T, <T as TryFrom<U>>::Error>[src]

Performs the conversion.

impl<T, U> TryInto<U> for T where
    U: TryFrom<T>,

[src]

type Error = <U as TryFrom<T>>::Error

The type returned in the event of a conversion error.

pub fn try_into(self) -> Result<U, <U as TryFrom<T>>::Error>[src]

Performs the conversion.

impl<V, T> VZip<V> for T where
    V: MultiLane<T>,

pub fn vzip(self) -> V