Struct polars::prelude::LazyFrame[−][src]

pub struct LazyFrame { /* fields omitted */ }

Expand description

Lazy abstraction over an eager DataFrame. More precisely, it is an abstraction over a logical plan: the methods of this struct incrementally modify the logical plan until output is requested (via collect).

Implementations

[src]

impl LazyFrame

[src]

pub fn new_from_parquet(
    path: String, 
    stop_after_n_rows: Option<usize>, 
    cache: bool
) -> LazyFrame

Create a LazyFrame directly from a parquet scan.

[src]

pub fn to_dot(&self, optimized: bool) -> Result<String, PolarsError>

Get a dot language representation of the LogicalPlan.

[src]

pub fn with_projection_pushdown(self, toggle: bool) -> LazyFrame

Toggle projection pushdown optimization.

[src]

pub fn with_predicate_pushdown(self, toggle: bool) -> LazyFrame

Toggle predicate pushdown optimization.

[src]

pub fn with_type_coercion(self, toggle: bool) -> LazyFrame

Toggle type coercion optimization.

[src]

pub fn with_simplify_expr(self, toggle: bool) -> LazyFrame

Toggle expression simplification optimization.

[src]

pub fn with_aggregate_pushdown(self, toggle: bool) -> LazyFrame

Toggle aggregate pushdown.

[src]

pub fn with_string_cache(self, toggle: bool) -> LazyFrame

Toggle global string cache.

[src]

pub fn with_join_pruning(self, toggle: bool) -> LazyFrame

Toggle join pruning optimization.

[src]

pub fn describe_plan(&self) -> String

Describe the logical plan.

[src]

pub fn describe_optimized_plan(&self) -> Result<String, PolarsError>

Describe the optimized logical plan.

[src]

pub fn sort(self, by_column: &str, reverse: bool) -> LazyFrame

Add a sort operation to the logical plan.

Example

use polars_core::prelude::*;
use polars_lazy::prelude::*;

/// Sort DataFrame by 'sepal.width' column
fn example(df: DataFrame) -> LazyFrame {
      df.lazy()
        .sort("sepal.width", false)
}

[src]

pub fn sort_by_exprs(
    self, 
    by_exprs: Vec<Expr, Global>, 
    reverse: Vec<bool, Global>
) -> LazyFrame

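Add a sort operation to the logical plan, sorting by one or more expressions. Each entry in reverse applies to the expression at the same position in by_exprs.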

Example

use polars_core::prelude::*;
use polars_lazy::prelude::*;

/// Sort DataFrame by 'sepal.width' column
fn example(df: DataFrame) -> LazyFrame {
      df.lazy()
        .sort_by_exprs(vec![col("sepal.width")], vec![false])
}

[src]

pub fn reverse(self) -> LazyFrame

Reverse the DataFrame

Example

use polars_core::prelude::*;
use polars_lazy::prelude::*;

fn example(df: DataFrame) -> LazyFrame {
      df.lazy()
        .reverse()
}

[src]

pub fn with_column_renamed(
    self, 
    existing_name: &str, 
    new_name: &str
) -> LazyFrame

Rename a column in the DataFrame

[src]

pub fn shift(self, periods: i64) -> LazyFrame

Shift the values by a given period and fill the parts that will be empty due to this operation with Nones.

See the method on Series for more info on the shift operation.

[src]

pub fn shift_and_fill(self, periods: i64, fill_value: Expr) -> LazyFrame

Shift the values by a given period and fill the parts that will be empty due to this operation with the result of the fill_value expression.

See the method on Series for more info on the shift operation.

[src]

pub fn fill_none(self, fill_value: Expr) -> LazyFrame

Fill None values in the DataFrame using the fill_value expression.

[src]

pub fn cache(self) -> LazyFrame

Caches the result into a new LazyFrame. This should be used to prevent computations from running multiple times.

[src]

pub fn fetch(self, n_rows: usize) -> Result<DataFrame, PolarsError>

Fetch is like a collect operation, but it overwrites the number of rows read by every scan operation. This is a utility that helps debug a query on a smaller number of rows.

Note that the fetch does not guarantee the final number of rows in the DataFrame. Filter, join operations and a lower number of rows available in the scanned file influence the final number of rows.

[src]

pub fn optimize(
    self, 
    lp_arena: &mut Arena<ALogicalPlan>, 
    expr_arena: &mut Arena<AExpr>
) -> Result<Node, PolarsError>

[src]

pub fn collect(self) -> Result<DataFrame, PolarsError>

Execute all the lazy operations and collect them into a DataFrame. The query is optimized before execution.

Example

use polars_core::prelude::*;
use polars_lazy::prelude::*;

fn example(df: DataFrame) -> Result<DataFrame> {
      df.lazy()
        .groupby(vec![col("foo")])
        .agg(vec!(col("bar").sum(),
                  col("ham").mean().alias("avg_ham")))
        .collect()
}

[src]

pub fn filter(self, predicate: Expr) -> LazyFrame

Filter by some predicate expression.

Example

use polars_core::prelude::*;
use polars_lazy::prelude::*;

fn example(df: DataFrame) -> LazyFrame {
      df.lazy()
        .filter(col("sepal.width").is_not_null())
        .select(&[col("sepal.width"), col("sepal.length")])
}

[src]

pub fn select<E>(self, exprs: E) -> LazyFrame where
    E: AsRef<[Expr]>,

Select (and rename) columns from the query.

Columns can be selected with col; if you want to select all columns, use col("*").

Example

use polars_core::prelude::*;
use polars_lazy::prelude::*;

/// This function selects column "foo" and column "bar".
/// Column "bar" is renamed to "ham".
fn example(df: DataFrame) -> LazyFrame {
      df.lazy()
        .select(&[col("foo"),
                  col("bar").alias("ham")])
}

/// This function selects all columns except "foo"
fn exclude_a_column(df: DataFrame) -> LazyFrame {
      df.lazy()
        .select(&[col("*"),
                  except("foo")])
}

[src]

pub fn groupby(self, by: Vec<Expr, Global>) -> LazyGroupBy

Group by and aggregate.

Example

use polars_core::prelude::*;
use polars_lazy::prelude::*;

fn example(df: DataFrame) -> LazyFrame {
      df.lazy()
       .groupby(vec![col("date")])
       .agg(vec![
           col("rain").min(),
           col("rain").sum(),
           col("rain").quantile(0.5).alias("median_rain"),
       ])
       .sort("date", false)
}

[src]

pub fn left_join(
    self, 
    other: LazyFrame, 
    left_on: Expr, 
    right_on: Expr
) -> LazyFrame

Left join this query with another lazy query.

Example

use polars_core::prelude::*;
use polars_lazy::prelude::*;
fn join_dataframes(ldf: LazyFrame, other: LazyFrame) -> LazyFrame {
        ldf
        .left_join(other, col("foo"), col("bar"))
}

[src]

pub fn outer_join(
    self, 
    other: LazyFrame, 
    left_on: Expr, 
    right_on: Expr
) -> LazyFrame

Outer join this query with another lazy query.

Example

use polars_core::prelude::*;
use polars_lazy::prelude::*;
fn join_dataframes(ldf: LazyFrame, other: LazyFrame) -> LazyFrame {
        ldf
        .outer_join(other, col("foo"), col("bar"))
}

[src]

pub fn inner_join(
    self, 
    other: LazyFrame, 
    left_on: Expr, 
    right_on: Expr
) -> LazyFrame

Inner join this query with another lazy query.

Example

use polars_core::prelude::*;
use polars_lazy::prelude::*;
fn join_dataframes(ldf: LazyFrame, other: LazyFrame) -> LazyFrame {
        ldf
        .inner_join(other, col("foo"), col("bar").cast(DataType::Utf8))
}

[src]

pub fn join(
    self, 
    other: LazyFrame, 
    left_on: Vec<Expr, Global>, 
    right_on: Vec<Expr, Global>, 
    how: JoinType
) -> LazyFrame

Generic join function that can join on multiple columns.

Example

use polars_core::prelude::*;
use polars_lazy::prelude::*;

fn example(ldf: LazyFrame, other: LazyFrame) -> LazyFrame {
        ldf
        .join(other, vec![col("foo"), col("bar")], vec![col("foo"), col("bar")], JoinType::Inner)
}

[src]

pub fn join_builder(self) -> JoinBuilder

[src]

pub fn with_column(self, expr: Expr) -> LazyFrame

Add a column to a DataFrame

Example

use polars_core::prelude::*;
use polars_lazy::prelude::*;
fn add_column(df: DataFrame) -> LazyFrame {
    df.lazy()
        .with_column(
            when(col("sepal.length").lt(lit(5.0)))
            .then(lit(10))
            .otherwise(lit(1))
            .alias("new_column_name"),
            )
}

[src]

pub fn with_columns(self, exprs: Vec<Expr, Global>) -> LazyFrame

Add multiple columns to a DataFrame.

Example

use polars_core::prelude::*;
use polars_lazy::prelude::*;
fn add_columns(df: DataFrame) -> LazyFrame {
    df.lazy()
        .with_columns(
            vec![lit(10).alias("foo"), lit(100).alias("bar")]
         )
}

[src]

pub fn max(self) -> LazyFrame

Aggregate all the columns as their maximum values.

[src]

pub fn min(self) -> LazyFrame

Aggregate all the columns as their minimum values.

[src]

pub fn sum(self) -> LazyFrame

Aggregate all the columns as their sum values.

[src]

pub fn mean(self) -> LazyFrame

Aggregate all the columns as their mean values.

[src]

pub fn median(self) -> LazyFrame

Aggregate all the columns as their median values.

[src]

pub fn quantile(self, quantile: f64) -> LazyFrame

Aggregate all the columns as their quantile values.

[src]

pub fn std(self) -> LazyFrame

Aggregate all the columns as their standard deviation values.

[src]

pub fn var(self) -> LazyFrame

Aggregate all the columns as their variance values.

[src]

pub fn explode(self, columns: &[Expr]) -> LazyFrame

Apply explode operation. See eager explode.

[src]

pub fn drop_duplicates(
    self, 
    maintain_order: bool, 
    subset: Option<Vec<String, Global>>
) -> LazyFrame

Drop duplicate rows. See the eager DataFrame equivalent for details.

[src]

pub fn drop_nulls(self, subset: Option<Vec<Expr, Global>>) -> LazyFrame

Drop null rows.

Equal to LazyFrame::filter(col("*").is_not_null())

[src]

pub fn slice(self, offset: i64, len: usize) -> LazyFrame

Slice the DataFrame.

[src]

pub fn first(self) -> LazyFrame

Get the first row.

[src]

pub fn last(self) -> LazyFrame

Get the last row.

[src]

pub fn tail(self, n: usize) -> LazyFrame

Get the last n rows.

[src]

pub fn melt(
    self, 
    id_vars: Vec<String, Global>, 
    value_vars: Vec<String, Global>
) -> LazyFrame

Melt the DataFrame from wide to long format.

[src]

pub fn limit(self, n: usize) -> LazyFrame

Limit the DataFrame to the first n rows. Note: if you don’t want the rows to be scanned, use fetch.

[src]

pub fn map<F>(
    self, 
    function: F, 
    optimizations: Option<OptState>, 
    schema: Option<Schema>
) -> LazyFrame where
    F: DataFrameUdf + 'static,

Apply a function/closure once the logical plan gets executed.

Warning

This can blow up in your face if the schema is changed due to the operation. The optimizer relies on a correct schema.

You can toggle certain optimizations off.

Trait Implementations

[src]

impl Clone for LazyFrame

[src]

pub fn clone(&self) -> LazyFrame

Returns a copy of the value. Read more

1.0.0[src]

fn clone_from(&mut self, source: &Self)

Performs copy-assignment from source. Read more

[src]

impl Default for LazyFrame

[src]

pub fn default() -> LazyFrame

Returns the “default value” for a type. Read more

[src]

impl From<LogicalPlan> for LazyFrame

[src]

pub fn from(plan: LogicalPlan) -> LazyFrame

Performs the conversion.

Auto Trait Implementations

impl !RefUnwindSafe for LazyFrame

impl Send for LazyFrame

impl Sync for LazyFrame

impl Unpin for LazyFrame

impl !UnwindSafe for LazyFrame

Blanket Implementations

[src]

impl<T> Any for T where
    T: 'static + ?Sized,

[src]

pub fn type_id(&self) -> TypeId

Gets the TypeId of self. Read more

[src]

impl<T> Borrow<T> for T where
    T: ?Sized,

[src]

pub fn borrow(&self) -> &T

Immutably borrows from an owned value. Read more

[src]

impl<T> BorrowMut<T> for T where
    T: ?Sized,

[src]

pub fn borrow_mut(&mut self) -> &mut T

Mutably borrows from an owned value. Read more

[src]

impl<T> From<T> for T

[src]

pub fn from(t: T) -> T

Performs the conversion.

[src]

impl<T, U> Into<U> for T where
    U: From<T>,

[src]

pub fn into(self) -> U

Performs the conversion.

impl<T> Pointable for T

pub const ALIGN: usize

The alignment of pointer.

type Init = T

The type for initializers.

pub unsafe fn init(init: <T as Pointable>::Init) -> usize

Initializes a value with the given initializer. Read more

pub unsafe fn deref<'a>(ptr: usize) -> &'a T

Dereferences the given pointer. Read more

pub unsafe fn deref_mut<'a>(ptr: usize) -> &'a mut T

Mutably dereferences the given pointer. Read more

pub unsafe fn drop(ptr: usize)

Drops the object pointed to by the given pointer. Read more

[src]

impl<T> ToOwned for T where
    T: Clone,

type Owned = T

The resulting type after obtaining ownership.

[src]

pub fn to_owned(&self) -> T

Creates owned data from borrowed data, usually by cloning. Read more

[src]

pub fn clone_into(&self, target: &mut T)

🔬 This is a nightly-only experimental API. (toowned_clone_into)

recently added

Uses borrowed data to replace owned data, usually by cloning. Read more

[src]

impl<T, U> TryFrom<U> for T where
    U: Into<T>,

type Error = Infallible

The type returned in the event of a conversion error.

[src]

pub fn try_from(value: U) -> Result<T, <T as TryFrom<U>>::Error>

Performs the conversion.

[src]

impl<T, U> TryInto<U> for T where
    U: TryFrom<T>,

type Error = <U as TryFrom<T>>::Error

The type returned in the event of a conversion error.

[src]

pub fn try_into(self) -> Result<U, <U as TryFrom<T>>::Error>

Performs the conversion.

impl<V, T> VZip<V> for T where
    V: MultiLane<T>,

pub fn vzip(self) -> V