Struct ProjectionExprs

Source

pub struct ProjectionExprs { /* private fields */ }

Expand description

A collection of ProjectionExpr instances, representing a complete projection operation.

Projection operations are used in query plans to select specific columns or compute new columns based on existing ones.

See ProjectionExprs::from_indices to select a subset of columns by indices.

Implementations§

Source §

impl ProjectionExprs

Source

pub fn new(exprs: I) -> Self
where I: IntoIterator<Item = ProjectionExpr>,

Source

pub fn from_indices(indices: &[usize], schema: &Schema) -> Self

Creates a ProjectionExpr from a list of column indices.

This is a convenience method for creating simple column-only projections, where each projection expression is a reference to a column in the input schema.

§Behavior

Ordering: the output projection preserves the exact order of indices provided in the input slice For example, [2, 0, 1] will produce projections for columns 2, 0, then 1 in that order
Duplicates: Duplicate indices are allowed and will create multiple projection expressions referencing the same source column For example, [0, 0] creates 2 separate projections both referencing column 0

§Panics

Panics if any index in indices is out of bounds for the provided schema.

§Example

use arrow::datatypes::{DataType, Field, Schema};
use datafusion_physical_expr::projection::ProjectionExprs;
use std::sync::Arc;

// Create a schema with three columns
let schema = Arc::new(Schema::new(vec![
    Field::new("a", DataType::Int32, false),
    Field::new("b", DataType::Utf8, false),
    Field::new("c", DataType::Float64, false),
]));

// Project columns at indices 2 and 0 (c and a) - ordering is preserved
let projection = ProjectionExprs::from_indices(&[2, 0], &schema);

// This creates: SELECT c@2 AS c, a@0 AS a
assert_eq!(projection.as_ref().len(), 2);
assert_eq!(projection.as_ref()[0].alias, "c");
assert_eq!(projection.as_ref()[1].alias, "a");

// Duplicate indices are allowed
let projection_with_dups = ProjectionExprs::from_indices(&[0, 0, 1], &schema);
assert_eq!(projection_with_dups.as_ref().len(), 3);
assert_eq!(projection_with_dups.as_ref()[0].alias, "a");
assert_eq!(projection_with_dups.as_ref()[1].alias, "a"); // duplicate
assert_eq!(projection_with_dups.as_ref()[2].alias, "b");

Source

pub fn iter(&self) -> impl Iterator<Item = &ProjectionExpr>

Returns an iterator over the projection expressions

Source

pub fn projection_mapping( &self, input_schema: &SchemaRef, ) -> Result<ProjectionMapping>

Creates a ProjectionMapping from this projection

Source

pub fn expr_iter(&self) -> impl Iterator<Item = Arc<dyn PhysicalExpr>> + '_

Iterate over a clone of the projection expressions.

Source

pub fn try_map_exprs<F>(self, f: F) -> Result<Self>
where F: FnMut(Arc<dyn PhysicalExpr>) -> Result<Arc<dyn PhysicalExpr>>,

Apply a fallible transformation to the PhysicalExpr of each projection.

This method transforms the expression in each ProjectionExpr while preserving the alias. This is useful for rewriting expressions, such as when adapting expressions to a different schema.

§Example

use std::sync::Arc;
use arrow::datatypes::{DataType, Field, Schema};
use datafusion_common::Result;
use datafusion_physical_expr::expressions::Column;
use datafusion_physical_expr::projection::ProjectionExprs;
use datafusion_physical_expr::PhysicalExpr;

// Create a schema and projection
let schema = Arc::new(Schema::new(vec![
    Field::new("a", DataType::Int32, false),
    Field::new("b", DataType::Int32, false),
]));
let projection = ProjectionExprs::from_indices(&[0, 1], &schema);

// Transform each expression (this example just clones them)
let transformed = projection.try_map_exprs(|expr| Ok(expr))?;
assert_eq!(transformed.as_ref().len(), 2);

Source

pub fn try_merge(&self, other: &ProjectionExprs) -> Result<ProjectionExprs>

Apply another projection on top of this projection, returning the combined projection. For example, if this projection is SELECT c@2 AS x, b@1 AS y, a@0 as z and the other projection is SELECT x@0 + 1 AS c1, y@1 + z@2 as c2, we return a projection equivalent to SELECT c@2 + 1 AS c1, b@1 + a@0 as c2.

§Example

use datafusion_common::{Result, ScalarValue};
use datafusion_expr::Operator;
use datafusion_physical_expr::expressions::{BinaryExpr, Column, Literal};
use datafusion_physical_expr::projection::{ProjectionExpr, ProjectionExprs};
use std::sync::Arc;

fn main() -> Result<()> {
    // Example from the docstring:
    // Base projection: SELECT c@2 AS x, b@1 AS y, a@0 AS z
    let base = ProjectionExprs::new(vec![
        ProjectionExpr {
            expr: Arc::new(Column::new("c", 2)),
            alias: "x".to_string(),
        },
        ProjectionExpr {
            expr: Arc::new(Column::new("b", 1)),
            alias: "y".to_string(),
        },
        ProjectionExpr {
            expr: Arc::new(Column::new("a", 0)),
            alias: "z".to_string(),
        },
    ]);

    // Top projection: SELECT x@0 + 1 AS c1, y@1 + z@2 AS c2
    let top = ProjectionExprs::new(vec![
        ProjectionExpr {
            expr: Arc::new(BinaryExpr::new(
                Arc::new(Column::new("x", 0)),
                Operator::Plus,
                Arc::new(Literal::new(ScalarValue::Int32(Some(1)))),
            )),
            alias: "c1".to_string(),
        },
        ProjectionExpr {
            expr: Arc::new(BinaryExpr::new(
                Arc::new(Column::new("y", 1)),
                Operator::Plus,
                Arc::new(Column::new("z", 2)),
            )),
            alias: "c2".to_string(),
        },
    ]);

    // Expected result: SELECT c@2 + 1 AS c1, b@1 + a@0 AS c2
    let result = base.try_merge(&top)?;

    assert_eq!(result.as_ref().len(), 2);
    assert_eq!(result.as_ref()[0].alias, "c1");
    assert_eq!(result.as_ref()[1].alias, "c2");

    Ok(())
}

§Errors

This function returns an error if any expression in the other projection cannot be applied on top of this projection.

Source

pub fn column_indices(&self) -> Vec<usize>

Extract the column indices used in this projection. For example, for a projection SELECT a AS x, b + 1 AS y, where a is at index 0 and b is at index 1, this function would return [0, 1]. Repeated indices are returned only once, and the order is ascending.

Source

pub fn ordered_column_indices(&self) -> Vec<usize>

👎Deprecated since 52.0.0: Use column_indices() instead. This method will be removed in 58.0.0 or 6 months after 52.0.0 is released, whichever comes first.

Extract the ordered column indices for a column-only projection.

This function assumes that all expressions in the projection are simple column references. It returns the column indices in the order they appear in the projection.

§Panics

Panics if any expression in the projection is not a simple column reference. This includes:

Computed expressions (e.g., a + 1, CAST(a AS INT))
Function calls (e.g., UPPER(name), SUM(amount))
Literals (e.g., 42, 'hello')
Complex nested expressions (e.g., CASE WHEN ... THEN ... END)

§Returns

A vector of column indices in projection order. Unlike column_indices(), this function:

Preserves the projection order (does not sort)
Preserves duplicates (does not deduplicate)

§Example

For a projection SELECT c, a, c where a is at index 0 and c is at index 2, this function would return [2, 0, 2].

Use column_indices() instead if the projection may contain non-column expressions or if you need a deduplicated sorted list.

§Panics

Panics if any expression in the projection is not a simple column reference.

Source

pub fn project_schema(&self, input_schema: &Schema) -> Result<Schema>

Project a schema according to this projection. For example, for a projection SELECT a AS x, b + 1 AS y, where a is at index 0 and b is at index 1, if the input schema is [a: Int32, b: Int32, c: Int32], the output schema would be [x: Int32, y: Int32]. Fields’ metadata are preserved from the input schema.

Source

pub fn make_projector(&self, input_schema: &Schema) -> Result<Projector>

Create a new Projector from this projection and an input schema.

A Projector can be used to apply this projection to record batches.

§Errors

This function returns an error if the output schema cannot be constructed from the input schema with the given projection expressions. For example, if an expression only works with integer columns but the input schema has a string column at that index.

Source

pub fn create_expression_metrics( &self, metrics: &ExecutionPlanMetricsSet, partition: usize, ) -> ExpressionEvaluatorMetrics

Source

pub fn project_statistics( &self, stats: Statistics, output_schema: &Schema, ) -> Result<Statistics>

Project statistics according to this projection. For example, for a projection SELECT a AS x, b + 1 AS y, where a is at index 0 and b is at index 1, if the input statistics has column statistics for columns a, b, and c, the output statistics would have column statistics for columns x and y.

§Example

use arrow::datatypes::{DataType, Field, Schema};
use datafusion_common::stats::{ColumnStatistics, Precision, Statistics};
use datafusion_physical_expr::projection::ProjectionExprs;
use datafusion_common::Result;
use datafusion_common::ScalarValue;
use std::sync::Arc;

fn main() -> Result<()> {
    // Input schema: a: Int32, b: Int32, c: Int32
    let input_schema = Arc::new(Schema::new(vec![
        Field::new("a", DataType::Int32, false),
        Field::new("b", DataType::Int32, false),
        Field::new("c", DataType::Int32, false),
    ]));

    // Input statistics with column stats for a, b, c
    let input_stats = Statistics {
        num_rows: Precision::Exact(100),
        total_byte_size: Precision::Exact(1200),
        column_statistics: vec![
            // Column a stats
            ColumnStatistics::new_unknown()
                .with_null_count(Precision::Exact(0))
                .with_min_value(Precision::Exact(ScalarValue::Int32(Some(0))))
                .with_max_value(Precision::Exact(ScalarValue::Int32(Some(100))))
                .with_distinct_count(Precision::Exact(100)),
            // Column b stats
            ColumnStatistics::new_unknown()
                .with_null_count(Precision::Exact(0))
                .with_min_value(Precision::Exact(ScalarValue::Int32(Some(10))))
                .with_max_value(Precision::Exact(ScalarValue::Int32(Some(60))))
                .with_distinct_count(Precision::Exact(50)),
            // Column c stats
            ColumnStatistics::new_unknown()
                .with_null_count(Precision::Exact(5))
                .with_min_value(Precision::Exact(ScalarValue::Int32(Some(-10))))
                .with_max_value(Precision::Exact(ScalarValue::Int32(Some(200))))
                .with_distinct_count(Precision::Exact(25)),
        ],
    };

    // Create a projection that selects columns c and a (indices 2 and 0)
    let projection = ProjectionExprs::from_indices(&[2, 0], &input_schema);

    // Compute output schema
    let output_schema = projection.project_schema(&input_schema)?;

    // Project the statistics
    let output_stats = projection.project_statistics(input_stats, &output_schema)?;

    // The output should have 2 column statistics (for c and a, in that order)
    assert_eq!(output_stats.column_statistics.len(), 2);

    // First column in output is c (was at index 2)
    assert_eq!(
        output_stats.column_statistics[0].min_value,
        Precision::Exact(ScalarValue::Int32(Some(-10)))
    );
    assert_eq!(
        output_stats.column_statistics[0].null_count,
        Precision::Exact(5)
    );

    // Second column in output is a (was at index 0)
    assert_eq!(
        output_stats.column_statistics[1].min_value,
        Precision::Exact(ScalarValue::Int32(Some(0)))
    );
    assert_eq!(
        output_stats.column_statistics[1].distinct_count,
        Precision::Exact(100)
    );

    // Total byte size is recalculated based on projected columns
    assert_eq!(
        output_stats.total_byte_size,
        Precision::Exact(800), // each Int32 column is 4 bytes * 100 rows * 2 columns
    );

    // Number of rows remains the same
    assert_eq!(output_stats.num_rows, Precision::Exact(100));

    Ok(())
}

Trait Implementations§

Source §

impl AsRef<[ProjectionExpr]> for ProjectionExprs

Source §

fn as_ref(&self) -> &[ProjectionExpr]

Converts this type into a shared reference of the (usually inferred) input type.

Source §

impl Clone for ProjectionExprs

Source §

fn clone(&self) -> ProjectionExprs

Returns a duplicate of the value. Read more

1.0.0 · Source§

fn clone_from(&mut self, source: &Self)

Performs copy-assignment from source. Read more

Source §

impl Debug for ProjectionExprs

Source §

fn fmt(&self, f: &mut Formatter<'_>) -> Result

Formats the value using the given formatter. Read more

Source §

impl Display for ProjectionExprs

Source §

fn fmt(&self, f: &mut Formatter<'_>) -> Result

Formats the value using the given formatter. Read more

Source §

impl From<&[ProjectionExpr]> for ProjectionExprs

Source §

fn from(value: &[ProjectionExpr]) -> Self

Converts to this type from the input type.

Source §

impl From<Vec<ProjectionExpr>> for ProjectionExprs

Source §

fn from(value: Vec<ProjectionExpr>) -> Self

Converts to this type from the input type.

Source §

impl FromIterator<ProjectionExpr> for ProjectionExprs

Source §

fn from_iter<T: IntoIterator<Item = ProjectionExpr>>(exprs: T) -> Self

Creates a value from an iterator. Read more

Source §

impl<'a> IntoIterator for &'a ProjectionExprs

Source §

type Item = &'a ProjectionExpr

The type of the elements being iterated over.

Source §

type IntoIter = Iter<'a, ProjectionExpr>

Which kind of iterator are we turning this into?

Source §

fn into_iter(self) -> Self::IntoIter

Creates an iterator from a value. Read more

Source §

impl IntoIterator for ProjectionExprs

Source §

type Item = ProjectionExpr

The type of the elements being iterated over.

Source §

type IntoIter = IntoIter<ProjectionExpr>

Which kind of iterator are we turning this into?

Source §

fn into_iter(self) -> Self::IntoIter

Creates an iterator from a value. Read more

Source §

impl PartialEq for ProjectionExprs

Source §

fn eq(&self, other: &ProjectionExprs) -> bool

Tests for self and other values to be equal, and is used by ==.

1.0.0 · Source§

fn ne(&self, other: &Rhs) -> bool

Tests for !=. The default implementation is almost always sufficient, and should not be overridden without very good reason.

Source §

impl Eq for ProjectionExprs

Source §

impl StructuralPartialEq for ProjectionExprs

Auto Trait Implementations§

§

impl !UnwindSafe for ProjectionExprs

Blanket Implementations§

Source §

impl<T> Any for T
where T: 'static + ?Sized,

Source §

fn type_id(&self) -> TypeId

Gets the TypeId of self. Read more

Source §

impl<T> Borrow<T> for T
where T: ?Sized,

Source §

fn borrow(&self) -> &T

Immutably borrows from an owned value. Read more

Source §

impl<T> BorrowMut<T> for T
where T: ?Sized,

Source §

fn borrow_mut(&mut self) -> &mut T

Mutably borrows from an owned value. Read more

Source §

impl<T> CloneToUninit for T
where T: Clone,

Source §

unsafe fn clone_to_uninit(&self, dest: *mut u8)

🔬This is a nightly-only experimental API. (clone_to_uninit)

Performs copy-assignment from self to dest. Read more

Source §

impl<T> DynEq for T
where T: Eq + Any,

Source §

fn dyn_eq(&self, other: &(dyn Any + 'static)) -> bool

Source §

impl<Q, K> Equivalent<K> for Q
where Q: Eq + ?Sized, K: Borrow<Q> + ?Sized,

Source §

fn equivalent(&self, key: &K) -> bool

Compare self to key and return true if they are equal.

Source §

impl<Q, K> Equivalent<K> for Q
where Q: Eq + ?Sized, K: Borrow<Q> + ?Sized,

Source §

fn equivalent(&self, key: &K) -> bool

Checks if this value is equivalent to the given key. Read more

Source §

impl<T> From<T> for T

Source §

fn from(t: T) -> T

Returns the argument unchanged.

Source §

impl<T, U> Into for T
where U: From<T>,

Source §

fn into(self) -> U

Calls U::from(self).

That is, this conversion is whatever the implementation of From<T> for U chooses to do.

Source §

impl<T> IntoEither for T

Source §

fn into_either(self, into_left: bool) -> Either<Self, Self>

Converts self into a Left variant of Either<Self, Self> if into_left is true. Converts self into a Right variant of Either<Self, Self> otherwise. Read more

Source §

fn into_either_with<F>(self, into_left: F) -> Either<Self, Self>
where F: FnOnce(&Self) -> bool,

Converts self into a Left variant of Either<Self, Self> if into_left(&self) returns true. Converts self into a Right variant of Either<Self, Self> otherwise. Read more

Source §

impl<T> ToOwned for T
where T: Clone,

Source §

type Owned = T

The resulting type after obtaining ownership.

Source §

fn to_owned(&self) -> T

Creates owned data from borrowed data, usually by cloning. Read more

Source §

fn clone_into(&self, target: &mut T)

Uses borrowed data to replace owned data, usually by cloning. Read more

Source §

impl<T> ToString for T
where T: Display + ?Sized,

Source §

fn to_string(&self) -> String

Converts the given value to a String. Read more

Source §

impl<T, U> TryFrom for T
where U: Into<T>,

Source §

type Error = Infallible

The type returned in the event of a conversion error.

Source §

fn try_from(value: U) -> Result<T, <T as TryFrom>::Error>

Performs the conversion.

Source §

impl<T, U> TryInto for T
where U: TryFrom<T>,

Source §

type Error = >::Error

The type returned in the event of a conversion error.

Source §

fn try_into(self) -> Result<U, >::Error>

Performs the conversion.

ProjectionExprs

Struct ProjectionExprs Copy item path

Implementations§

impl ProjectionExprs

pub fn new<I>(exprs: I) -> Selfwhere I: IntoIterator<Item = ProjectionExpr>,

pub fn from_indices(indices: &[usize], schema: &Schema) -> Self

§Behavior

§Panics

§Example

pub fn iter(&self) -> impl Iterator<Item = &ProjectionExpr>

pub fn projection_mapping( &self, input_schema: &SchemaRef, ) -> Result<ProjectionMapping>

pub fn expr_iter(&self) -> impl Iterator<Item = Arc<dyn PhysicalExpr>> + '_

pub fn try_map_exprs<F>(self, f: F) -> Result<Self>where F: FnMut(Arc<dyn PhysicalExpr>) -> Result<Arc<dyn PhysicalExpr>>,

§Example

pub fn try_merge(&self, other: &ProjectionExprs) -> Result<ProjectionExprs>

§Example

§Errors

pub fn column_indices(&self) -> Vec<usize>

pub fn ordered_column_indices(&self) -> Vec<usize>

§Panics

§Returns

§Example

§Panics

pub fn project_schema(&self, input_schema: &Schema) -> Result<Schema>

pub fn make_projector(&self, input_schema: &Schema) -> Result<Projector>

§Errors

pub fn create_expression_metrics( &self, metrics: &ExecutionPlanMetricsSet, partition: usize, ) -> ExpressionEvaluatorMetrics

pub fn project_statistics( &self, stats: Statistics, output_schema: &Schema, ) -> Result<Statistics>

§Example

Trait Implementations§

impl AsRef<[ProjectionExpr]> for ProjectionExprs

fn as_ref(&self) -> &[ProjectionExpr]

impl Clone for ProjectionExprs

fn clone(&self) -> ProjectionExprs

fn clone_from(&mut self, source: &Self)

impl Debug for ProjectionExprs

fn fmt(&self, f: &mut Formatter<'_>) -> Result

impl Display for ProjectionExprs

fn fmt(&self, f: &mut Formatter<'_>) -> Result

impl From<&[ProjectionExpr]> for ProjectionExprs

fn from(value: &[ProjectionExpr]) -> Self

impl From<Vec<ProjectionExpr>> for ProjectionExprs

fn from(value: Vec<ProjectionExpr>) -> Self

impl FromIterator<ProjectionExpr> for ProjectionExprs

fn from_iter<T: IntoIterator<Item = ProjectionExpr>>(exprs: T) -> Self

impl<'a> IntoIterator for &'a ProjectionExprs

type Item = &'a ProjectionExpr

type IntoIter = Iter<'a, ProjectionExpr>

fn into_iter(self) -> Self::IntoIter

impl IntoIterator for ProjectionExprs

type Item = ProjectionExpr

type IntoIter = IntoIter<ProjectionExpr>

fn into_iter(self) -> Self::IntoIter

impl PartialEq for ProjectionExprs

fn eq(&self, other: &ProjectionExprs) -> bool

fn ne(&self, other: &Rhs) -> bool

impl Eq for ProjectionExprs

impl StructuralPartialEq for ProjectionExprs

Auto Trait Implementations§

impl Freeze for ProjectionExprs

impl !RefUnwindSafe for ProjectionExprs

impl Send for ProjectionExprs

impl Sync for ProjectionExprs

impl Unpin for ProjectionExprs

impl !UnwindSafe for ProjectionExprs

Blanket Implementations§

impl<T> Any for Twhere T: 'static + ?Sized,

fn type_id(&self) -> TypeId

impl<T> Borrow<T> for Twhere T: ?Sized,

fn borrow(&self) -> &T

impl<T> BorrowMut<T> for Twhere T: ?Sized,

fn borrow_mut(&mut self) -> &mut T

impl<T> CloneToUninit for Twhere T: Clone,

unsafe fn clone_to_uninit(&self, dest: *mut u8)

impl<T> DynEq for Twhere T: Eq + Any,

fn dyn_eq(&self, other: &(dyn Any + 'static)) -> bool

impl<Q, K> Equivalent<K> for Qwhere Q: Eq + ?Sized, K: Borrow<Q> + ?Sized,

fn equivalent(&self, key: &K) -> bool

impl<Q, K> Equivalent<K> for Qwhere Q: Eq + ?Sized, K: Borrow<Q> + ?Sized,

fn equivalent(&self, key: &K) -> bool

Struct ProjectionExprs

pub fn new<I>(exprs: I) -> Self
where I: IntoIterator<Item = ProjectionExpr>,

pub fn try_map_exprs<F>(self, f: F) -> Result<Self>
where F: FnMut(Arc<dyn PhysicalExpr>) -> Result<Arc<dyn PhysicalExpr>>,

impl<T> Any for T
where T: 'static + ?Sized,

impl<T> Borrow<T> for T
where T: ?Sized,

impl<T> BorrowMut<T> for T
where T: ?Sized,

impl<T> CloneToUninit for T
where T: Clone,

impl<T> DynEq for T
where T: Eq + Any,

impl<Q, K> Equivalent<K> for Q
where Q: Eq + ?Sized, K: Borrow<Q> + ?Sized,

impl<Q, K> Equivalent<K> for Q
where Q: Eq + ?Sized, K: Borrow<Q> + ?Sized,

impl<T, U> Into<U> for T
where U: From<T>,

fn into_either_with<F>(self, into_left: F) -> Either<Self, Self>
where F: FnOnce(&Self) -> bool,

impl<T> ToOwned for T
where T: Clone,

impl<T> ToString for T
where T: Display + ?Sized,

impl<T, U> TryFrom<U> for T
where U: Into<T>,

impl<T, U> TryInto<U> for T
where U: TryFrom<T>,