Struct datafusion::datasource::listing::ListingOptions

source ·

pub struct ListingOptions {
    pub file_extension: String,
    pub format: Arc<dyn FileFormat>,
    pub table_partition_cols: Vec<(String, DataType)>,
    pub collect_stat: bool,
    pub target_partitions: usize,
    pub file_sort_order: Vec<Vec<Expr>>,
}

Expand description

Options for creating a ListingTable

Fields§

§file_extension: String

A suffix on which files should be filtered (leave empty to keep all files on the path)

§format: Arc<dyn FileFormat>

The file format

§table_partition_cols: Vec<(String, DataType)>

The expected partition column names in the folder structure. See Self::with_table_partition_cols for details

§collect_stat: bool

Set true to try to guess statistics from the files. This can add a lot of overhead as it will usually require files to be opened and at least partially parsed.

§target_partitions: usize

Group files so that the number of partitions does not exceed this limit

§file_sort_order: Vec<Vec<Expr>>

Optional pre-known sort order(s). Must be SortExprs.

DataFusion may take advantage of this ordering to omit sorts or use more efficient algorithms. Currently sortedness must be provided if it is known by some external mechanism, but may in the future be automatically determined, for example using parquet metadata.

See https://github.com/apache/datafusion/issues/4177

NOTE: This attribute stores all equivalent orderings (the outer Vec) where each ordering consists of an individual lexicographic ordering (encapsulated by a Vec<Expr>). If there aren’t multiple equivalent orderings, the outer Vec will have a single element.

Struct datafusion::datasource::listing::ListingOptions

Fields§

Implementations§

impl ListingOptions

pub fn new(format: Arc<dyn FileFormat>) -> Self

pub fn with_file_extension(self, file_extension: impl Into<String>) -> Self

pub fn with_table_partition_cols( self, table_partition_cols: Vec<(String, DataType)> ) -> Self

§Notes

§Example

pub fn with_collect_stat(self, collect_stat: bool) -> Self

pub fn with_target_partitions(self, target_partitions: usize) -> Self

pub fn with_file_sort_order(self, file_sort_order: Vec<Vec<Expr>>) -> Self

pub async fn infer_schema<'a>( &'a self, state: &SessionState, table_path: &'a ListingTableUrl ) -> Result<SchemaRef>

pub async fn validate_partitions( &self, state: &SessionState, table_path: &ListingTableUrl ) -> Result<()>

Trait Implementations§

impl Clone for ListingOptions

fn clone(&self) -> ListingOptions

fn clone_from(&mut self, source: &Self)

impl Debug for ListingOptions

fn fmt(&self, f: &mut Formatter<'_>) -> Result

Auto Trait Implementations§

impl Freeze for ListingOptions

impl !RefUnwindSafe for ListingOptions

impl Send for ListingOptions

impl Sync for ListingOptions

impl Unpin for ListingOptions

impl !UnwindSafe for ListingOptions

Blanket Implementations§

impl<T> Any for T where T: 'static + ?Sized,

fn type_id(&self) -> TypeId

impl<T> Borrow<T> for T where T: ?Sized,

fn borrow(&self) -> &T

impl<T> BorrowMut<T> for T where T: ?Sized,

fn borrow_mut(&mut self) -> &mut T

impl<T> From<T> for T

fn from(t: T) -> T

impl<T, U> Into<U> for T where U: From<T>,

fn into(self) -> U

impl<T> IntoEither for T

fn into_either(self, into_left: bool) -> Either<Self, Self>

fn into_either_with<F>(self, into_left: F) -> Either<Self, Self> where F: FnOnce(&Self) -> bool,

impl<T> Same for T

type Output = T

impl<T> ToOwned for T where T: Clone,

type Owned = T

fn to_owned(&self) -> T

fn clone_into(&self, target: &mut T)

impl<T, U> TryFrom<U> for T where U: Into<T>,

type Error = Infallible

fn try_from(value: U) -> Result<T, <T as TryFrom<U>>::Error>

impl<T, U> TryInto<U> for T where U: TryFrom<T>,

type Error = <U as TryFrom<T>>::Error

fn try_into(self) -> Result<U, <U as TryFrom<T>>::Error>

impl<V, T> VZip<V> for T where V: MultiLane<T>,

fn vzip(self) -> V

Struct datafusion::datasource::listing::ListingOptions

impl<T> Any for T
where T: 'static + ?Sized,

impl<T> Borrow<T> for T
where T: ?Sized,

impl<T> BorrowMut<T> for T
where T: ?Sized,

impl<T, U> Into<U> for T
where U: From<T>,

fn into_either_with<F>(self, into_left: F) -> Either<Self, Self>
where F: FnOnce(&Self) -> bool,

impl<T> ToOwned for T
where T: Clone,

impl<T, U> TryFrom<U> for T
where U: Into<T>,

impl<T, U> TryInto<U> for T
where U: TryFrom<T>,

impl<V, T> VZip<V> for T
where V: MultiLane<T>,