Struct iceberg_rust::spec::manifest::DataFile
pub struct DataFile {
pub content: Content,
pub file_path: String,
pub file_format: FileFormat,
pub partition: Struct,
pub record_count: i64,
pub file_size_in_bytes: i64,
pub column_sizes: Option<AvroMap<i64>>,
pub value_counts: Option<AvroMap<i64>>,
pub null_value_counts: Option<AvroMap<i64>>,
pub nan_value_counts: Option<AvroMap<i64>>,
pub distinct_counts: Option<AvroMap<i64>>,
pub lower_bounds: Option<HashMap<i32, Value>>,
pub upper_bounds: Option<HashMap<i32, Value>>,
pub key_metadata: Option<ByteBuf>,
pub split_offsets: Option<Vec<i64>>,
pub equality_ids: Option<Vec<i32>>,
pub sort_order_id: Option<i32>,
}
Expand description
DataFile found in Manifest.
Fields
content: Content
Type of content in data file.
file_path: String
Full URI for the file, including the FS scheme.
file_format: FileFormat
String file format name: avro, orc, or parquet
partition: Struct
Partition data tuple; its schema is based on the partition spec output, using partition field ids for the struct field ids
record_count: i64
Number of records in this file
file_size_in_bytes: i64
Total file size in bytes
column_sizes: Option<AvroMap<i64>>
Map from column id to total size on disk
value_counts: Option<AvroMap<i64>>
Map from column id to number of values in the column (including null and NaN values)
null_value_counts: Option<AvroMap<i64>>
Map from column id to number of null values
nan_value_counts: Option<AvroMap<i64>>
Map from column id to number of NaN values
distinct_counts: Option<AvroMap<i64>>
Map from column id to number of distinct values in the column.
lower_bounds: Option<HashMap<i32, Value>>
Map from column id to lower bound in the column
upper_bounds: Option<HashMap<i32, Value>>
Map from column id to upper bound in the column
key_metadata: Option<ByteBuf>
Implementation specific key metadata for encryption
split_offsets: Option<Vec<i64>>
Split offsets for the data file.
equality_ids: Option<Vec<i32>>
Field ids used to determine row equality in equality delete files.
sort_order_id: Option<i32>
ID representing sort order for this file