[package]
edition = "2024"
rust-version = "1.85"
name = "rust-data-processing"
version = "0.1.5"
build = false
exclude = [
"Planning/",
"python-wrapper/",
"docs/python/",
"docs/landing/",
"README.md",
"test_run.log",
".github/",
"scripts/",
]
autolib = false
autobins = false
autoexamples = false
autotests = false
autobenches = false
description = "Schema-first ingestion (CSV, JSON, Parquet, Excel) into an in-memory DataSet, plus Polars-backed pipelines, SQL, profiling, validation, and map/reduce-style processing."
documentation = "https://docs.rs/rust-data-processing"
readme = "README_CRATE.md"
keywords = [
"csv",
"json",
"parquet",
"dataset",
"etl",
]
categories = [
"database-implementations",
"parser-implementations",
]
license = "MIT OR Apache-2.0"
repository = "https://github.com/vihangdesai2018-png/rust-data-processing"
[features]
arrow = ["dep:arrow"]
ci_expanded = [
"deep_tests",
"excel_test_writer",
"arrow",
"serde_arrow",
]
db_connectorx = [
"arrow",
"dep:connectorx",
"connectorx/src_postgres",
"connectorx/src_mysql",
"connectorx/src_mssql",
"connectorx/src_oracle",
]
deep_tests = []
default = ["sql"]
excel = ["dep:calamine"]
excel_test_writer = [
"excel",
"dep:rust_xlsxwriter",
]
serde_arrow = [
"arrow",
"dep:serde_arrow",
]
sql = ["dep:polars-sql"]
[lib]
name = "rust_data_processing"
path = "src/lib.rs"
[[bin]]
name = "rust-data-processing"
path = "src/main.rs"
[[test]]
name = "csv_ingestion"
path = "tests/csv_ingestion.rs"
[[test]]
name = "deep_tests"
path = "tests/deep_tests.rs"
[[test]]
name = "excel_ingestion"
path = "tests/excel_ingestion.rs"
[[test]]
name = "ingestion_observability"
path = "tests/ingestion_observability.rs"
[[test]]
name = "json_ingestion"
path = "tests/json_ingestion.rs"
[[test]]
name = "mapping_spec"
path = "tests/mapping_spec.rs"
[[test]]
name = "parquet_ingestion"
path = "tests/parquet_ingestion.rs"
[[test]]
name = "sql"
path = "tests/sql.rs"
[[test]]
name = "unified_ingestion"
path = "tests/unified_ingestion.rs"
[[bench]]
name = "ingestion"
path = "benches/ingestion.rs"
harness = false
[[bench]]
name = "map_reduce"
path = "benches/map_reduce.rs"
harness = false
[[bench]]
name = "outliers"
path = "benches/outliers.rs"
harness = false
[[bench]]
name = "pipelines"
path = "benches/pipelines.rs"
harness = false
[[bench]]
name = "profiling"
path = "benches/profiling.rs"
harness = false
[[bench]]
name = "validation"
path = "benches/validation.rs"
harness = false
[dependencies.arrow]
version = "54"
optional = true
[dependencies.calamine]
version = "0.33.0"
optional = true
[dependencies.connectorx]
version = "0.4.5"
features = [
"dst_arrow",
"fptr",
]
optional = true
default-features = false
[dependencies.csv]
version = "1.3.1"
[dependencies.parquet]
version = "57"
[dependencies.polars]
version = "0.53.0"
features = [
"lazy",
"csv",
"parquet",
"json",
"fmt",
]
[dependencies.polars-sql]
version = "0.53.0"
optional = true
[dependencies.rayon]
version = "1"
[dependencies.rust_xlsxwriter]
version = "0.93"
optional = true
[dependencies.serde]
version = "1"
features = ["derive"]
[dependencies.serde_arrow]
version = "0.14.0"
features = ["arrow-54"]
optional = true
default-features = false
[dependencies.serde_json]
version = "1.0.139"
[dependencies.thiserror]
version = "2.0.11"
[dev-dependencies.criterion]
version = "0.5"
[profile.test]
debug = 0