# Package metadata for the `decruft` crate.
[package]
name = "decruft"
version = "0.1.1"
# Target auto-discovery is disabled across the board; the library, binary,
# test and bench targets are each declared explicitly later in this manifest.
autobenches = false
autobins = false
autoexamples = false
autolib = false
autotests = false
# Disables build-script detection, so no `build.rs` is run for this package.
build = false
categories = ["command-line-utilities", "parser-implementations", "web-programming"]
documentation = "https://docs.rs/decruft"
edition = "2024"
homepage = "https://github.com/jamtur01/decruft"
keywords = ["html", "content-extraction", "readability", "scraping", "web"]
license = "MIT"
readme = "README.md"
repository = "https://github.com/jamtur01/decruft"
description = "Extract clean, readable content from web pages"
# docs.rs build settings: document the crate with all features enabled and
# pass `--cfg docsrs` to rustdoc.
[package.metadata.docs.rs]
all-features = true
rustdoc-args = ["--cfg", "docsrs"]
# Library target. Declared explicitly because `autolib = false` in [package]
# turns off automatic discovery of `src/lib.rs`.
[lib]
name = "decruft"
path = "src/lib.rs"
# Binary target, named the same as the library. Declared explicitly because
# `autobins = false` in [package] turns off discovery of `src/main.rs`.
[[bin]]
name = "decruft"
path = "src/main.rs"
# Integration-test targets, one `[[test]]` entry per file under `tests/`.
# Each must be listed here because `autotests = false` in [package] disables
# automatic discovery, so a new test file is ignored until it gets an entry.
[[test]]
name = "cli"
path = "tests/cli.rs"
[[test]]
name = "defuddle_behavior"
path = "tests/defuddle_behavior.rs"
[[test]]
name = "defuddle_fixtures"
path = "tests/defuddle_fixtures.rs"
[[test]]
name = "integration"
path = "tests/integration.rs"
[[test]]
name = "output_formats"
path = "tests/output_formats.rs"
# Benchmark target, declared explicitly because `autobenches = false`.
[[bench]]
name = "extraction"
path = "benches/extraction.rs"
# Opt out of the default libtest harness, so the bench file must provide its
# own entry point. NOTE(review): presumably Criterion's, since `criterion` is
# the only dev-dependency; confirm against benches/extraction.rs.
harness = false
# Runtime dependencies, sorted alphabetically, one inline table per crate.
[dependencies]
clap = { version = "4.6.0", features = ["derive"] }
ego-tree = { version = "0.11.0" }
fancy-regex = { version = "0.17.0" }
htmd = { version = "0.5.4" }
markup5ever = { version = "0.39.0" }
regex = { version = "1.12.3" }
scraper = { version = "0.26.0" }
serde = { version = "1.0.228", features = ["derive"] }
serde_json = { version = "1.0.149" }
ureq = { version = "3.3.0" }
url = { version = "2.5.8" }
# Dependencies used only by tests and benchmarks.
[dev-dependencies]
criterion = { version = "0.8.2", features = ["html_reports"] }
# Clippy lint levels applied to every target in the package.
[lints.clippy]
# Enable the whole `pedantic` group as warnings. The negative priority ranks
# the group below the individual lints listed after it (default priority 0),
# so each of those entries overrides the group level.
pedantic = { level = "warn", priority = -1 }
# Hard errors.
allow_attributes = "deny"
dbg_macro = "deny"
panic = "deny"
print_stderr = "deny"
print_stdout = "deny"
todo = "deny"
unwrap_used = "deny"
# Explicitly permitted.
module_name_repetitions = "allow"
similar_names = "allow"