# Runtime dependencies, kept in alphabetical order.
# Each version is a bare SemVer string, which Cargo reads as a caret requirement.
# Every entry uses the table form so keys such as `features` can be added
# later without changing the shape of the entry.
[dependencies]
brotli = { version = "3.4" }
bytes = { version = "1.5" }
chrono = { version = "0.4", features = ["serde"] }
ego-tree = { version = "0.6" }
encoding_rs = { version = "0.8" }
flate2 = { version = "1.0" }
futures = { version = "0.3" }
quick-xml = { version = "0.31" }
rand = { version = "0.8" }
regex = { version = "1.10" }
reqwest = { version = "0.11", features = ["gzip", "brotli", "deflate", "json", "stream", "cookies"] }
scraper = { version = "0.18" }
serde = { version = "1.0", features = ["derive"] }
serde_json = { version = "1.0" }
sha2 = { version = "0.10" }
texting_robots = { version = "0.2" }
thiserror = { version = "1.0" }
tokio = { version = "1.35", features = ["full"] }
tracing = { version = "0.1" }
tracing-subscriber = { version = "0.3", features = ["json", "env-filter"] }
url = { version = "2.5", features = ["serde"] }
uuid = { version = "1.6", features = ["v4"] }
# Dependencies compiled only for tests, examples and benchmarks.
[dev-dependencies]
tempfile = { version = "3.9" }
tokio-test = { version = "0.4" }
wiremock = { version = "0.5" }
[features]
# Nothing is switched on by default.
default = []
# Opt-in flags. Neither one enables another feature or an optional dependency.
browser = []
warc = []
[lib]
# Library target, declared explicitly because `autolib = false` in [package].
path = "src/lib.rs"
name = "halldyll_core"
[package]
# Identity
name = "halldyll-core"
version = "0.1.0"
edition = "2021"
authors = ["Geryan Roy <geryan.roy@icloud.com>"]
license = "MIT"

# Description and README
description = "Core scraping engine for Halldyll - high-performance async web scraper for AI agents"
readme = "README.md"

# Project links
documentation = "https://docs.rs/halldyll-core"
homepage = "https://github.com/Mr-soloDev/halldyll-Scrapper"
repository = "https://github.com/Mr-soloDev/halldyll-Scrapper"

# Discovery metadata
keywords = ["scraper", "crawler", "web", "ai", "async"]
categories = ["web-programming", "parsing"]

# No build script, and all target auto-discovery is switched off.
# The library and test targets are declared explicitly in this manifest.
build = false
autolib = false
autobins = false
autoexamples = false
autotests = false
autobenches = false
# Integration test targets, declared explicitly because `autotests = false`
# in [package]. One [[test]] entry per file.
[[test]]
path = "tests/crawl_tests.rs"
name = "crawl_tests"

[[test]]
path = "tests/parse_tests.rs"
name = "parse_tests"

[[test]]
path = "tests/security_tests.rs"
name = "security_tests"

[[test]]
path = "tests/types_tests.rs"
name = "types_tests"