# Package metadata for the `qrawl` crate.
[package]
name = "qrawl"
version = "0.6.0"
# Automatic target discovery is switched off for every target kind; the
# library and binary targets are declared explicitly in this manifest.
autobenches = false
autobins = false
autoexamples = false
autolib = false
autotests = false
# No build script is used.
build = false
categories = [
    "web-programming::http-client",
    "parsing",
    "asynchronous",
    "command-line-utilities",
]
documentation = "https://docs.rs/qrawl"
edition = "2021"
homepage = "https://github.com/QLangstaff/qrawl"
# Only the files matched here are shipped in the published package.
include = [
    "Cargo.toml",
    "README.md",
    "LICENSE*",
    "src/**",
]
keywords = [
    "crawler",
    "web-crawling",
    "scraper",
    "web-scraping",
    "rag",
]
license = "MIT"
readme = "README.md"
repository = "https://github.com/QLangstaff/qrawl"
# Minimum supported Rust toolchain.
rust-version = "1.74"
description = "Rust toolkit to crawl web data for AI agents"
# Library target, declared explicitly because `autolib` is disabled.
[lib]
path = "src/lib.rs"
name = "qrawl"
# Command-line binary target, declared explicitly because `autobins` is disabled.
[[bin]]
path = "src/bin/qrawl.rs"
name = "qrawl"
# Runtime dependencies. Version strings are ordinary Cargo requirements
# (implicit caret). Single-key specs use the string shorthand; short
# multi-key specs use inline tables.
[dependencies]
async-trait = "0.1"
clap = { version = "4.5", features = ["derive"] }
dashmap = "6.0"
futures-util = "0.3"
html-escape = "0.2"
# NOTE(review): idna releases before 1.0 appear to be covered by a RustSec
# advisory (RUSTSEC-2024-0421) — confirm and consider upgrading.
idna = "0.5"
once_cell = "1.19"
regex = "1.10"
scraper = "0.19"
serde = { version = "1.0", features = ["derive"] }
serde_json = "1.0"
unicode-normalization = "0.1"
url = "2"
urlencoding = "2.1"

# Dependencies with long feature lists get their own sub-tables, because a
# TOML 1.0 inline table has to fit on a single line.
[dependencies.reqwest]
version = "0.11"
features = [
    "blocking",
    "cookies",
    "brotli",
    "gzip",
    "deflate",
    "json",
    "native-tls",
    "stream",
]

[dependencies.tokio]
version = "1.0"
features = [
    "rt",
    "rt-multi-thread",
    "macros",
    "time",
    "sync",
]