# Crate metadata. Automatic target discovery and the build script are all
# disabled here, so targets have to be declared explicitly in this manifest.
[package]
name = "pdf-ocr"
version = "1.0.0-beta.9"
autobenches = false
autobins = false
autoexamples = false
autolib = false
autotests = false
build = false
documentation = "https://pdfluent.com/docs"
edition = "2021"
homepage = "https://pdfluent.com"
# Licensing terms are supplied as a file instead of an SPDX expression.
license-file = "LICENSE"
readme = "README.md"
repository = "https://pdfluent.com/source"
description = "OCR integration for scanned PDFs with pluggable engine support"

# Feature flags. The default set is empty, so every optional dependency is
# strictly opt-in.
[features]
default = []
# Enables the optional dependencies ort, ndarray, image, ureq and dirs-next.
paddle = ["ort", "ndarray", "image", "ureq", "dirs-next"]
# Enables the optional leptess dependency.
tesseract = ["leptess"]

# Library target, declared explicitly because `autolib` is off in [package].
# The crate name uses an underscore where the package name has a hyphen.
[lib]
path = "src/lib.rs"
name = "pdf_ocr"

# Runtime dependencies. Entries with `optional = true` are only built when a
# feature enables them.
[dependencies]
dirs-next = { version = "2", optional = true }
image = { version = "0.25", optional = true }
leptess = { version = "0.14", optional = true }
# Referred to as `lopdf` in this manifest, but resolved from the
# `pdfluent-lopdf` package and pinned to one exact release.
lopdf = { version = "=0.39.4", package = "pdfluent-lopdf" }
ndarray = { version = "0.17", optional = true }
thiserror = "2"
ureq = { version = "3", optional = true }

# Kept as a full table because the spec is too long for a one-line inline
# table. Pinned to an exact pre-release with default features turned off, so
# only the features listed here are active.
[dependencies.ort]
version = "=2.0.0-rc.12"
optional = true
default-features = false
features = ["std", "ndarray", "load-dynamic", "api-24"]

# Dependencies used only when building tests, examples and benchmarks.
[dev-dependencies]
tempfile = "3"