# Metadata entry describing the `pdftotext` command-line tool.
#
# NOTE(review): every line in this file sits at column 0. As written, the
# bare keys `detect:`, `local:`, `package_json:` and `risk:` hold empty
# (null) values, and the keys that follow them are top-level siblings rather
# than children. If nesting was intended, the indentation must be restored;
# confirm the expected structure against the consumer's schema.
name: pdftotext
# Presumably the executable name to invoke; TODO confirm with the consumer.
binary: pdftotext
# No alternative names are listed.
aliases: []
# Classification tags for this entry.
category:
- docs
- text
- file-viewer
# Presumably the languages this entry applies to; `all` looks like a
# wildcard value. TODO confirm.
lang:
- all
platform:
- local
# One-line human-readable description of the tool.
summary: Poppler CLI for extracting text from PDF files.
# Project home page.
homepage: https://poppler.freedesktop.org/
# Link to the pdftotext(1) manual page.
docs: https://www.mankier.com/1/pdftotext
# NOTE(review): empty value (null) as written; the following keys look like
# they were meant to be nested under it. TODO confirm.
detect:
# Single-item list holding the string `-v` (the first `-` is the sequence
# indicator). Presumably the arguments used to query the tool's version.
version_args:
- -v
# NOTE(review): empty value (null) as written; `files` and `dirs` below look
# like its intended children. TODO confirm.
local:
files: []
dirs: []
# NOTE(review): empty value (null) as written; `package_manager_prefixes`
# may have been meant as its child. TODO confirm.
package_json:
package_manager_prefixes: []
# Situations in which this tool is the suggested choice.
use_when:
- Extract text from PDFs for reading, summarization, or search
# Situations in which this tool should not be used.
avoid_when:
- The PDF is scanned images and needs OCR
# NOTE(review): empty value (null) as written; `level` through
# `confirmation_required_for` look like its intended children. TODO confirm.
risk:
level: low
# Declared effects: the tool reads files and writes files.
effects:
- read_files
- write_files
requires_auth: false
destructive: false
# No actions are listed as needing confirmation.
confirmation_required_for: []
# Free-text usage advice for this tool.
guardrails:
- Use OCR tools for image-only PDFs when extracted text is empty or garbled.