kreuzberg 4.4.2

High-performance document intelligence library for Rust. Extract text, metadata, and structured data from PDFs, Office documents, images, and 75+ formats with async/sync APIs.
Documentation
//! PDF-to-Markdown renderer using segment-level font analysis.
//!
//! Converts PDF documents into structured markdown by analyzing pdfium text segments
//! (pre-merged character runs sharing baseline + font settings) to reconstruct headings,
//! paragraphs, inline formatting, and list items.

mod assembly;
mod bridge;
mod classify;
mod columns;
mod constants;
mod lines;
mod paragraphs;
mod pipeline;
mod render;
mod types;

pub use pipeline::render_document_as_markdown_with_tables;
pub use render::inject_image_placeholders;