Skip to main content

Crate dongler_core

Crate dongler_core 

Source

Re-exports§

pub use archive::ArchiveEngine;
pub use csv::CsvEngine;
pub use engine::ExtractionEngine;
pub use engine::PlainTextEngine;
pub use error::DonglerError;
pub use error::Result;
pub use format::ExtractionStatus;
pub use format::InputFormat;
pub use image::ImageEngine;
pub use ir::Asset;
pub use ir::BBox;
pub use ir::BatchResult;
pub use ir::Block;
pub use ir::BlockKind;
pub use ir::Confidence;
pub use ir::Document;
pub use ir::ExtractOptions;
pub use ir::FigureBlock;
pub use ir::ImageObject;
pub use ir::Line;
pub use ir::Metadata;
pub use ir::Page;
pub use ir::Provenance;
pub use ir::Route;
pub use ir::SourceAnchor;
pub use ir::Span;
pub use ir::TableBlock;
pub use ir::TableCell;
pub use ir::TextBlock;
pub use ir::TextSource;
pub use ir::Warning;
pub use json::JsonEngine;
pub use openxml::OpenXmlEngine;
pub use pdf::PdfEngine;
pub use render::JsonRenderer;
pub use render::LatexRenderer;
pub use render::MarkdownRenderer;
pub use render::Renderer;
pub use source::FormatSourceLoader;
pub use source::ImageSourceLoader;
pub use source::PdfSourceLoader;
pub use source::Source;
pub use source::SourceLoader;
pub use source::TextSourceLoader;
pub use textual::EmailEngine;
pub use textual::HtmlEngine;
pub use textual::XmlEngine;

Modules§

archive
csv
engine
error
format
image
ir
json
openxml
pdf
render
source
textual

Functions§

detect_format
extract_bytes
Extract a document from in-memory bytes, detecting the format from the filename (its extension only — the file is never read from disk).
extract_bytes_with_options
load_many
load_path
load_path_with_options
parse_text
to_json
to_latex
to_markdown