orbok-extract 0.3.0

orbok document extraction pipeline: extractor trait, normalization, text/markdown extractors (RFC-005)
Documentation
//! # orbok-extract
//!
//! Text extraction (RFC-005): pluggable extractors turn
//! boundary-validated source files into normalized, line-located segments.
//! Extraction output is derived data — cacheable, rebuildable, never
//! authoritative.

// Public modules: these paths are part of the crate's external API.
pub mod chunker; // defines `chunk`, re-exported at the crate root below
pub mod normalize; // presumably the normalization step named in the crate docs — confirm in module
pub mod registry; // defines `ExtractorRegistry`, re-exported at the crate root below
pub mod types; // defines the extractor/segment types re-exported at the crate root below

// Private modules: not nameable from outside the crate.
// NOTE(review): presumably the built-in Markdown and plain-text extractors — confirm.
mod markdown;
mod text;

// Test module, compiled only for test builds.
#[cfg(test)]
mod tests;

// Crate-root re-exports, so callers can write `orbok_extract::chunk` rather
// than `orbok_extract::chunker::chunk`. Kept in alphabetical path order to
// match the `mod` declarations above.
pub use chunker::chunk;
pub use registry::ExtractorRegistry;
pub use types::{
    DocumentExtractor, ExtractOutput, ExtractedSegment, LocationQuality, SegmentKind,
};