1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
// Copyright (c) 2026 vectorless developers
// SPDX-License-Identifier: Apache-2.0
//! Table of Contents (TOC) processing module.
//!
//! This module provides functionality to extract and verify document structure
//! from PDF Table of Contents:
//!
//! - **Detection** — Find TOC in document (regex + LLM fallback)
//! - **Parsing** — Convert TOC text to structured entries (LLM)
//! - **Assignment** — Map TOC pages to physical pages
//! - **Verification** — Sample verification of page assignments
//! - **Repair** — Fix incorrect assignments
//!
//! # Architecture
//!
//! ```text
//! PDF Pages
//!     │
//!     ▼
//! ┌─────────────────────────────────────────────────┐
//! │                  TocProcessor                   │
//! │                                                 │
//! │  ┌─────────┐  ┌─────────┐  ┌─────────┐          │
//! │  │Detector │─▶│ Parser  │─▶│Assigner │          │
//! │  └─────────┘  └─────────┘  └────┬────┘          │
//! │                                 │               │
//! │                                 ▼               │
//! │                          ┌─────────────┐        │
//! │                          │  Verifier   │        │
//! │                          └──────┬──────┘        │
//! │                                 │               │
//! │                                 ▼               │
//! │                          ┌─────────────┐        │
//! │                          │  Repairer   │        │
//! │                          └─────────────┘        │
//! └─────────────────────────────────────────────────┘
//!     │
//!     ▼
//! Vec<TocEntry>
//! ```
//!
//! # Example
//!
//! ```rust,no_run
//! use vectorless::parser::toc::TocProcessor;
//! use vectorless::parser::pdf::{PdfParser, PdfPage};
//!
//! # #[tokio::main]
//! # async fn main() -> vectorless::Result<()> {
//! // Parse PDF
//! let pdf_parser = PdfParser::new();
//! let result = pdf_parser.parse_file("document.pdf".as_ref())?;
//!
//! // Extract TOC
//! let processor = TocProcessor::new();
//! let entries = processor.process(&result.pages).await?;
//!
//! // Use entries
//! for entry in &entries {
//!     println!("{} - Page {:?}", entry.title, entry.physical_page);
//! }
//! # Ok(())
//! # }
//! ```
// Re-export main types
pub use ;
// Re-export components
pub use ;
pub use ;
pub use ;
pub use ;
pub use ;
pub use ;