servo_fetch/lib.rs
1//! Web content extraction library powered by Servo and Readability.
2//!
3//! This crate provides utilities for extracting readable content from HTML:
4//!
5//! - [`extract`] — Convert HTML into Markdown or structured JSON using
6//! Mozilla's Readability algorithm.
7//! - [`layout`] — CSS layout heuristics to detect and strip navbars,
8//! sidebars, and footers before extraction.
9//! - [`sanitize`] — Strip ANSI escape sequences and control characters
10//! from output strings.
11
// Crate-wide lint configuration.
// `forbid` is stricter than `deny`: the level cannot be lowered again by an
// `#[allow(unsafe_code)]` further down, so `unsafe` is rejected crate-wide.
12#![forbid(unsafe_code)]
// Warn whenever a public item is missing documentation.
13#![warn(missing_docs)]
14
// Public modules of the crate (summaries follow the crate-level docs above).
// HTML to Markdown / structured JSON conversion using Readability.
15pub mod extract;
// CSS layout heuristics for detecting and stripping navbars, sidebars, and footers.
16pub mod layout;
// Stripping of ANSI escape sequences and control characters from output strings.
17pub mod sanitize;