readabilityrs/
lib.rs

1//! # ReadabilityRS
2//!
3//! A Rust port of Mozilla's Readability library for extracting article content from web pages.
4//!
5//! This library is a faithful port of [Mozilla Readability](https://github.com/mozilla/readability),
6//! the JavaScript library that powers Firefox Reader View.
7//!
8//! ## Example
9//!
10//! ```rust,no_run
11//! use readabilityrs::{Readability, ReadabilityOptions};
12//!
13//! let html = r#"<html><body><article><h1>Title</h1><p>Content...</p></article></body></html>"#;
14//! let url = "https://example.com/article";
15//!
16//! let options = ReadabilityOptions::default();
17//! let readability = Readability::new(html, Some(url), Some(options)).unwrap();
18//!
19//! if let Some(article) = readability.parse() {
20//!     println!("Title: {:?}", article.title);
21//!     println!("Content: {:?}", article.content);
22//! }
23//! ```
24
25mod article;
26mod cleaner;
27mod constants;
28mod content_extractor;
29mod dom_utils;
30mod error;
31mod metadata;
32mod options;
33mod post_processor;
34mod readability;
35mod readerable;
36mod scoring;
37mod utils;
38
39// Public API: items re-exported from the private modules declared above.
40pub use article::Article;
41pub use error::{ReadabilityError, Result};
42pub use options::ReadabilityOptions;
43pub use readability::Readability;
44pub use readerable::is_probably_readerable;