halldyll-core 0.1.0

Core scraping engine for Halldyll, a high-performance async web scraper for AI agents.
Documentation
//! Parse - Content extraction (text, links, images, videos, metadata)
//!
//! This module root declares the extraction submodules and re-exports
//! selected items from each of them, so callers can import those items
//! from here without naming the submodule.

// Submodules, listed alphabetically.
pub mod audios;
pub mod html;
pub mod images;
pub mod jsonld;
pub mod links;
pub mod metadata;
pub mod opengraph;
pub mod router;
pub mod text;
pub mod videos;

// Flat re-exports, in the same order as the submodule list above.
pub use audios::AudioExtractor;
pub use html::HtmlParser;
pub use images::ImageExtractor;
pub use jsonld::JsonLdExtractor;
pub use links::LinkExtractor;
pub use metadata::MetadataExtractor;
pub use opengraph::OpenGraphExtractor;
pub use router::ContentRouter;
// `router::ContentType` is exposed under the alias `ParsedContentType`.
// NOTE(review): presumably renamed to avoid clashing with another
// `ContentType` elsewhere in the crate — confirm.
pub use router::ContentType as ParsedContentType;
pub use text::TextExtractor;
pub use videos::VideoExtractor;