pub struct EpubFileLoader<'a, T, P = RawTextProcessor> { /* private fields */ }
Available on crate feature epub only.
EpubFileLoader is a utility for loading epub files from the filesystem using glob patterns or directory paths. It provides methods to read file contents and handle errors gracefully.
§Errors
This module defines a custom error type EpubLoaderError which can represent various errors that might occur during file loading operations, such as any FileLoaderError alongside specific EPUB-related errors.
§Example Usage
use rig::loaders::{EpubFileLoader, RawTextProcessor, StripXmlProcessor};
fn main() -> Result<(), Box<dyn std::error::Error>> {
// Create a FileLoader using a glob pattern
let loader = EpubFileLoader::<_, RawTextProcessor>::with_glob("tests/data/*.epub")?;
// Load epub file contents by chapter, ignoring any errors
let contents = loader
.load_with_path()
.ignore_errors()
.by_chapter()
.ignore_errors();
for (path, chapters) in contents {
println!("{}", path.display());
for (idx, chapter) in chapters {
println!("Chapter {} begins", idx);
println!("{}", chapter);
println!("Chapter {} ends", idx);
}
}
// Create a FileLoader using a glob pattern with stripping xml
let loader = EpubFileLoader::<_, StripXmlProcessor>::with_glob("tests/data/*.epub")?;
// Load epub file contents by chapter, ignoring any errors
let contents = loader
.load_with_path()
.ignore_errors()
.by_chapter()
.ignore_errors();
for (path, chapters) in contents {
println!("{}", path.display());
for (idx, chapter) in chapters {
println!("Chapter {} begins", idx);
println!("{}", chapter);
println!("Chapter {} ends", idx);
}
}
Ok(())
}
EpubFileLoader uses strict typing between the iterator methods so that transitions between the different loader states and their methods are checked by the compiler.
Implementations§
Source§impl<'a, P> EpubFileLoader<'a, Result<PathBuf, EpubLoaderError>, P>
impl<'a, P> EpubFileLoader<'a, Result<PathBuf, EpubLoaderError>, P>
Sourcepub fn load(
self,
) -> EpubFileLoader<'a, Result<EpubDoc<BufReader<File>>, EpubLoaderError>, P>
pub fn load( self, ) -> EpubFileLoader<'a, Result<EpubDoc<BufReader<File>>, EpubLoaderError>, P>
Loads the contents of the epub files within the iterator returned by EpubFileLoader::with_glob or EpubFileLoader::with_dir. Loaded EPUB documents are raw EPUB instances that can be further processed (by chapter, etc).
§Example
Load epub files in directory “tests/data/*.epub” and return the loaded documents
use rig::loaders::EpubFileLoader;
let content = EpubFileLoader::<_, RawTextProcessor>::with_glob("tests/data/*.epub")?.load().into_iter();
for result in content {
match result {
Ok(doc) => println!("{:?}", doc),
Err(e) => eprintln!("Error reading epub: {}", e),
}
}
Sourcepub fn load_with_path(
self,
) -> EpubFileLoader<'a, Result<(PathBuf, EpubDoc<BufReader<File>>), EpubLoaderError>, P>
pub fn load_with_path( self, ) -> EpubFileLoader<'a, Result<(PathBuf, EpubDoc<BufReader<File>>), EpubLoaderError>, P>
Loads the contents of the epub files within the iterator returned by EpubFileLoader::with_glob or EpubFileLoader::with_dir. Loaded EPUB documents are raw EPUB instances with their path that can be further processed.
§Example
Load epub files in directory “tests/data/*.epub” and return the loaded documents
use rig::loaders::EpubFileLoader;
let content = EpubFileLoader::<_, RawTextProcessor>::with_glob("tests/data/*.epub").unwrap().load_with_path().into_iter();
for result in content {
match result {
Ok((path, doc)) => println!("{:?} {:?}", path, doc),
Err(e) => eprintln!("Error reading epub: {}", e),
}
}
Source§impl<'a, P> EpubFileLoader<'a, Result<PathBuf, EpubLoaderError>, P>where
P: TextProcessor,
impl<'a, P> EpubFileLoader<'a, Result<PathBuf, EpubLoaderError>, P>where
P: TextProcessor,
Sourcepub fn read(self) -> EpubFileLoader<'a, Result<String, EpubLoaderError>, P>
pub fn read(self) -> EpubFileLoader<'a, Result<String, EpubLoaderError>, P>
Directly reads the contents of the epub files within the iterator returned by EpubFileLoader::with_glob or EpubFileLoader::with_dir.
§Example
Read epub files in directory “tests/data/*.epub” and return the contents of the documents.
let content = EpubFileLoader::<_, RawTextProcessor>::with_glob("tests/data/*.epub")?.read().into_iter();
for result in content {
match result {
Ok(content) => println!("{}", content),
Err(e) => eprintln!("Error reading epub: {}", e),
}
}
Sourcepub fn read_with_path(
self,
) -> EpubFileLoader<'a, Result<(PathBuf, String), EpubLoaderError>, P>
pub fn read_with_path( self, ) -> EpubFileLoader<'a, Result<(PathBuf, String), EpubLoaderError>, P>
Directly reads the contents of the epub files within the iterator returned by EpubFileLoader::with_glob or EpubFileLoader::with_dir and returns the path along with the content.
§Example
Read epub files in directory “tests/data/*.epub” and return the content and paths of the documents.
let content = EpubFileLoader::<_, RawTextProcessor>::with_glob("tests/data/*.epub")?.read_with_path().into_iter();
for result in content {
match result {
Ok((path, content)) => println!("{:?} {}", path, content),
Err(e) => eprintln!("Error reading epub: {}", e),
}
}
Source§impl<'a, P> EpubFileLoader<'a, EpubDoc<BufReader<File>>, P>where
P: TextProcessor + 'a,
impl<'a, P> EpubFileLoader<'a, EpubDoc<BufReader<File>>, P>where
P: TextProcessor + 'a,
Sourcepub fn by_chapter(
self,
) -> EpubFileLoader<'a, Result<String, EpubLoaderError>, P>
pub fn by_chapter( self, ) -> EpubFileLoader<'a, Result<String, EpubLoaderError>, P>
Chunks the chapters of a loaded document by chapter, flattened as a single vector.
§Example
Load epub files in directory “tests/data/*.epub” and chunk all documents into their chapters.
let content = EpubFileLoader::<_, RawTextProcessor>::with_glob("tests/data/*.epub")?.load().ignore_errors().by_chapter().ignore_errors().into_iter();
for result in content {
println!("{}", result);
}
Source§impl<'a, P: TextProcessor> EpubFileLoader<'a, (PathBuf, EpubDoc<BufReader<File>>), P>
impl<'a, P: TextProcessor> EpubFileLoader<'a, (PathBuf, EpubDoc<BufReader<File>>), P>
Sourcepub fn by_chapter(
self,
) -> EpubFileLoader<'a, (PathBuf, Vec<(usize, Result<String, EpubLoaderError>)>), P>
pub fn by_chapter( self, ) -> EpubFileLoader<'a, (PathBuf, Vec<(usize, Result<String, EpubLoaderError>)>), P>
Chunks each loaded document by chapter, producing a vector of documents keyed by path, with each document containing an inner vector of chapters indexed by chapter number.
§Example
Read epub files in directory “tests/data/*.epub” and chunk each document, keyed by path, into its chapters.
let content = EpubFileLoader::<_, RawTextProcessor>::with_glob("tests/data/*.epub")?
.load_with_path()
.ignore_errors()
.by_chapter()
.ignore_errors()
.into_iter();
for result in content {
println!("{:?}", result);
}
Source§impl<'a, P> EpubFileLoader<'a, (PathBuf, Vec<(usize, Result<String, EpubLoaderError>)>), P>where
P: TextProcessor,
impl<'a, P> EpubFileLoader<'a, (PathBuf, Vec<(usize, Result<String, EpubLoaderError>)>), P>where
P: TextProcessor,
Sourcepub fn ignore_errors(
self,
) -> EpubFileLoader<'a, (PathBuf, Vec<(usize, String)>), P>
pub fn ignore_errors( self, ) -> EpubFileLoader<'a, (PathBuf, Vec<(usize, String)>), P>
Ignores errors in the iterator, returning only successful results. This can be used on any EpubFileLoader state whose iterator items are results.
§Example
Read files in directory “tests/data/*.epub” and ignore errors from unreadable files.
let content = EpubFileLoader::<_, RawTextProcessor>::with_glob("tests/data/*.epub")?.read().ignore_errors().into_iter();
for result in content {
println!("{}", result)
}
Source§impl<'a, P, T: 'a> EpubFileLoader<'a, Result<T, EpubLoaderError>, P>
impl<'a, P, T: 'a> EpubFileLoader<'a, Result<T, EpubLoaderError>, P>
Sourcepub fn ignore_errors(self) -> EpubFileLoader<'a, T, P>
pub fn ignore_errors(self) -> EpubFileLoader<'a, T, P>
Ignores errors in the iterator, returning only successful results. This can be used on any EpubFileLoader state whose iterator items are results.
§Example
Read files in directory “tests/data/*.epub” and ignore errors from unreadable files.
let content = EpubFileLoader::<_, RawTextProcessor>::with_glob("tests/data/*.epub")?.read().ignore_errors().into_iter();
for result in content {
println!("{}", result)
}
Source§impl<P> EpubFileLoader<'_, Result<PathBuf, FileLoaderError>, P>
impl<P> EpubFileLoader<'_, Result<PathBuf, FileLoaderError>, P>
Sourcepub fn with_glob(
pattern: &str,
) -> Result<EpubFileLoader<'_, Result<PathBuf, EpubLoaderError>, P>, EpubLoaderError>
pub fn with_glob( pattern: &str, ) -> Result<EpubFileLoader<'_, Result<PathBuf, EpubLoaderError>, P>, EpubLoaderError>
Creates a new EpubFileLoader using a glob pattern to match files.
§Example
Create an EpubFileLoader for all .epub files that match the glob “tests/data/*.epub”.
let loader = EpubFileLoader::<_, RawTextProcessor>::with_glob("tests/data/*.epub")?;
Sourcepub fn with_dir(
directory: &str,
) -> Result<EpubFileLoader<'_, Result<PathBuf, EpubLoaderError>, P>, EpubLoaderError>
pub fn with_dir( directory: &str, ) -> Result<EpubFileLoader<'_, Result<PathBuf, EpubLoaderError>, P>, EpubLoaderError>
Creates a new EpubFileLoader on all files within a directory.
§Example
Create an EpubFileLoader for all files that are in the directory “files”.
let loader = EpubFileLoader::<_, RawTextProcessor>::with_dir("files")?;
Trait Implementations§
Source§impl<'a, T, P> IntoIterator for EpubFileLoader<'a, T, P>
impl<'a, T, P> IntoIterator for EpubFileLoader<'a, T, P>
Auto Trait Implementations§
impl<'a, T, P> Freeze for EpubFileLoader<'a, T, P>
impl<'a, T, P = RawTextProcessor> !RefUnwindSafe for EpubFileLoader<'a, T, P>
impl<'a, T, P = RawTextProcessor> !Send for EpubFileLoader<'a, T, P>
impl<'a, T, P = RawTextProcessor> !Sync for EpubFileLoader<'a, T, P>
impl<'a, T, P> Unpin for EpubFileLoader<'a, T, P>where
P: Unpin,
impl<'a, T, P = RawTextProcessor> !UnwindSafe for EpubFileLoader<'a, T, P>
Blanket Implementations§
Source§impl<T> BorrowMut<T> for Twhere
T: ?Sized,
impl<T> BorrowMut<T> for Twhere
T: ?Sized,
Source§fn borrow_mut(&mut self) -> &mut T
fn borrow_mut(&mut self) -> &mut T
Source§impl<T> Instrument for T
impl<T> Instrument for T
Source§fn instrument(self, span: Span) -> Instrumented<Self>
fn instrument(self, span: Span) -> Instrumented<Self>
Source§fn in_current_span(self) -> Instrumented<Self>
fn in_current_span(self) -> Instrumented<Self>
Source§impl<T> Instrument for T
impl<T> Instrument for T
Source§fn instrument(self, span: Span) -> Instrumented<Self>
fn instrument(self, span: Span) -> Instrumented<Self>
Source§fn in_current_span(self) -> Instrumented<Self>
fn in_current_span(self) -> Instrumented<Self>
Source§impl<T> IntoEither for T
impl<T> IntoEither for T
Source§fn into_either(self, into_left: bool) -> Either<Self, Self>
fn into_either(self, into_left: bool) -> Either<Self, Self>
Converts self into a Left variant of Either<Self, Self> if into_left is true. Converts self into a Right variant of Either<Self, Self> otherwise. Read more
Source§fn into_either_with<F>(self, into_left: F) -> Either<Self, Self>
fn into_either_with<F>(self, into_left: F) -> Either<Self, Self>
Converts self into a Left variant of Either<Self, Self> if into_left(&self) returns true. Converts self into a Right variant of Either<Self, Self> otherwise. Read more