harper_core

Struct Document

source
pub struct Document { /* private fields */ }
Expand description

A document containing some amount of lexed and parsed English text.

Implementations§

source§

impl Document

source

pub fn new( text: &str, parser: &mut impl Parser, dictionary: &impl Dictionary, ) -> Self

Lexes and parses text to produce a document using a provided language parser and dictionary.

source

pub fn new_curated(text: &str, parser: &mut impl Parser) -> Self

Lexes and parses text to produce a document using a provided language parser and the included curated dictionary.

source

pub fn new_from_vec( source: Lrc<Vec<char>>, parser: &mut impl Parser, dictionary: &impl Dictionary, ) -> Self

Lexes and parses an already-collected character buffer (source) to produce a document using a provided language parser and dictionary.

source

pub fn new_plain_english_curated(text: &str) -> Self

Parse text to produce a document using the built-in PlainEnglish parser and curated dictionary.

source

pub fn new_plain_english(text: &str, dictionary: &impl Dictionary) -> Self

Parse text to produce a document using the built-in PlainEnglish parser and a provided dictionary.

source

pub fn new_markdown_curated(text: &str) -> Self

Parse text to produce a document using the built-in Markdown parser and curated dictionary.

source

pub fn new_markdown(text: &str, dictionary: &impl Dictionary) -> Self

Parse text to produce a document using the built-in Markdown parser and a provided dictionary.

source

pub fn get_token_at_char_index(&self, char_index: usize) -> Option<Token>

source

pub fn get_token(&self, index: usize) -> Option<Token>

Defensively attempt to grab a specific token.

source

pub fn tokens(&self) -> impl Iterator<Item = Token> + '_

Get an iterator over all the tokens contained in the document.

source

pub fn fat_tokens(&self) -> impl Iterator<Item = FatToken> + '_

Get an iterator over all the tokens contained in the document, yielded as FatTokens.

source

pub fn chunks(&self) -> impl Iterator<Item = &[Token]> + '_

Get an iterator over token slices that represent the individual chunks in a document.

For example, the following sentence contains two chunks separated by a comma:

Here is an example, it is short.
source

pub fn sentences(&self) -> impl Iterator<Item = &[Token]> + '_

Get an iterator over token slices that represent the individual sentences in a document.

source

pub fn get_span_content(&self, span: Span) -> &[char]

source

pub fn get_span_content_str(&self, span: Span) -> String

source

pub fn get_full_string(&self) -> String

source

pub fn get_full_content(&self) -> &[char]

source

pub fn get_source(&self) -> &[char]

source

pub fn get_tokens(&self) -> &[Token]

Trait Implementations§

source§

impl Clone for Document

source§

fn clone(&self) -> Document

Returns a copy of the value. Read more
1.0.0 · source§

fn clone_from(&mut self, source: &Self)

Performs copy-assignment from source. Read more
source§

impl Debug for Document

source§

fn fmt(&self, f: &mut Formatter<'_>) -> Result

Formats the value using the given formatter. Read more
source§

impl Default for Document

source§

fn default() -> Self

Returns the “default value” for a type. Read more
source§

impl Display for Document

source§

fn fmt(&self, f: &mut Formatter<'_>) -> Result

Formats the value using the given formatter. Read more
source§

impl TokenStringExt for Document

source§

fn first_word(&self) -> Option<Token>

source§

fn last_word(&self) -> Option<Token>

source§

fn iter_word_indices(&self) -> impl Iterator<Item = usize> + '_

source§

fn iter_words(&self) -> impl Iterator<Item = Token> + '_

source§

fn first_space(&self) -> Option<Token>

source§

fn last_space(&self) -> Option<Token>

source§

fn iter_space_indices(&self) -> impl Iterator<Item = usize> + '_

source§

fn iter_spaces(&self) -> impl Iterator<Item = Token> + '_

source§

fn first_apostrophe(&self) -> Option<Token>

source§

fn last_apostrophe(&self) -> Option<Token>

source§

fn iter_apostrophe_indices(&self) -> impl Iterator<Item = usize> + '_

source§

fn iter_apostrophes(&self) -> impl Iterator<Item = Token> + '_

source§

fn first_pipe(&self) -> Option<Token>

source§

fn last_pipe(&self) -> Option<Token>

source§

fn iter_pipe_indices(&self) -> impl Iterator<Item = usize> + '_

source§

fn iter_pipes(&self) -> impl Iterator<Item = Token> + '_

source§

fn first_quote(&self) -> Option<Token>

source§

fn last_quote(&self) -> Option<Token>

source§

fn iter_quote_indices(&self) -> impl Iterator<Item = usize> + '_

source§

fn iter_quotes(&self) -> impl Iterator<Item = Token> + '_

source§

fn first_number(&self) -> Option<Token>

source§

fn last_number(&self) -> Option<Token>

source§

fn iter_number_indices(&self) -> impl Iterator<Item = usize> + '_

source§

fn iter_numbers(&self) -> impl Iterator<Item = Token> + '_

source§

fn first_at(&self) -> Option<Token>

source§

fn last_at(&self) -> Option<Token>

source§

fn iter_at_indices(&self) -> impl Iterator<Item = usize> + '_

source§

fn iter_ats(&self) -> impl Iterator<Item = Token> + '_

source§

fn first_ellipsis(&self) -> Option<Token>

source§

fn last_ellipsis(&self) -> Option<Token>

source§

fn iter_ellipsis_indices(&self) -> impl Iterator<Item = usize> + '_

source§

fn iter_ellipsiss(&self) -> impl Iterator<Item = Token> + '_

source§

fn first_unlintable(&self) -> Option<Token>

source§

fn last_unlintable(&self) -> Option<Token>

source§

fn iter_unlintable_indices(&self) -> impl Iterator<Item = usize> + '_

source§

fn iter_unlintables(&self) -> impl Iterator<Item = Token> + '_

source§

fn first_sentence_word(&self) -> Option<Token>

source§

fn first_non_whitespace(&self) -> Option<Token>

source§

fn span(&self) -> Option<Span>

Grab the span that represents the beginning of the first element and the end of the last element.
source§

fn iter_linking_verb_indices(&self) -> impl Iterator<Item = usize> + '_

source§

fn iter_linking_verbs(&self) -> impl Iterator<Item = Token> + '_

Auto Trait Implementations§

Blanket Implementations§

source§

impl<T> Any for T
where T: 'static + ?Sized,

source§

fn type_id(&self) -> TypeId

Gets the TypeId of self. Read more
source§

impl<T> Borrow<T> for T
where T: ?Sized,

source§

fn borrow(&self) -> &T

Immutably borrows from an owned value. Read more
source§

impl<T> BorrowMut<T> for T
where T: ?Sized,

source§

fn borrow_mut(&mut self) -> &mut T

Mutably borrows from an owned value. Read more
source§

impl<T> CloneToUninit for T
where T: Clone,

source§

unsafe fn clone_to_uninit(&self, dst: *mut T)

🔬This is a nightly-only experimental API. (clone_to_uninit)
Performs copy-assignment from self to dst. Read more
source§

impl<T> From<T> for T

source§

fn from(t: T) -> T

Returns the argument unchanged.

source§

impl<T, U> Into<U> for T
where U: From<T>,

source§

fn into(self) -> U

Calls U::from(self).

That is, this conversion is whatever the implementation of From<T> for U chooses to do.

source§

impl<T> IntoEither for T

source§

fn into_either(self, into_left: bool) -> Either<Self, Self>

Converts self into a Left variant of Either<Self, Self> if into_left is true. Converts self into a Right variant of Either<Self, Self> otherwise. Read more
source§

fn into_either_with<F>(self, into_left: F) -> Either<Self, Self>
where F: FnOnce(&Self) -> bool,

Converts self into a Left variant of Either<Self, Self> if into_left(&self) returns true. Converts self into a Right variant of Either<Self, Self> otherwise. Read more
source§

impl<T> ToOwned for T
where T: Clone,

source§

type Owned = T

The resulting type after obtaining ownership.
source§

fn to_owned(&self) -> T

Creates owned data from borrowed data, usually by cloning. Read more
source§

fn clone_into(&self, target: &mut T)

Uses borrowed data to replace owned data, usually by cloning. Read more
source§

impl<T> ToString for T
where T: Display + ?Sized,

source§

default fn to_string(&self) -> String

Converts the given value to a String. Read more
source§

impl<T, U> TryFrom<U> for T
where U: Into<T>,

source§

type Error = Infallible

The type returned in the event of a conversion error.
source§

fn try_from(value: U) -> Result<T, <T as TryFrom<U>>::Error>

Performs the conversion.
source§

impl<T, U> TryInto<U> for T
where U: TryFrom<T>,

source§

type Error = <U as TryFrom<T>>::Error

The type returned in the event of a conversion error.
source§

fn try_into(self) -> Result<U, <U as TryFrom<T>>::Error>

Performs the conversion.