Struct graphannis::CorpusStorage

source ·

pub struct CorpusStorage { /* private fields */ }

Expand description

A thread-safe API for managing corpora stored in a common location on the file system.

Multiple corpora can be part of a corpus storage, and they are identified by their unique names. Corpora are loaded from disk into main memory on demand: an internal main-memory cache is used to avoid reloading a recently queried corpus from disk.

Struct graphannis::CorpusStorage · Copy item path

Implementations§

impl CorpusStorage

pub fn with_cache_strategy( db_dir: &Path, cache_strategy: CacheStrategy, use_parallel_joins: bool ) -> Result<CorpusStorage>

pub fn with_auto_cache_size( db_dir: &Path, use_parallel_joins: bool ) -> Result<CorpusStorage>

pub fn list(&self) -> Result<Vec<CorpusInfo>>

pub fn info(&self, corpus_name: &str) -> Result<CorpusInfo>

pub fn import_all_from_zip<R, F>( &self, zip_file: R, disk_based: bool, overwrite_existing: bool, progress_callback: F ) -> Result<Vec<String>> where R: Read + Seek, F: Fn(&str),

pub fn import_from_fs<F>( &self, path: &Path, format: ImportFormat, corpus_name: Option<String>, disk_based: bool, overwrite_existing: bool, progress_callback: F ) -> Result<String> where F: Fn(&str),

pub fn export_to_zip<W, F>( &self, corpus_name: &str, use_corpus_subdirectory: bool, zip: &mut ZipWriter<W>, progress_callback: F ) -> Result<()> where W: Write + Seek, F: Fn(&str),

pub fn export_to_fs<S: AsRef<str>>( &self, corpora: &[S], path: &Path, format: ExportFormat ) -> Result<()>

pub fn delete(&self, corpus_name: &str) -> Result<bool>

pub fn create_empty_corpus( &self, corpus_name: &str, disk_based: bool ) -> Result<bool>

pub fn apply_update( &self, corpus_name: &str, update: &mut GraphUpdate ) -> Result<()>

pub fn preload(&self, corpus_name: &str) -> Result<()>

pub fn unload(&self, corpus_name: &str) -> Result<()>

pub fn validate_query<S: AsRef<str>>( &self, corpus_names: &[S], query: &str, query_language: QueryLanguage ) -> Result<bool>

pub fn plan<S: AsRef<str>>( &self, corpus_names: &[S], query: &str, query_language: QueryLanguage ) -> Result<String>

pub fn count<S: AsRef<str>>(&self, query: SearchQuery<'_, S>) -> Result<u64>

pub fn count_extra<S: AsRef<str>>( &self, query: SearchQuery<'_, S> ) -> Result<CountExtra>

pub fn find<S: AsRef<str>>( &self, query: SearchQuery<'_, S>, offset: usize, limit: Option<usize>, order: ResultOrder ) -> Result<Vec<String>>

pub fn subgraph( &self, corpus_name: &str, node_ids: Vec<String>, ctx_left: usize, ctx_right: usize, segmentation: Option<String> ) -> Result<AnnotationGraph>

§Handling of gaps

pub fn subgraph_for_query( &self, corpus_name: &str, query: &str, query_language: QueryLanguage, component_type_filter: Option<AnnotationComponentType> ) -> Result<AnnotationGraph>

pub fn subcorpus_graph( &self, corpus_name: &str, corpus_ids: Vec<String> ) -> Result<AnnotationGraph>

pub fn corpus_graph(&self, corpus_name: &str) -> Result<AnnotationGraph>

pub fn frequency<S: AsRef<str>>( &self, query: SearchQuery<'_, S>, definition: Vec<FrequencyDefEntry> ) -> Result<FrequencyTable<String>>

pub fn node_descriptions( &self, query: &str, query_language: QueryLanguage ) -> Result<Vec<QueryAttributeDescription>>

pub fn list_components( &self, corpus_name: &str, ctype: Option<AnnotationComponentType>, name: Option<&str> ) -> Result<Vec<Component<AnnotationComponentType>>>

pub fn list_node_annotations( &self, corpus_name: &str, list_values: bool, only_most_frequent_values: bool ) -> Result<Vec<Annotation>>

pub fn list_edge_annotations( &self, corpus_name: &str, component: &Component<AnnotationComponentType>, list_values: bool, only_most_frequent_values: bool ) -> Result<Vec<Annotation>>

Trait Implementations§

impl Drop for CorpusStorage

fn drop(&mut self)

Auto Trait Implementations§

impl !Freeze for CorpusStorage

impl RefUnwindSafe for CorpusStorage

impl Send for CorpusStorage

impl Sync for CorpusStorage

impl Unpin for CorpusStorage

impl UnwindSafe for CorpusStorage

Blanket Implementations§

impl<T> Any for T where T: 'static + ?Sized,

fn type_id(&self) -> TypeId

impl<T> Borrow<T> for T where T: ?Sized,

fn borrow(&self) -> &T

impl<T> BorrowMut<T> for T where T: ?Sized,

fn borrow_mut(&mut self) -> &mut T

impl<T> From<T> for T

fn from(t: T) -> T

impl<T, U> Into<U> for T where U: From<T>,

fn into(self) -> U

impl<T> IntoEither for T

fn into_either(self, into_left: bool) -> Either<Self, Self>

fn into_either_with<F>(self, into_left: F) -> Either<Self, Self> where F: FnOnce(&Self) -> bool,

impl<T> Pointable for T

const ALIGN: usize = _

type Init = T

unsafe fn init(init: <T as Pointable>::Init) -> usize

unsafe fn deref<'a>(ptr: usize) -> &'a T

unsafe fn deref_mut<'a>(ptr: usize) -> &'a mut T

unsafe fn drop(ptr: usize)

impl<T> Same for T

type Output = T

impl<T, U> TryFrom<U> for T where U: Into<T>,

type Error = Infallible

fn try_from(value: U) -> Result<T, <T as TryFrom<U>>::Error>

impl<T, U> TryInto<U> for T where U: TryFrom<T>,

type Error = <U as TryFrom<T>>::Error

fn try_into(self) -> Result<U, <U as TryFrom<T>>::Error>

impl<V, T> VZip<V> for T where V: MultiLane<T>,

fn vzip(self) -> V

Struct graphannis::CorpusStorage

pub fn import_all_from_zip<R, F>( &self, zip_file: R, disk_based: bool, overwrite_existing: bool, progress_callback: F ) -> Result<Vec<String>>
where R: Read + Seek, F: Fn(&str),

pub fn import_from_fs<F>( &self, path: &Path, format: ImportFormat, corpus_name: Option<String>, disk_based: bool, overwrite_existing: bool, progress_callback: F ) -> Result<String>
where F: Fn(&str),

pub fn export_to_zip<W, F>( &self, corpus_name: &str, use_corpus_subdirectory: bool, zip: &mut ZipWriter<W>, progress_callback: F ) -> Result<()>
where W: Write + Seek, F: Fn(&str),

impl<T> Any for T
where T: 'static + ?Sized,

impl<T> Borrow<T> for T
where T: ?Sized,

impl<T> BorrowMut<T> for T
where T: ?Sized,

impl<T, U> Into<U> for T
where U: From<T>,

fn into_either_with<F>(self, into_left: F) -> Either<Self, Self>
where F: FnOnce(&Self) -> bool,

impl<T, U> TryFrom<U> for T
where U: Into<T>,

impl<T, U> TryInto<U> for T
where U: TryFrom<T>,

impl<V, T> VZip<V> for T
where V: MultiLane<T>,