pub struct CitlDataLoader { /* private fields */ }
CITL DataLoader using alimentar for efficient data loading
Implementations§
impl CitlDataLoader
pub fn with_config(config: CitlLoaderConfig) -> Self
Create a new CITL DataLoader with a custom configuration.
pub fn batch_size(self, size: usize) -> Self
Set the batch size.
pub fn min_confidence(self, confidence: f32) -> Self
Set the minimum confidence threshold.
pub fn merge_strategy(self, strategy: MergeStrategy) -> Self
Set the merge strategy.
pub fn load_parquet<P: AsRef<Path>>(&self, path: P) -> Result<CitlBatchIterator>
Load a CITL corpus from a Parquet file using alimentar.
Returns an iterator over batches of TrainingExamples.
pub fn load_jsonl<P: AsRef<Path>>(
    &self,
    path: P,
) -> Result<(Vec<TrainingExample>, ImportStats)>
Load a CITL corpus from a JSONL file (streaming).
pub fn config(&self) -> &CitlLoaderConfig
Get the configuration.
Trait Implementations§
Auto Trait Implementations§
impl Freeze for CitlDataLoader
impl RefUnwindSafe for CitlDataLoader
impl Send for CitlDataLoader
impl Sync for CitlDataLoader
impl Unpin for CitlDataLoader
impl UnwindSafe for CitlDataLoader
Blanket Implementations§
impl<T> BorrowMut<T> for T
where
    T: ?Sized,
fn borrow_mut(&mut self) -> &mut T
Mutably borrows from an owned value. Read more
impl<T> Instrument for T
fn instrument(self, span: Span) -> Instrumented<Self>
fn in_current_span(self) -> Instrumented<Self>
impl<T> IntoEither for T
fn into_either(self, into_left: bool) -> Either<Self, Self>
Converts self into a Left variant of Either<Self, Self> if into_left is true. Converts self into a Right variant of Either<Self, Self> otherwise. Read more
fn into_either_with<F>(self, into_left: F) -> Either<Self, Self>
Converts self into a Left variant of Either<Self, Self> if into_left(&self) returns true. Converts self into a Right variant of Either<Self, Self> otherwise. Read more
impl<T> Pointable for T
impl<T> PolicyExt for T
where
    T: ?Sized,
impl<SS, SP> SupersetOf<SS> for SP
where
    SS: SubsetOf<SP>,
fn to_subset(&self) -> Option<SS>
The inverse inclusion map: attempts to construct self from the equivalent element of its superset. Read more
fn is_in_subset(&self) -> bool
Checks if self is actually part of its subset T (and can be converted to it).
fn to_subset_unchecked(&self) -> SS
Use with care! Same as self.to_subset but without any property checks. Always succeeds.
fn from_subset(element: &SS) -> SP
The inclusion map: converts self to the equivalent element of its superset.