pub struct Dataset { /* private fields */ }
Implementations§
Source§impl Dataset
impl Dataset
pub fn new(tokens: Vec<u32>, seq_len: usize) -> Self
Source pub fn from_file<P: AsRef<Path>>(
path: P,
tokenizer: &Tokenizer,
seq_len: usize,
) -> Result<Self>
pub fn from_file<P: AsRef<Path>>( path: P, tokenizer: &Tokenizer, seq_len: usize, ) -> Result<Self>
Load dataset from a JSONL file where each line has a “text” field. Supports .gz and .zst/.zstd compressed files.
Source pub fn from_stdin(tokenizer: &Tokenizer, seq_len: usize) -> Result<Self>
pub fn from_stdin(tokenizer: &Tokenizer, seq_len: usize) -> Result<Self>
Load dataset from stdin (JSONL format).
Source pub fn from_files<P: AsRef<Path>>(
paths: &[P],
tokenizer: &Tokenizer,
seq_len: usize,
) -> Result<Self>
pub fn from_files<P: AsRef<Path>>( paths: &[P], tokenizer: &Tokenizer, seq_len: usize, ) -> Result<Self>
Load dataset from multiple JSONL files. Supports .gz and .zst/.zstd compressed files.
pub fn len(&self) -> usize
pub fn is_empty(&self) -> bool
pub fn get_batch( &self, indices: &[usize], device: &Device, ) -> Result<(Tensor, Tensor)>
pub fn tokens(&self) -> &[u32]
Auto Trait Implementations§
impl Freeze for Dataset
impl RefUnwindSafe for Dataset
impl Send for Dataset
impl Sync for Dataset
impl Unpin for Dataset
impl UnsafeUnpin for Dataset
impl UnwindSafe for Dataset
Blanket Implementations§
Source§impl<T> BorrowMut<T> for T where
T: ?Sized,
impl<T> BorrowMut<T> for T where
T: ?Sized,
Source§fn borrow_mut(&mut self) -> &mut T
fn borrow_mut(&mut self) -> &mut T
Mutably borrows from an owned value. Read more
Source§impl<T> Instrument for T
impl<T> Instrument for T
Source§fn instrument(self, span: Span) -> Instrumented<Self>
fn instrument(self, span: Span) -> Instrumented<Self>
Source§fn in_current_span(self) -> Instrumented<Self>
fn in_current_span(self) -> Instrumented<Self>
Source§impl<T> IntoEither for T
impl<T> IntoEither for T
Source§fn into_either(self, into_left: bool) -> Either<Self, Self>
fn into_either(self, into_left: bool) -> Either<Self, Self>
Converts self into a Left variant of Either<Self, Self> if into_left is true.
Converts self into a Right variant of Either<Self, Self> otherwise. Read more
Source§fn into_either_with<F>(self, into_left: F) -> Either<Self, Self>
fn into_either_with<F>(self, into_left: F) -> Either<Self, Self>
Converts self into a Left variant of Either<Self, Self> if into_left(&self) returns true.
Converts self into a Right variant of Either<Self, Self> otherwise. Read more