Trainer

pub struct Trainer;

Primary entry point for training in flodl.

Trainer is the default API for training a model, whether you have one GPU, many GPUs, or no GPU at all. The training loop is identical in all cases: Trainer::setup (or Trainer::builder) configures the model, detects the hardware, and enables distributed training automatically when multiple CUDA devices are available. On a single GPU or CPU it’s a no-op wrapper with zero DDP overhead.

For explicit multi-GPU control (manual gradient sync, custom replica wrapping) use Ddp directly. Ddp::wrap remains the entry point for advanced patterns (GAN, RL, progressive).

§Setup mode (user owns the loop)

Trainer::setup(&model, |dev| build_model(dev), |p| Adam::new(p, 0.001))?;

for (x, y) in &train_loader {
    let out = model.forward(&x)?;
    let loss = cross_entropy_loss(&out, &y)?;
    loss.backward()?;
    model.step()?;
}

§Builder mode (framework owns the loop)

let handle = Trainer::builder(model_factory, optim_factory, train_fn)
    .dataset(dataset)
    .batch_size(32)
    .num_epochs(10)
    .run()?;

let state = handle.join()?;

Implementations§

impl Trainer

pub fn setup<F, M, G, O>(model: &Graph, builder: F, optimizer: G) -> Result<()>
where
    F: Fn(Device) -> Result<M>,
    M: Module + 'static,
    G: Fn(&[Parameter]) -> O,
    O: Optimizer + 'static,

One-call setup: auto-detect GPUs, distribute the model, set the optimizer, and enable training mode.

  • Multi-GPU (2+ usable CUDA devices): replicates via Graph::distribute, creates per-replica optimizers, enables training.
  • Single-GPU / CPU: sets optimizer and training mode only (no DDP overhead).

Always prints a diagnostic summary to stderr showing detected hardware.

Trainer::setup(&model, |dev| build_model(dev), |p| Adam::new(p, 0.001))?;

for batch in model.epoch(epoch).activate() {
    let out = model.forward_batch(&batch?)?;
    let loss = cross_entropy_loss(&out, &targets)?; // targets for this batch
    loss.backward()?;
    model.step()?;
}

pub fn setup_with<F, M, G, O>(
    model: &Graph,
    builder: F,
    optimizer: G,
    config: DdpConfig,
) -> Result<()>
where
    F: Fn(Device) -> Result<M>,
    M: Module + 'static,
    G: Fn(&[Parameter]) -> O,
    O: Optimizer + 'static,

One-call setup with explicit configuration.

Like setup() but accepts a DdpConfig for controlling averaging cadence, speed hints, and overhead targets.

Trainer::setup_with(&model, builder, optimizer,
    DdpConfig::new().speed_hint(1, 2.3))?;

pub fn builder<F, M, G, O, T>(
    model_factory: F,
    optim_factory: G,
    train_fn: T,
) -> DdpBuilder<F, M, G, O, T>
where
    F: Fn(Device) -> Result<M> + Send + Sync + 'static,
    M: Module + 'static,
    G: Fn(&[Parameter]) -> O + Send + Sync + 'static,
    O: Optimizer + 'static,
    T: Fn(&M, &[Tensor]) -> Result<Variable> + Send + Sync + 'static,

Create a builder for framework-managed training.

The framework owns the training loop, data pipeline, and epoch management. On multi-GPU hardware, each device gets its own model replica and optimizer, and a coordinator triggers periodic parameter averaging based on the configured ApplyPolicy and AverageBackend. On a single GPU, training runs on the main thread with no coordination; the API is identical in both cases.

Returns a DdpBuilder for fluent configuration. Call .run() to spawn training, then .join() on the returned DdpHandle to block until completion.

§Example
use flodl::*;

let handle = Trainer::builder(
    |dev| model_factory(dev),
    |params| Adam::new(params, 0.001),
    |model, batch| { /* forward + loss */ },
)
.dataset(dataset)
.batch_size(32)
.num_epochs(10)
.policy(ApplyPolicy::Cadence)
.backend(AverageBackend::Nccl)
.run()?;

let state = handle.join()?;

pub fn setup_head<H, F, G, O>(head: &H, head_factory: F, optimizer: G) -> Result<()>
where
    H: HasGraph + 'static,
    F: Fn(Device) -> Result<H> + 'static,
    G: Fn(&[Parameter]) -> O,
    O: Optimizer + 'static,

One-call setup for a task-head wrapper (e.g. flodl-hf’s BertForSequenceClassification). The wrapper must implement HasGraph so Trainer can reach the underlying Graph.

Semantics match Trainer::setup exactly; the only difference is that head_factory builds a fresh wrapper (not a bare Graph) on each replica device. Useful when the training-loop code holds onto the wrapper’s richer surface (compute_loss, predict, attached tokenizer) but still wants transparent 1-or-N-GPU DDP.

let head = DistilBertForSequenceClassification::from_pretrained(repo)?;
let config = head.config().clone();
let num_labels = head.labels().len() as i64;

Trainer::setup_head(
    &head,
    move |dev| DistilBertForSequenceClassification::on_device(&config, num_labels, dev),
    |p| Adam::new(p, 5e-5),
)?;

for (enc, labels) in &batches {
    let loss = head.compute_loss(&enc, &labels)?;
    loss.backward()?;
    head.graph().step()?;
}

pub fn setup_head_with<H, F, G, O>(
    head: &H,
    head_factory: F,
    optimizer: G,
    config: DdpConfig,
) -> Result<()>
where
    H: HasGraph + 'static,
    F: Fn(Device) -> Result<H> + 'static,
    G: Fn(&[Parameter]) -> O,
    O: Optimizer + 'static,

Task-head variant of Trainer::setup_with. Same behaviour as Trainer::setup_head, but takes an explicit DdpConfig.
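A minimal sketch, combining the head and factory from the setup_head example above with the DdpConfig shown for setup_with (the speed_hint values are illustrative, not recommended settings):

```rust
let head = DistilBertForSequenceClassification::from_pretrained(repo)?;
let model_config = head.config().clone();
let num_labels = head.labels().len() as i64;

// Identical to setup_head, plus an explicit DdpConfig as the fourth argument.
Trainer::setup_head_with(
    &head,
    move |dev| DistilBertForSequenceClassification::on_device(&model_config, num_labels, dev),
    |p| Adam::new(p, 5e-5),
    DdpConfig::new().speed_hint(1, 2.3),
)?;
```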

Auto Trait Implementations§

Blanket Implementations§

impl<T> Any for T
where T: 'static + ?Sized,

fn type_id(&self) -> TypeId

Gets the TypeId of self.

impl<T> Borrow<T> for T
where T: ?Sized,

fn borrow(&self) -> &T

Immutably borrows from an owned value.
impl<T> BorrowMut<T> for T
where T: ?Sized,

fn borrow_mut(&mut self) -> &mut T

Mutably borrows from an owned value.
impl<T> From<T> for T

fn from(t: T) -> T

Returns the argument unchanged.

impl<T, U> Into<U> for T
where U: From<T>,

fn into(self) -> U

Calls U::from(self).

That is, this conversion is whatever the implementation of From<T> for U chooses to do.

impl<T, U> TryFrom<U> for T
where U: Into<T>,

type Error = Infallible

The type returned in the event of a conversion error.

fn try_from(value: U) -> Result<T, <T as TryFrom<U>>::Error>

Performs the conversion.

impl<T, U> TryInto<U> for T
where U: TryFrom<T>,

type Error = <U as TryFrom<T>>::Error

The type returned in the event of a conversion error.
fn try_into(self) -> Result<U, <U as TryFrom<T>>::Error>

Performs the conversion.