Struct DistributedDataParallel

Source

pub struct DistributedDataParallel<M: Module> { /* private fields */ }

Expand description

Wrapper that enables distributed data parallel training.

DDP replicates the model across multiple processes and synchronizes gradients during the backward pass.

Implementations§

Source §

impl<M: Module> DistributedDataParallel<M>

Source

pub fn new(module: M, process_group: ProcessGroup) -> Self

Creates a new DDP wrapper.

Source

pub fn broadcast_buffers(self, broadcast: bool) -> Self

Sets whether to broadcast buffers from rank 0.

Source

pub fn gradient_as_bucket_view(self, bucket_view: bool) -> Self

Sets whether to use gradient bucketing.

Source

pub fn module(&self) -> &M

Returns a reference to the underlying module.

Source

pub fn module_mut(&mut self) -> &mut M

Returns a mutable reference to the underlying module.

Source

pub fn process_group(&self) -> &ProcessGroup

Returns the process group.

Source

pub fn sync_parameters(&mut self)

Synchronizes model parameters across all processes. Should be called once at the start of training to ensure all ranks start from identical parameters (broadcast from rank 0).

Source

pub fn sync_gradients(&self)

Synchronizes gradients across all processes. Should be called after the backward pass. All-reduces gradients so every rank gets the average gradient across all ranks.

Source

pub fn forward(&self, input: &Variable) -> Variable

Performs forward pass with gradient synchronization.

Trait Implementations§

Source §

impl<M: Module> Module for DistributedDataParallel<M>

Source §

fn forward(&self, input: &Variable) -> Variable

Performs the forward pass. Read more

Source §

fn parameters(&self) -> Vec<Parameter>

Returns all parameters of this module. Read more

Source §

fn train(&mut self)

Sets the module to training mode.

Source §

fn eval(&mut self)

Sets the module to evaluation mode.

Source §

fn is_training(&self) -> bool

Returns whether the module is in training mode. Read more

Source §

fn named_parameters(&self) -> HashMap<String, Parameter>

Returns named parameters of this module.

Source §

fn num_parameters(&self) -> usize

Returns the number of trainable parameters.

Source §

fn set_training(&mut self, _training: bool)

Sets the training mode. Read more

Source §

fn zero_grad(&self)

Zeros all gradients of parameters.

Source §

fn to_device(&self, device: Device)

Moves all parameters to the specified device. Read more

Source §

fn name(&self) -> &'static str

Returns the module name for debugging.

Auto Trait Implementations§

§

impl<M> !UnwindSafe for DistributedDataParallel<M>

Blanket Implementations§

Source §

impl<T> Any for T
where T: 'static + ?Sized,

Source §

fn type_id(&self) -> TypeId

Gets the TypeId of self. Read more

Source §

impl<T> Borrow<T> for T
where T: ?Sized,

Source §

fn borrow(&self) -> &T

Immutably borrows from an owned value. Read more

Source §

impl<T> BorrowMut<T> for T
where T: ?Sized,

Source §

fn borrow_mut(&mut self) -> &mut T

Mutably borrows from an owned value. Read more

Source §

impl<T> From<T> for T

Source §

fn from(t: T) -> T

Returns the argument unchanged.

Source §

impl<T, U> Into<U> for T
where U: From<T>,

Source §

fn into(self) -> U

Calls U::from(self).

That is, this conversion is whatever the implementation of From<T> for U chooses to do.

Source §

impl<T> IntoEither for T

Source §

fn into_either(self, into_left: bool) -> Either<Self, Self>

Converts self into a Left variant of Either<Self, Self> if into_left is true. Converts self into a Right variant of Either<Self, Self> otherwise. Read more

Source §

fn into_either_with<F>(self, into_left: F) -> Either<Self, Self>
where F: FnOnce(&Self) -> bool,

Converts self into a Left variant of Either<Self, Self> if into_left(&self) returns true. Converts self into a Right variant of Either<Self, Self> otherwise. Read more

Source §

impl<T> Pointable for T

Source §

const ALIGN: usize

The alignment of the pointer.

Source §

type Init = T

The type for initializers.

Source §

unsafe fn init(init: <T as Pointable>::Init) -> usize

Initializes an object with the given initializer. Read more

Source §

unsafe fn deref<'a>(ptr: usize) -> &'a T

Dereferences the given pointer. Read more

Source §

unsafe fn deref_mut<'a>(ptr: usize) -> &'a mut T

Mutably dereferences the given pointer. Read more

Source §

unsafe fn drop(ptr: usize)

Drops the object pointed to by the given pointer. Read more

Source §

impl<T, U> TryFrom<U> for T
where U: Into<T>,

Source §

type Error = Infallible

The type returned in the event of a conversion error.

Source §

fn try_from(value: U) -> Result<T, <T as TryFrom<U>>::Error>

Performs the conversion.

Source §

impl<T, U> TryInto<U> for T
where U: TryFrom<T>,

Source §

type Error = <U as TryFrom<T>>::Error

The type returned in the event of a conversion error.

Source §

fn try_into(self) -> Result<U, <U as TryFrom<T>>::Error>

Performs the conversion.

Source §

impl<V, T> VZip<V> for T
where V: MultiLane<T>,

Source §

Struct DistributedDataParallel

Implementations§

impl<M: Module> DistributedDataParallel<M>

pub fn new(module: M, process_group: ProcessGroup) -> Self

pub fn broadcast_buffers(self, broadcast: bool) -> Self

pub fn gradient_as_bucket_view(self, bucket_view: bool) -> Self

pub fn module(&self) -> &M

pub fn module_mut(&mut self) -> &mut M

pub fn process_group(&self) -> &ProcessGroup

pub fn sync_parameters(&mut self)

pub fn sync_gradients(&self)

pub fn forward(&self, input: &Variable) -> Variable

Trait Implementations§

impl<M: Module> Module for DistributedDataParallel<M>

fn forward(&self, input: &Variable) -> Variable

fn parameters(&self) -> Vec<Parameter>

fn train(&mut self)

fn eval(&mut self)

fn is_training(&self) -> bool

fn named_parameters(&self) -> HashMap<String, Parameter>

fn num_parameters(&self) -> usize

fn set_training(&mut self, _training: bool)

fn zero_grad(&self)

fn to_device(&self, device: Device)

fn name(&self) -> &'static str

Auto Trait Implementations§

impl<M> Freeze for DistributedDataParallel<M> where M: Freeze,

impl<M> !RefUnwindSafe for DistributedDataParallel<M>

impl<M> Send for DistributedDataParallel<M>

impl<M> Sync for DistributedDataParallel<M>

impl<M> Unpin for DistributedDataParallel<M> where M: Unpin,

impl<M> UnsafeUnpin for DistributedDataParallel<M> where M: UnsafeUnpin,

impl<M> !UnwindSafe for DistributedDataParallel<M>

Blanket Implementations§

impl<T> Any for T where T: 'static + ?Sized,

fn type_id(&self) -> TypeId

impl<T> Borrow<T> for T where T: ?Sized,

fn borrow(&self) -> &T

impl<T> BorrowMut<T> for T where T: ?Sized,

fn borrow_mut(&mut self) -> &mut T

impl<T> From<T> for T

fn from(t: T) -> T

impl<T, U> Into<U> for T where U: From<T>,

fn into(self) -> U

impl<T> IntoEither for T

fn into_either(self, into_left: bool) -> Either<Self, Self>

fn into_either_with<F>(self, into_left: F) -> Either<Self, Self> where F: FnOnce(&Self) -> bool,

impl<T> Pointable for T

const ALIGN: usize

type Init = T

unsafe fn init(init: <T as Pointable>::Init) -> usize

unsafe fn deref<'a>(ptr: usize) -> &'a T

unsafe fn deref_mut<'a>(ptr: usize) -> &'a mut T

unsafe fn drop(ptr: usize)

impl<T, U> TryFrom<U> for T where U: Into<T>,

type Error = Infallible

fn try_from(value: U) -> Result<T, <T as TryFrom<U>>::Error>

impl<T, U> TryInto<U> for T where U: TryFrom<T>,

type Error = <U as TryFrom<T>>::Error

fn try_into(self) -> Result<U, <U as TryFrom<T>>::Error>

impl<V, T> VZip<V> for T where V: MultiLane<T>,

fn vzip(self) -> V

Struct DistributedDataParallel

impl<M> Freeze for DistributedDataParallel<M>
where M: Freeze,

impl<M> Unpin for DistributedDataParallel<M>
where M: Unpin,

impl<M> UnsafeUnpin for DistributedDataParallel<M>
where M: UnsafeUnpin,

impl<T> Any for T
where T: 'static + ?Sized,

impl<T> Borrow<T> for T
where T: ?Sized,

impl<T> BorrowMut<T> for T
where T: ?Sized,

impl<T, U> Into<U> for T
where U: From<T>,

fn into_either_with<F>(self, into_left: F) -> Either<Self, Self>
where F: FnOnce(&Self) -> bool,

impl<T, U> TryFrom<U> for T
where U: Into<T>,

impl<T, U> TryInto<U> for T
where U: TryFrom<T>,

impl<V, T> VZip<V> for T
where V: MultiLane<T>,