Struct AsyncTrainer

Source

pub struct AsyncTrainer<A, E, R>
where
    A: Agent<E, R> + Configurable + SyncModel,
    E: Env,
    R: ExperienceBufferBase + ReplayBufferBase,
    R::Item: Send + 'static,
{ /* private fields */ }

Expand description

Manages an asynchronous training loop on a single machine.

It interacts with ActorManager as shown below:

The Agent in AsyncTrainer (left) is trained with batches of type ReplayBufferBase::Batch, which are taken from the replay buffer.
The model parameters of the Agent in AsyncTrainer are wrapped in SyncModel::ModelInfo and periodically sent to the Agents in Actors. Agent must implement SyncModel to synchronize the model parameters.
In ActorManager (right), Actors sample transitions, which have type ReplayBufferBase::Item, and push the transitions into ReplayBufferProxy.
ReplayBufferProxy takes a type parameter that implements ReplayBufferBase, and the proxy accepts items of type ReplayBufferBase::Item.
The proxy sends the transitions into the replay buffer in the AsyncTrainer.

Struct AsyncTrainer

Implementations§

impl<A, E, R> AsyncTrainer<A, E, R> where A: Agent<E, R> + Configurable + SyncModel + 'static, E: Env, R: ExperienceBufferBase + ReplayBufferBase, R::Item: Send + 'static,

pub fn build( config: &AsyncTrainerConfig, agent_config: &A::Config, env_config: &E::Config, replay_buffer_config: &R::Config, r_bulk_pushed_item: Receiver<PushedItemMessage<R::Item>>, model_info_sender: Sender<(usize, A::ModelInfo)>, stop: Arc<Mutex<bool>>, ) -> Self

pub fn train<D>( &mut self, recorder: &mut Box<dyn Recorder<E, R>>, evaluator: &mut D, guard_init_env: Arc<Mutex<bool>>, ) -> AsyncTrainStat where D: Evaluator<E>,

Auto Trait Implementations§

impl<A, E, R> Freeze for AsyncTrainer<A, E, R> where <E as Env>::Config: Freeze, <R as ReplayBufferBase>::Config: Freeze, <A as Configurable>::Config: Freeze,

impl<A, E, R> RefUnwindSafe for AsyncTrainer<A, E, R> where <E as Env>::Config: RefUnwindSafe, <R as ReplayBufferBase>::Config: RefUnwindSafe, <A as Configurable>::Config: RefUnwindSafe, A: RefUnwindSafe, E: RefUnwindSafe, R: RefUnwindSafe,

impl<A, E, R> Send for AsyncTrainer<A, E, R> where <E as Env>::Config: Send, <R as ReplayBufferBase>::Config: Send, <A as Configurable>::Config: Send, <A as SyncModel>::ModelInfo: Send, A: Send, E: Send, R: Send,

impl<A, E, R> Sync for AsyncTrainer<A, E, R> where <E as Env>::Config: Sync, <R as ReplayBufferBase>::Config: Sync, <A as Configurable>::Config: Sync, <A as SyncModel>::ModelInfo: Send, A: Sync, E: Sync, R: Sync,

impl<A, E, R> Unpin for AsyncTrainer<A, E, R> where <E as Env>::Config: Unpin, <R as ReplayBufferBase>::Config: Unpin, <A as Configurable>::Config: Unpin, A: Unpin, E: Unpin, R: Unpin, <R as ExperienceBufferBase>::Item: Unpin,

impl<A, E, R> UnwindSafe for AsyncTrainer<A, E, R> where <E as Env>::Config: UnwindSafe, <R as ReplayBufferBase>::Config: UnwindSafe, <A as Configurable>::Config: UnwindSafe, A: UnwindSafe, E: UnwindSafe, R: UnwindSafe,

Blanket Implementations§

impl<T> Any for T where T: 'static + ?Sized,

fn type_id(&self) -> TypeId

impl<T> Borrow<T> for T where T: ?Sized,

fn borrow(&self) -> &T

impl<T> BorrowMut<T> for T where T: ?Sized,

fn borrow_mut(&mut self) -> &mut T

impl<T> From<T> for T

fn from(t: T) -> T

impl<T, U> Into<U> for T where U: From<T>,

fn into(self) -> U

impl<T, U> TryFrom<U> for T where U: Into<T>,

type Error = Infallible

fn try_from(value: U) -> Result<T, <T as TryFrom<U>>::Error>

impl<T, U> TryInto<U> for T where U: TryFrom<T>,

type Error = <U as TryFrom<T>>::Error

fn try_into(self) -> Result<U, <U as TryFrom<T>>::Error>

impl<V, T> VZip<V> for T where V: MultiLane<T>,

fn vzip(self) -> V

Struct AsyncTrainer

impl<A, E, R> AsyncTrainer<A, E, R>
where A: Agent<E, R> + Configurable + SyncModel + 'static, E: Env, R: ExperienceBufferBase + ReplayBufferBase, R::Item: Send + 'static,

pub fn train<D>( &mut self, recorder: &mut Box<dyn Recorder<E, R>>, evaluator: &mut D, guard_init_env: Arc<Mutex<bool>>, ) -> AsyncTrainStat
where D: Evaluator<E>,

impl<A, E, R> Freeze for AsyncTrainer<A, E, R>
where <E as Env>::Config: Freeze, <R as ReplayBufferBase>::Config: Freeze, <A as Configurable>::Config: Freeze,

impl<A, E, R> RefUnwindSafe for AsyncTrainer<A, E, R>
where <E as Env>::Config: RefUnwindSafe, <R as ReplayBufferBase>::Config: RefUnwindSafe, <A as Configurable>::Config: RefUnwindSafe, A: RefUnwindSafe, E: RefUnwindSafe, R: RefUnwindSafe,

impl<A, E, R> Send for AsyncTrainer<A, E, R>
where <E as Env>::Config: Send, <R as ReplayBufferBase>::Config: Send, <A as Configurable>::Config: Send, <A as SyncModel>::ModelInfo: Send, A: Send, E: Send, R: Send,

impl<A, E, R> Sync for AsyncTrainer<A, E, R>
where <E as Env>::Config: Sync, <R as ReplayBufferBase>::Config: Sync, <A as Configurable>::Config: Sync, <A as SyncModel>::ModelInfo: Send, A: Sync, E: Sync, R: Sync,

impl<A, E, R> Unpin for AsyncTrainer<A, E, R>
where <E as Env>::Config: Unpin, <R as ReplayBufferBase>::Config: Unpin, <A as Configurable>::Config: Unpin, A: Unpin, E: Unpin, R: Unpin, <R as ExperienceBufferBase>::Item: Unpin,

impl<A, E, R> UnwindSafe for AsyncTrainer<A, E, R>
where <E as Env>::Config: UnwindSafe, <R as ReplayBufferBase>::Config: UnwindSafe, <A as Configurable>::Config: UnwindSafe, A: UnwindSafe, E: UnwindSafe, R: UnwindSafe,

impl<T> Any for T
where T: 'static + ?Sized,

impl<T> Borrow<T> for T
where T: ?Sized,

impl<T> BorrowMut<T> for T
where T: ?Sized,

impl<T, U> Into<U> for T
where U: From<T>,

impl<T, U> TryFrom<U> for T
where U: Into<T>,

impl<T, U> TryInto<U> for T
where U: TryFrom<T>,

impl<V, T> VZip<V> for T
where V: MultiLane<T>,