Struct border_async_trainer::AsyncTrainer

source ·

pub struct AsyncTrainer<A, E, R>
where
    A: Agent<E, R> + SyncModel,
    E: Env,
    R: ReplayBufferBase,
    R::PushedItem: Send + 'static,
{ /* private fields */ }

Expand description

Manages an asynchronous training loop on a single machine.

It interacts with ActorManager as shown below:

In ActorManager (right), Actors sample transitions of type ReplayBufferBase::PushedItem in parallel and push them into ReplayBufferProxy. Note that ReplayBufferProxy takes a type parameter implementing ReplayBufferBase, and the proxy accepts ReplayBufferBase::PushedItem.
The proxy sends the transitions to the replay buffer (an implementation of ReplayBufferBase) in the AsyncTrainer.
The Agent in AsyncTrainer trains its model parameters by using batches of type ReplayBufferBase::Batch, which are taken from the replay buffer.
The model parameters of the Agent in AsyncTrainer are wrapped in SyncModel::ModelInfo and periodically sent to the Agents in Actors. Agent must implement SyncModel to synchronize its model.

Struct border_async_trainer::AsyncTrainer

Implementations§

impl<A, E, R> AsyncTrainer<A, E, R> where A: Agent<E, R> + SyncModel, E: Env, R: ReplayBufferBase, R::PushedItem: Send + 'static,

pub fn build( config: &AsyncTrainerConfig, agent_config: &A::Config, env_config: &E::Config, replay_buffer_config: &R::Config, r_bulk_pushed_item: Receiver<PushedItemMessage<R::PushedItem>>, model_info_sender: Sender<(usize, A::ModelInfo)>, stop: Arc<Mutex<bool>> ) -> Self

pub fn train<D>( &mut self, recorder: &mut impl Recorder, evaluator: &mut D, guard_init_env: Arc<Mutex<bool>> ) -> AsyncTrainStat where D: Evaluator<E, A>,

Auto Trait Implementations§

impl<A, E, R> RefUnwindSafe for AsyncTrainer<A, E, R> where A: RefUnwindSafe, E: RefUnwindSafe, R: RefUnwindSafe, <A as Policy<E>>::Config: RefUnwindSafe, <E as Env>::Config: RefUnwindSafe, <R as ReplayBufferBase>::Config: RefUnwindSafe,

impl<A, E, R> Send for AsyncTrainer<A, E, R> where A: Send, E: Send, R: Send, <A as Policy<E>>::Config: Send, <E as Env>::Config: Send, <R as ReplayBufferBase>::Config: Send, <A as SyncModel>::ModelInfo: Send,

impl<A, E, R> Sync for AsyncTrainer<A, E, R> where A: Sync, E: Sync, R: Sync, <A as Policy<E>>::Config: Sync, <E as Env>::Config: Sync, <R as ReplayBufferBase>::Config: Sync, <A as SyncModel>::ModelInfo: Send,

impl<A, E, R> Unpin for AsyncTrainer<A, E, R> where A: Unpin, E: Unpin, R: Unpin, <A as Policy<E>>::Config: Unpin, <E as Env>::Config: Unpin, <R as ReplayBufferBase>::Config: Unpin, <R as ExperienceBufferBase>::PushedItem: Unpin,

impl<A, E, R> UnwindSafe for AsyncTrainer<A, E, R> where A: UnwindSafe, E: UnwindSafe, R: UnwindSafe, <A as Policy<E>>::Config: UnwindSafe, <E as Env>::Config: UnwindSafe, <R as ReplayBufferBase>::Config: UnwindSafe,

Blanket Implementations§

impl<T> Any for T where T: 'static + ?Sized,

fn type_id(&self) -> TypeId

impl<T> Borrow<T> for T where T: ?Sized,

fn borrow(&self) -> &T

impl<T> BorrowMut<T> for T where T: ?Sized,

fn borrow_mut(&mut self) -> &mut T

impl<T> From<T> for T

fn from(t: T) -> T

impl<T, U> Into<U> for T where U: From<T>,

fn into(self) -> U

impl<T> Pointable for T

const ALIGN: usize = _

type Init = T

unsafe fn init(init: <T as Pointable>::Init) -> usize

unsafe fn deref<'a>(ptr: usize) -> &'a T

unsafe fn deref_mut<'a>(ptr: usize) -> &'a mut T

unsafe fn drop(ptr: usize)

impl<T, U> TryFrom<U> for T where U: Into<T>,

type Error = Infallible

fn try_from(value: U) -> Result<T, <T as TryFrom<U>>::Error>

impl<T, U> TryInto<U> for T where U: TryFrom<T>,

type Error = <U as TryFrom<T>>::Error

fn try_into(self) -> Result<U, <U as TryFrom<T>>::Error>

impl<V, T> VZip<V> for T where V: MultiLane<T>,

fn vzip(self) -> V