Struct border_core::Trainer

source · [−]

pub struct Trainer<E, P, R> where
    E: Env,
    P: StepProcessorBase<E>,
    R: ReplayBufferBase<PushedItem = P::Output>,  {
    pub env_config_train: E::Config,
    pub env_config_eval: Option<E::Config>,
    pub step_proc_config: P::Config,
    pub replay_buffer_config: R::Config,
    pub model_dir: Option<String>,
    pub opt_interval: usize,
    pub record_interval: usize,
    pub eval_interval: usize,
    pub save_interval: usize,
    pub max_opts: usize,
    pub eval_episodes: usize,
}

Expand description

Manages the training loop and related objects.

Fields

env_config_train: E::Config

Configuration of the environment for training.

env_config_eval: Option<E::Config>

Configuration of the environment for evaluation.

If None, env_config_train is used.

step_proc_config: P::Config

Configuration of the transition producer.

replay_buffer_config: R::Config

Configuration of the replay buffer.

model_dir: Option<String>

Where to save the trained model.

opt_interval: usize

Interval of optimization in environment steps.

record_interval: usize

Interval of recording in optimization steps.

eval_interval: usize

Interval of evaluation in optimization steps.

save_interval: usize

Interval of saving the model in optimization steps.

max_opts: usize

The maximal number of optimization steps.

eval_episodes: usize

The number of episodes for evaluation.

Implementations

source

impl<E, P, R> Trainer<E, P, R> where
 E: Env,
 P: StepProcessorBase<E>,
 R: ReplayBufferBase<PushedItem = P::Output>,

source

pub fn build(
 config: TrainerConfig,
 env_config_train: E::Config,
 env_config_eval: Option<E::Config>,
 step_proc_config: P::Config,
 replay_buffer_config: R::Config
) -> Self

Constructs a trainer.

source

pub fn train_step<A: Agent<E, R>>(
 &self,
 agent: &mut A,
 buffer: &mut R,
 sampler: &mut SyncSampler<E, P>,
 env_steps: &mut usize
) -> Result<(Option<Record>, Option<Duration>)> where
 A: Agent<E, R>,

Performs a training step.

source

pub fn train<A, S>(&mut self, agent: &mut A, recorder: &mut S) -> Result<()> where
A: Agent<E, R>,
S: Recorder,

Trains the agent.

Auto Trait Implementations

impl<E, P, R> RefUnwindSafe for Trainer<E, P, R> where
 <E as Env>::Config: RefUnwindSafe,
 <P as StepProcessorBase<E>>::Config: RefUnwindSafe,
 <R as ReplayBufferBase>::Config: RefUnwindSafe,

impl<E, P, R> Send for Trainer<E, P, R> where
 <E as Env>::Config: Send,
 <P as StepProcessorBase<E>>::Config: Send,
 <R as ReplayBufferBase>::Config: Send,

impl<E, P, R> Sync for Trainer<E, P, R> where
 <E as Env>::Config: Sync,
 <P as StepProcessorBase<E>>::Config: Sync,
 <R as ReplayBufferBase>::Config: Sync,

impl<E, P, R> Unpin for Trainer<E, P, R> where
 <E as Env>::Config: Unpin,
 <P as StepProcessorBase<E>>::Config: Unpin,
 <R as ReplayBufferBase>::Config: Unpin,

impl<E, P, R> UnwindSafe for Trainer<E, P, R> where
 <E as Env>::Config: UnwindSafe,
 <P as StepProcessorBase<E>>::Config: UnwindSafe,
 <R as ReplayBufferBase>::Config: UnwindSafe,

Blanket Implementations

source

impl<T> Any for T where
T: 'static + ?Sized,

source

pub fn type_id(&self) -> TypeId

Gets the TypeId of self. Read more

source

impl<T> Borrow<T> for T where
T: ?Sized,

const: unstable · source

pub fn borrow(&self) -> &T

Immutably borrows from an owned value. Read more

source

impl<T> BorrowMut<T> for T where
T: ?Sized,

const: unstable · source

pub fn borrow_mut(&mut self) -> &mut T

Mutably borrows from an owned value. Read more

source

impl<T> From<T> for T

const: unstable · source

pub fn from(t: T) -> T

Performs the conversion.

source

impl<T, U> Into<U> for T where
U: From<T>,

const: unstable · source

pub fn into(self) -> U

Performs the conversion.

impl<T> Pointable for T

pub const ALIGN: usize

The alignment of pointer.

type Init = T

The type for initializers.

pub unsafe fn init(init: <T as Pointable>::Init) -> usize

Initializes an object with the given initializer. Read more

pub unsafe fn deref<'a>(ptr: usize) -> &'a T

Dereferences the given pointer. Read more

pub unsafe fn deref_mut<'a>(ptr: usize) -> &'a mut T

Mutably dereferences the given pointer. Read more

pub unsafe fn drop(ptr: usize)

Drops the object pointed to by the given pointer. Read more

source

impl<T, U> TryFrom<U> for T where
U: Into<T>,

type Error = Infallible

The type returned in the event of a conversion error.

const: unstable · source

pub fn try_from(value: U) -> Result<T, <T as TryFrom<U>>::Error>

Performs the conversion.

source

impl<T, U> TryInto<U> for T where
U: TryFrom<T>,

type Error = <U as TryFrom<T>>::Error

The type returned in the event of a conversion error.

const: unstable · source

pub fn try_into(self) -> Result<U, <U as TryFrom<T>>::Error>

Performs the conversion.

Struct border_core::Trainer

Fields

Implementations

impl<E, P, R> Trainer<E, P, R> where
    E: Env,
    P: StepProcessorBase<E>,
    R: ReplayBufferBase<PushedItem = P::Output>,

pub fn build(
    config: TrainerConfig,
    env_config_train: E::Config,
    env_config_eval: Option<E::Config>,
    step_proc_config: P::Config,
    replay_buffer_config: R::Config
) -> Self

pub fn train_step<A: Agent<E, R>>(
    &self,
    agent: &mut A,
    buffer: &mut R,
    sampler: &mut SyncSampler<E, P>,
    env_steps: &mut usize
) -> Result<(Option<Record>, Option<Duration>)> where
    A: Agent<E, R>,

pub fn train<A, S>(&mut self, agent: &mut A, recorder: &mut S) -> Result<()> where
A: Agent<E, R>,
S: Recorder,

Auto Trait Implementations

impl<E, P, R> RefUnwindSafe for Trainer<E, P, R> where
    <E as Env>::Config: RefUnwindSafe,
    <P as StepProcessorBase<E>>::Config: RefUnwindSafe,
    <R as ReplayBufferBase>::Config: RefUnwindSafe,

impl<E, P, R> Send for Trainer<E, P, R> where
    <E as Env>::Config: Send,
    <P as StepProcessorBase<E>>::Config: Send,
    <R as ReplayBufferBase>::Config: Send,

impl<E, P, R> Sync for Trainer<E, P, R> where
    <E as Env>::Config: Sync,
    <P as StepProcessorBase<E>>::Config: Sync,
    <R as ReplayBufferBase>::Config: Sync,

impl<E, P, R> Unpin for Trainer<E, P, R> where
    <E as Env>::Config: Unpin,
    <P as StepProcessorBase<E>>::Config: Unpin,
    <R as ReplayBufferBase>::Config: Unpin,

impl<E, P, R> UnwindSafe for Trainer<E, P, R> where
    <E as Env>::Config: UnwindSafe,
    <P as StepProcessorBase<E>>::Config: UnwindSafe,
    <R as ReplayBufferBase>::Config: UnwindSafe,

Blanket Implementations

impl<T> Any for T where
T: 'static + ?Sized,

pub fn type_id(&self) -> TypeId

impl<T> Borrow<T> for T where
T: ?Sized,

pub fn borrow(&self) -> &T

impl<T> BorrowMut<T> for T where
T: ?Sized,

pub fn borrow_mut(&mut self) -> &mut T

impl<T> From<T> for T

pub fn from(t: T) -> T

impl<T, U> Into<U> for T where
U: From<T>,

pub fn into(self) -> U

impl<T> Pointable for T

pub const ALIGN: usize

type Init = T

pub unsafe fn init(init: <T as Pointable>::Init) -> usize

pub unsafe fn deref<'a>(ptr: usize) -> &'a T

pub unsafe fn deref_mut<'a>(ptr: usize) -> &'a mut T

pub unsafe fn drop(ptr: usize)

impl<T, U> TryFrom<U> for T where
U: Into<T>,

type Error = Infallible

pub fn try_from(value: U) -> Result<T, <T as TryFrom<U>>::Error>

impl<T, U> TryInto<U> for T where
U: TryFrom<T>,

type Error = <U as TryFrom<T>>::Error

pub fn try_into(self) -> Result<U, <U as TryFrom<T>>::Error>

impl<V, T> VZip<V> for T where
V: MultiLane<T>,

pub fn vzip(self) -> V

Struct border_core::Trainer

Fields

Implementations

impl<E, P, R> Trainer<E, P, R> where E: Env, P: StepProcessorBase<E>, R: ReplayBufferBase<PushedItem = P::Output>,

pub fn build( config: TrainerConfig, env_config_train: E::Config, env_config_eval: Option<E::Config>, step_proc_config: P::Config, replay_buffer_config: R::Config) -> Self

pub fn train_step<A: Agent<E, R>>( &self, agent: &mut A, buffer: &mut R, sampler: &mut SyncSampler<E, P>, env_steps: &mut usize) -> Result<(Option<Record>, Option<Duration>)> where A: Agent<E, R>,

pub fn train<A, S>(&mut self, agent: &mut A, recorder: &mut S) -> Result<()> where A: Agent<E, R>, S: Recorder,

Auto Trait Implementations

impl<E, P, R> RefUnwindSafe for Trainer<E, P, R> where <E as Env>::Config: RefUnwindSafe, <P as StepProcessorBase<E>>::Config: RefUnwindSafe, <R as ReplayBufferBase>::Config: RefUnwindSafe,

impl<E, P, R> Send for Trainer<E, P, R> where <E as Env>::Config: Send, <P as StepProcessorBase<E>>::Config: Send, <R as ReplayBufferBase>::Config: Send,

impl<E, P, R> Sync for Trainer<E, P, R> where <E as Env>::Config: Sync, <P as StepProcessorBase<E>>::Config: Sync, <R as ReplayBufferBase>::Config: Sync,

impl<E, P, R> Unpin for Trainer<E, P, R> where <E as Env>::Config: Unpin, <P as StepProcessorBase<E>>::Config: Unpin, <R as ReplayBufferBase>::Config: Unpin,

impl<E, P, R> UnwindSafe for Trainer<E, P, R> where <E as Env>::Config: UnwindSafe, <P as StepProcessorBase<E>>::Config: UnwindSafe, <R as ReplayBufferBase>::Config: UnwindSafe,

Blanket Implementations

impl<T> Any for T where T: 'static + ?Sized,

pub fn type_id(&self) -> TypeId

impl<T> Borrow<T> for T where T: ?Sized,

pub fn borrow(&self) -> &T

impl<T> BorrowMut<T> for T where T: ?Sized,

pub fn borrow_mut(&mut self) -> &mut T

impl<T> From<T> for T

pub fn from(t: T) -> T

impl<T, U> Into<U> for T where U: From<T>,

pub fn into(self) -> U

impl<T> Pointable for T

pub const ALIGN: usize

type Init = T

pub unsafe fn init(init: <T as Pointable>::Init) -> usize

pub unsafe fn deref<'a>(ptr: usize) -> &'a T

pub unsafe fn deref_mut<'a>(ptr: usize) -> &'a mut T

pub unsafe fn drop(ptr: usize)

impl<T, U> TryFrom<U> for T where U: Into<T>,

type Error = Infallible

pub fn try_from(value: U) -> Result<T, <T as TryFrom<U>>::Error>

impl<T, U> TryInto<U> for T where U: TryFrom<T>,

type Error = <U as TryFrom<T>>::Error

pub fn try_into(self) -> Result<U, <U as TryFrom<T>>::Error>

impl<V, T> VZip<V> for T where V: MultiLane<T>,

pub fn vzip(self) -> V

impl<E, P, R> Trainer<E, P, R> where
E: Env,
P: StepProcessorBase<E>,
R: ReplayBufferBase<PushedItem = P::Output>,

pub fn build(
config: TrainerConfig,
env_config_train: E::Config,
env_config_eval: Option<E::Config>,
step_proc_config: P::Config,
replay_buffer_config: R::Config
) -> Self

pub fn train_step<A: Agent<E, R>>(
&self,
agent: &mut A,
buffer: &mut R,
sampler: &mut SyncSampler<E, P>,
env_steps: &mut usize
) -> Result<(Option<Record>, Option<Duration>)> where
A: Agent<E, R>,

pub fn train<A, S>(&mut self, agent: &mut A, recorder: &mut S) -> Result<()> where
A: Agent<E, R>,
S: Recorder,

impl<E, P, R> RefUnwindSafe for Trainer<E, P, R> where
<E as Env>::Config: RefUnwindSafe,
<P as StepProcessorBase<E>>::Config: RefUnwindSafe,
<R as ReplayBufferBase>::Config: RefUnwindSafe,

impl<E, P, R> Send for Trainer<E, P, R> where
<E as Env>::Config: Send,
<P as StepProcessorBase<E>>::Config: Send,
<R as ReplayBufferBase>::Config: Send,

impl<E, P, R> Sync for Trainer<E, P, R> where
<E as Env>::Config: Sync,
<P as StepProcessorBase<E>>::Config: Sync,
<R as ReplayBufferBase>::Config: Sync,

impl<E, P, R> Unpin for Trainer<E, P, R> where
<E as Env>::Config: Unpin,
<P as StepProcessorBase<E>>::Config: Unpin,
<R as ReplayBufferBase>::Config: Unpin,

impl<E, P, R> UnwindSafe for Trainer<E, P, R> where
<E as Env>::Config: UnwindSafe,
<P as StepProcessorBase<E>>::Config: UnwindSafe,
<R as ReplayBufferBase>::Config: UnwindSafe,

impl<T> Any for T where
T: 'static + ?Sized,

impl<T> Borrow<T> for T where
T: ?Sized,

impl<T> BorrowMut<T> for T where
T: ?Sized,

impl<T, U> Into<U> for T where
U: From<T>,

impl<T, U> TryFrom<U> for T where
U: Into<T>,

impl<T, U> TryInto<U> for T where
U: TryFrom<T>,

impl<V, T> VZip<V> for T where
V: MultiLane<T>,