Trait relearn::agents::BatchUpdate

source · [−]

pub trait BatchUpdate<O, A> {
    type Feedback;
    type HistoryBuffer: WriteExperience<O, A, Self::Feedback>;

    fn buffer(&self) -> Self::HistoryBuffer;
    fn min_update_size(&self) -> HistoryDataBound;
    fn batch_update<'a, I>(&mut self, buffers: I, logger: &mut dyn StatsLogger)
    where
        I: IntoIterator<Item = &'a mut Self::HistoryBuffer>,
        Self::HistoryBuffer: 'a;
}

Expand description

Update an agent with steps collected into history buffers.

The user is only responsible for adding data to the history buffer. If old data in the buffer needs to be cleared, that is the responsibility of either the buffer or the batch_update method.

Required Associated Types

source

type Feedback

Environment feedback type

source

type HistoryBuffer: WriteExperience<O, A, Self::Feedback>

Required Methods

source

fn buffer(&self) -> Self::HistoryBuffer

Create a new history buffer.

source

fn min_update_size(&self) -> HistoryDataBound

Request a minimum amount of on-policy data for the next batch update.

source

fn batch_update<'a, I>(&mut self, buffers: I, logger: &mut dyn StatsLogger) where
I: IntoIterator<Item = &'a mut Self::HistoryBuffer>,
Self::HistoryBuffer: 'a,

Update the agent from a collection of history buffers.

All new data inserted into the buffers since the last call must be on-policy.

It is preferable but not required for the last step of the newly added data to end its episode — either by termination or interruption. If instead the last step.next is Successor::Continue then that one step may be dropped or ignored by agents that depend on well-formed step successors.

This function and the history buffer itself are jointly responsible for managing the data within the buffer. The buffers may be emptied by the call.

Implementation Note

This iterator-generic batch_update is necessary because some agents modify the given buffer references before passing them to the batch_update of an inner agent. This would not work if the inner agent only took a slice of buffers.

Implementations on Foreign Types

source

impl BatchUpdate<usize, usize> for Arc<BaseUCB1Agent>

type Feedback = Reward

fn batch_update<'a, I>(&mut self, buffers: I, _logger: &mut dyn StatsLogger) where
I: IntoIterator<Item = &'a mut Self::HistoryBuffer>,
Self::HistoryBuffer: 'a,

source

impl<TC, OS, AS, FS> BatchUpdate<MetaObservation<<OS as Space>::Element, <AS as Space>::Element, <FS as Space>::Element>, <AS as Space>::Element> for Arc<ResettingMetaAgent<TC, OS, AS, FS>> where
    OS: Space,
    AS: Space,
    FS: Space,

No updates at the meta-level.

type Feedback = <FS as Space>::Element

type HistoryBuffer = NullBuffer

source

fn buffer(&self) -> Self::HistoryBuffer

source

fn min_update_size(&self) -> HistoryDataBound

source

fn batch_update<'a, I>(&mut self, _buffers: I, _logger: &mut dyn StatsLogger) where
I: IntoIterator<Item = &'a mut Self::HistoryBuffer>,
Self::HistoryBuffer: 'a,

Implementors

source

impl<O, AS: Space> BatchUpdate<O, <AS as Space>::Element> for RandomAgent<AS>

type Feedback = Reward

type HistoryBuffer = NullBuffer

source

impl<OS, AS, P, C> BatchUpdate<<OS as Space>::Element, <AS as Space>::Element> for ActorCriticAgent<OS, AS, P, C> where
    OS: FeatureSpace,
    OS::Element: 'static,
    AS: ParameterizedDistributionSpace<Tensor>,
    AS::Element: 'static,
    P: Policy,
    C: Critic,

type Feedback = Reward

type HistoryBuffer = VecBuffer<<OS as Space>::Element, <AS as Space>::Element, Reward>

source

impl<OS, AS, V, O> BatchUpdate<<OS as Space>::Element, <AS as Space>::Element> for DqnAgent<OS, AS, V, O> where
    OS: FeatureSpace,
    OS::Element: 'static,
    AS: FiniteSpace + ReprSpace<Tensor>,
    AS::Element: 'static,
    V: AsModule,
    V::Module: SeqPacked,
    O: Optimizer,

type Feedback = Reward

type HistoryBuffer = ReplayBuffer<<OS as Space>::Element, <AS as Space>::Element, Reward>

source

impl<T0, T1, O0, O1, A0, A1> BatchUpdate<(O0, O1), (A0, A1)> for AgentPair<T0, T1> where
    T0: BatchUpdate<O0, A0>,
    T1: BatchUpdate<O1, A1>,
    T0::HistoryBuffer: 'static,
    T1::HistoryBuffer: 'static,

type Feedback = (<T0 as BatchUpdate<O0, A0>>::Feedback, <T1 as BatchUpdate<O1, A1>>::Feedback)

type HistoryBuffer = HistoryBufferPair<<T0 as BatchUpdate<O0, A0>>::HistoryBuffer, <T1 as BatchUpdate<O1, A1>>::HistoryBuffer>

source

impl<T, OS, AS> BatchUpdate<<OS as Space>::Element, <AS as Space>::Element> for FiniteSpaceAgent<T, OS, AS> where
    T: BatchUpdate<usize, usize>,
    OS: FiniteSpace + Clone + 'static,
    AS: FiniteSpace + Clone + 'static,
    T::Feedback: Clone,
    T::HistoryBuffer: 'static,

Trait relearn::agents::BatchUpdate

Required Associated Types

type Feedback

type HistoryBuffer: WriteExperience<O, A, Self::Feedback>

Required Methods

fn buffer(&self) -> Self::HistoryBuffer

fn min_update_size(&self) -> HistoryDataBound

fn batch_update<'a, I>(&mut self, buffers: I, logger: &mut dyn StatsLogger) where
I: IntoIterator<Item = &'a mut Self::HistoryBuffer>,
Self::HistoryBuffer: 'a,

Implementation Note

Implementations on Foreign Types

impl BatchUpdate<usize, usize> for Arc<BaseUCB1Agent>

type Feedback = Reward

type HistoryBuffer = VecBuffer<usize, usize, Reward>

fn buffer(&self) -> Self::HistoryBuffer

fn min_update_size(&self) -> HistoryDataBound

fn batch_update<'a, I>(&mut self, buffers: I, _logger: &mut dyn StatsLogger) where
I: IntoIterator<Item = &'a mut Self::HistoryBuffer>,
Self::HistoryBuffer: 'a,

impl<TC, OS, AS, FS> BatchUpdate<MetaObservation<<OS as Space>::Element, <AS as Space>::Element, <FS as Space>::Element>, <AS as Space>::Element> for Arc<ResettingMetaAgent<TC, OS, AS, FS>> where
    OS: Space,
    AS: Space,
    FS: Space,

type Feedback = <FS as Space>::Element

type HistoryBuffer = NullBuffer

fn buffer(&self) -> Self::HistoryBuffer

fn min_update_size(&self) -> HistoryDataBound

fn batch_update<'a, I>(&mut self, _buffers: I, _logger: &mut dyn StatsLogger) where
I: IntoIterator<Item = &'a mut Self::HistoryBuffer>,
Self::HistoryBuffer: 'a,

Implementors

impl<O, AS: Space> BatchUpdate<O, <AS as Space>::Element> for RandomAgent<AS>

type Feedback = Reward

type HistoryBuffer = NullBuffer

impl<OS, AS, P, C> BatchUpdate<<OS as Space>::Element, <AS as Space>::Element> for ActorCriticAgent<OS, AS, P, C> where
    OS: FeatureSpace,
    OS::Element: 'static,
    AS: ParameterizedDistributionSpace<Tensor>,
    AS::Element: 'static,
    P: Policy,
    C: Critic,

type Feedback = Reward

type HistoryBuffer = VecBuffer<<OS as Space>::Element, <AS as Space>::Element, Reward>

impl<OS, AS, V, O> BatchUpdate<<OS as Space>::Element, <AS as Space>::Element> for DqnAgent<OS, AS, V, O> where
    OS: FeatureSpace,
    OS::Element: 'static,
    AS: FiniteSpace + ReprSpace<Tensor>,
    AS::Element: 'static,
    V: AsModule,
    V::Module: SeqPacked,
    O: Optimizer,

type Feedback = Reward

type HistoryBuffer = ReplayBuffer<<OS as Space>::Element, <AS as Space>::Element, Reward>

impl<T0, T1, O0, O1, A0, A1> BatchUpdate<(O0, O1), (A0, A1)> for AgentPair<T0, T1> where
    T0: BatchUpdate<O0, A0>,
    T1: BatchUpdate<O1, A1>,
    T0::HistoryBuffer: 'static,
    T1::HistoryBuffer: 'static,

type Feedback = (<T0 as BatchUpdate<O0, A0>>::Feedback, <T1 as BatchUpdate<O1, A1>>::Feedback)

type HistoryBuffer = HistoryBufferPair<<T0 as BatchUpdate<O0, A0>>::HistoryBuffer, <T1 as BatchUpdate<O1, A1>>::HistoryBuffer>

impl<T, OS, AS> BatchUpdate<<OS as Space>::Element, <AS as Space>::Element> for FiniteSpaceAgent<T, OS, AS> where
    T: BatchUpdate<usize, usize>,
    OS: FiniteSpace + Clone + 'static,
    AS: FiniteSpace + Clone + 'static,
    T::Feedback: Clone,
    T::HistoryBuffer: 'static,

type Feedback = <T as BatchUpdate<usize, usize>>::Feedback

type HistoryBuffer = FiniteSpaceBuffer<<T as BatchUpdate<usize, usize>>::HistoryBuffer, OS, AS>

Trait relearn::agents::BatchUpdate

Required Associated Types

type Feedback

type HistoryBuffer: WriteExperience<O, A, Self::Feedback>

Required Methods

fn buffer(&self) -> Self::HistoryBuffer

fn min_update_size(&self) -> HistoryDataBound

fn batch_update<'a, I>(&mut self, buffers: I, logger: &mut dyn StatsLogger) where I: IntoIterator<Item = &'a mut Self::HistoryBuffer>, Self::HistoryBuffer: 'a,

Implementation Note

Implementations on Foreign Types

impl BatchUpdate<usize, usize> for Arc<BaseUCB1Agent>

type Feedback = Reward

type HistoryBuffer = VecBuffer<usize, usize, Reward>

fn buffer(&self) -> Self::HistoryBuffer

fn min_update_size(&self) -> HistoryDataBound

fn batch_update<'a, I>(&mut self, buffers: I, _logger: &mut dyn StatsLogger) where I: IntoIterator<Item = &'a mut Self::HistoryBuffer>, Self::HistoryBuffer: 'a,

impl<TC, OS, AS, FS> BatchUpdate<MetaObservation<<OS as Space>::Element, <AS as Space>::Element, <FS as Space>::Element>, <AS as Space>::Element> for Arc<ResettingMetaAgent<TC, OS, AS, FS>> where OS: Space, AS: Space, FS: Space,

type Feedback = <FS as Space>::Element

type HistoryBuffer = NullBuffer

fn buffer(&self) -> Self::HistoryBuffer

fn min_update_size(&self) -> HistoryDataBound

fn batch_update<'a, I>(&mut self, _buffers: I, _logger: &mut dyn StatsLogger) where I: IntoIterator<Item = &'a mut Self::HistoryBuffer>, Self::HistoryBuffer: 'a,

Implementors

impl<O, AS: Space> BatchUpdate<O, <AS as Space>::Element> for RandomAgent<AS>

type Feedback = Reward

type HistoryBuffer = NullBuffer

impl<OS, AS, P, C> BatchUpdate<<OS as Space>::Element, <AS as Space>::Element> for ActorCriticAgent<OS, AS, P, C> where OS: FeatureSpace, OS::Element: 'static, AS: ParameterizedDistributionSpace<Tensor>, AS::Element: 'static, P: Policy, C: Critic,

type Feedback = Reward

type HistoryBuffer = VecBuffer<<OS as Space>::Element, <AS as Space>::Element, Reward>

impl<OS, AS, V, O> BatchUpdate<<OS as Space>::Element, <AS as Space>::Element> for DqnAgent<OS, AS, V, O> where OS: FeatureSpace, OS::Element: 'static, AS: FiniteSpace + ReprSpace<Tensor>, AS::Element: 'static, V: AsModule, V::Module: SeqPacked, O: Optimizer,

type Feedback = Reward

type HistoryBuffer = ReplayBuffer<<OS as Space>::Element, <AS as Space>::Element, Reward>

impl<T0, T1, O0, O1, A0, A1> BatchUpdate<(O0, O1), (A0, A1)> for AgentPair<T0, T1> where T0: BatchUpdate<O0, A0>, T1: BatchUpdate<O1, A1>, T0::HistoryBuffer: 'static, T1::HistoryBuffer: 'static,

type Feedback = (<T0 as BatchUpdate<O0, A0>>::Feedback, <T1 as BatchUpdate<O1, A1>>::Feedback)

type HistoryBuffer = HistoryBufferPair<<T0 as BatchUpdate<O0, A0>>::HistoryBuffer, <T1 as BatchUpdate<O1, A1>>::HistoryBuffer>

impl<T, OS, AS> BatchUpdate<<OS as Space>::Element, <AS as Space>::Element> for FiniteSpaceAgent<T, OS, AS> where T: BatchUpdate<usize, usize>, OS: FiniteSpace + Clone + 'static, AS: FiniteSpace + Clone + 'static, T::Feedback: Clone, T::HistoryBuffer: 'static,

type Feedback = <T as BatchUpdate<usize, usize>>::Feedback

type HistoryBuffer = FiniteSpaceBuffer<<T as BatchUpdate<usize, usize>>::HistoryBuffer, OS, AS>

fn batch_update<'a, I>(&mut self, buffers: I, logger: &mut dyn StatsLogger) where
I: IntoIterator<Item = &'a mut Self::HistoryBuffer>,
Self::HistoryBuffer: 'a,

fn batch_update<'a, I>(&mut self, buffers: I, _logger: &mut dyn StatsLogger) where
I: IntoIterator<Item = &'a mut Self::HistoryBuffer>,
Self::HistoryBuffer: 'a,

impl<TC, OS, AS, FS> BatchUpdate<MetaObservation<<OS as Space>::Element, <AS as Space>::Element, <FS as Space>::Element>, <AS as Space>::Element> for Arc<ResettingMetaAgent<TC, OS, AS, FS>> where
OS: Space,
AS: Space,
FS: Space,

fn batch_update<'a, I>(&mut self, _buffers: I, _logger: &mut dyn StatsLogger) where
I: IntoIterator<Item = &'a mut Self::HistoryBuffer>,
Self::HistoryBuffer: 'a,

impl<OS, AS, P, C> BatchUpdate<<OS as Space>::Element, <AS as Space>::Element> for ActorCriticAgent<OS, AS, P, C> where
OS: FeatureSpace,
OS::Element: 'static,
AS: ParameterizedDistributionSpace<Tensor>,
AS::Element: 'static,
P: Policy,
C: Critic,

impl<OS, AS, V, O> BatchUpdate<<OS as Space>::Element, <AS as Space>::Element> for DqnAgent<OS, AS, V, O> where
OS: FeatureSpace,
OS::Element: 'static,
AS: FiniteSpace + ReprSpace<Tensor>,
AS::Element: 'static,
V: AsModule,
V::Module: SeqPacked,
O: Optimizer,

impl<T0, T1, O0, O1, A0, A1> BatchUpdate<(O0, O1), (A0, A1)> for AgentPair<T0, T1> where
T0: BatchUpdate<O0, A0>,
T1: BatchUpdate<O1, A1>,
T0::HistoryBuffer: 'static,
T1::HistoryBuffer: 'static,

impl<T, OS, AS> BatchUpdate<<OS as Space>::Element, <AS as Space>::Element> for FiniteSpaceAgent<T, OS, AS> where
T: BatchUpdate<usize, usize>,
OS: FiniteSpace + Clone + 'static,
AS: FiniteSpace + Clone + 'static,
T::Feedback: Clone,
T::HistoryBuffer: 'static,