Struct PrioritizedReplayBuffer

Source

pub struct PrioritizedReplayBuffer { /* private fields */ }

Expand description

Prioritized Experience Replay buffer with proportional priority and IS weights.

Implementations§

Source §

impl PrioritizedReplayBuffer

Source

pub fn new( capacity: usize, obs_dim: usize, act_dim: usize, alpha: f64, beta_start: f64, ) -> Self

Create a PER buffer.

capacity — maximum number of transitions.
obs_dim, act_dim — observation / action dimensions.
alpha — priority exponent (default 0.6).
beta_start — initial IS exponent (default 0.4, annealed to 1).

Source

pub fn push( &mut self, obs: impl AsRef<[f32]>, action: impl AsRef<[f32]>, reward: f32, next_obs: impl AsRef<[f32]>, done: bool, )

Push a transition with maximum priority (so it will be sampled at least once).

Source

pub fn update_priority(&mut self, index: usize, priority: f64)

Update priority for a transition that was previously sampled.

§Arguments

index — the buffer index returned in PrioritySample::index.
priority — new absolute priority (typically |TD error| + ε).

Source

pub fn set_beta(&mut self, beta: f64)

Set the current β for IS weight computation.

Source

pub fn anneal_beta(&mut self, step: f64)

Anneal β toward 1 by step (additive).

Source

pub fn len(&self) -> usize

Number of stored transitions.

Source

pub fn is_empty(&self) -> bool

Returns true if empty.

Source

pub fn sample( &self, batch_size: usize, handle: &mut RlHandle, ) -> RlResult<Vec<PrioritySample>>

Sample batch_size transitions using stratified proportional sampling.

Stratified: the [0, total_priority] interval is divided into batch_size equal strata and one sample is drawn uniformly from each stratum. This reduces variance compared to fully random sampling.

§Errors

RlError::InsufficientTransitions if fewer than batch_size transitions are stored (size < batch_size).
RlError::ZeroPrioritySum if all priorities are zero.

Trait Implementations§

Source §

impl Clone for PrioritizedReplayBuffer

Source §

fn clone(&self) -> PrioritizedReplayBuffer

Returns a duplicate of the value. Read more

1.0.0 · Source§

fn clone_from(&mut self, source: &Self)

Performs copy-assignment from source. Read more

Source §

impl Debug for PrioritizedReplayBuffer

Source §

fn fmt(&self, f: &mut Formatter<'_>) -> Result

Formats the value using the given formatter. Read more

Auto Trait Implementations§

§

impl UnwindSafe for PrioritizedReplayBuffer

Blanket Implementations§

Source §

impl<T> Any for T
where T: 'static + ?Sized,

Source §

fn type_id(&self) -> TypeId

Gets the TypeId of self. Read more

Source §

impl<T> Borrow<T> for T
where T: ?Sized,

Source §

fn borrow(&self) -> &T

Immutably borrows from an owned value. Read more

Source §

impl<T> BorrowMut<T> for T
where T: ?Sized,

Source §

fn borrow_mut(&mut self) -> &mut T

Mutably borrows from an owned value. Read more

Source §

impl<T> CloneToUninit for T
where T: Clone,

Source §

unsafe fn clone_to_uninit(&self, dest: *mut u8)

🔬This is a nightly-only experimental API. (clone_to_uninit)

Performs copy-assignment from self to dest. Read more

Source §

impl<T> From<T> for T

Source §

fn from(t: T) -> T

Returns the argument unchanged.

Source §

impl<T> Instrument for T

Source §

fn instrument(self, span: Span) -> Instrumented<Self>

Instruments this type with the provided Span, returning an Instrumented wrapper. Read more

Source §

fn in_current_span(self) -> Instrumented<Self>

Instruments this type with the current Span, returning an Instrumented wrapper. Read more

Source §

impl<T, U> Into<U> for T
where U: From<T>,

Source §

fn into(self) -> U

Calls U::from(self).

That is, this conversion is whatever the implementation of From<T> for U chooses to do.

Source §

impl<T> ToOwned for T
where T: Clone,

Source §

type Owned = T

The resulting type after obtaining ownership.

Source §

fn to_owned(&self) -> T

Creates owned data from borrowed data, usually by cloning. Read more

Source §

fn clone_into(&self, target: &mut T)

Uses borrowed data to replace owned data, usually by cloning. Read more

Source §

impl<T, U> TryFrom<U> for T
where U: Into<T>,

Source §

type Error = Infallible

The type returned in the event of a conversion error.

Source §

fn try_from(value: U) -> Result<T, <T as TryFrom<U>>::Error>

Performs the conversion.

Source §

impl<T, U> TryInto<U> for T
where U: TryFrom<T>,

Source §

type Error = <U as TryFrom<T>>::Error

The type returned in the event of a conversion error.

Source §

fn try_into(self) -> Result<U, <U as TryFrom<T>>::Error>

Performs the conversion.

Source §

impl<T> WithSubscriber for T

Source §

fn with_subscriber<S>(self, subscriber: S) -> WithDispatch<Self>
where S: Into<Dispatch>,

Attaches the provided Subscriber to this type, returning a WithDispatch wrapper. Read more

Source §

fn with_current_subscriber(self) -> WithDispatch<Self>

Attaches the current default Subscriber to this type, returning a WithDispatch wrapper. Read more

Struct PrioritizedReplayBuffer Copy item path

Implementations§

impl PrioritizedReplayBuffer

pub fn new( capacity: usize, obs_dim: usize, act_dim: usize, alpha: f64, beta_start: f64, ) -> Self

pub fn push( &mut self, obs: impl AsRef<[f32]>, action: impl AsRef<[f32]>, reward: f32, next_obs: impl AsRef<[f32]>, done: bool, )

pub fn update_priority(&mut self, index: usize, priority: f64)

§Arguments

pub fn set_beta(&mut self, beta: f64)

pub fn anneal_beta(&mut self, step: f64)

pub fn len(&self) -> usize

pub fn is_empty(&self) -> bool

pub fn sample( &self, batch_size: usize, handle: &mut RlHandle, ) -> RlResult<Vec<PrioritySample>>

§Errors

Trait Implementations§

impl Clone for PrioritizedReplayBuffer

fn clone(&self) -> PrioritizedReplayBuffer

fn clone_from(&mut self, source: &Self)

impl Debug for PrioritizedReplayBuffer

fn fmt(&self, f: &mut Formatter<'_>) -> Result

Auto Trait Implementations§

impl Freeze for PrioritizedReplayBuffer

impl RefUnwindSafe for PrioritizedReplayBuffer

impl Send for PrioritizedReplayBuffer

impl Sync for PrioritizedReplayBuffer

impl Unpin for PrioritizedReplayBuffer

impl UnsafeUnpin for PrioritizedReplayBuffer

impl UnwindSafe for PrioritizedReplayBuffer

Blanket Implementations§

impl<T> Any for T where T: 'static + ?Sized,

fn type_id(&self) -> TypeId

impl<T> Borrow<T> for T where T: ?Sized,

fn borrow(&self) -> &T

impl<T> BorrowMut<T> for T where T: ?Sized,

fn borrow_mut(&mut self) -> &mut T

impl<T> CloneToUninit for T where T: Clone,

unsafe fn clone_to_uninit(&self, dest: *mut u8)

impl<T> From<T> for T

fn from(t: T) -> T

impl<T> Instrument for T

fn instrument(self, span: Span) -> Instrumented<Self>

fn in_current_span(self) -> Instrumented<Self>

impl<T, U> Into<U> for T where U: From<T>,

fn into(self) -> U

impl<T> ToOwned for T where T: Clone,

type Owned = T

fn to_owned(&self) -> T

fn clone_into(&self, target: &mut T)

impl<T, U> TryFrom<U> for T where U: Into<T>,

type Error = Infallible

fn try_from(value: U) -> Result<T, <T as TryFrom<U>>::Error>

impl<T, U> TryInto<U> for T where U: TryFrom<T>,

type Error = <U as TryFrom<T>>::Error

fn try_into(self) -> Result<U, <U as TryFrom<T>>::Error>

impl<T> WithSubscriber for T

fn with_subscriber<S>(self, subscriber: S) -> WithDispatch<Self> where S: Into<Dispatch>,

fn with_current_subscriber(self) -> WithDispatch<Self>

Struct PrioritizedReplayBuffer

impl<T> Any for T
where T: 'static + ?Sized,

impl<T> Borrow<T> for T
where T: ?Sized,

impl<T> BorrowMut<T> for T
where T: ?Sized,

impl<T> CloneToUninit for T
where T: Clone,

impl<T, U> Into<U> for T
where U: From<T>,

impl<T> ToOwned for T
where T: Clone,

impl<T, U> TryFrom<U> for T
where U: Into<T>,

impl<T, U> TryInto<U> for T
where U: TryFrom<T>,

fn with_subscriber<S>(self, subscriber: S) -> WithDispatch<Self>
where S: Into<Dispatch>,