Struct relearn::torch::critic::Gae[−][src]

pub struct Gae<V> {
    pub gamma: f64,
    pub lambda: f64,
    pub value_fn: V,
}

Expand description

Generalized Advantage Estimator critic.

Note

Episodes that end in a non-terminal state are not yet handled correctly: the estimator currently assumes that every episode ends with a reward of 0.

Reference

"High-Dimensional Continuous Control Using Generalized Advantage Estimation" by John Schulman, Philipp Moritz, Sergey Levine, Michael I. Jordan, and Pieter Abbeel. ICLR 2016. https://arxiv.org/pdf/1506.02438.pdf

Fields

gamma: f64

Clips the environment discount factor to be no more than this.

lambda: f64

Advantage interpolation factor between one-step residuals (=0) and full return (=1).

value_fn: V

State value function module.

Trait Implementations

[src]

impl<V: Clone> Clone for Gae<V>

[src]

fn clone(&self) -> Gae<V>

Returns a copy of the value. Read more

1.0.0[src]

fn clone_from(&mut self, source: &Self)

Performs copy-assignment from source. Read more

[src]

impl<V> Critic for Gae<V> where
V: SequenceModule,

[src]

fn trainable(&self) -> bool

Whether this critic has trainable internal parameters.

[src]

fn discount_factor(&self, env_discount_factor: f64) -> f64

Get the discount factor to use when calculating step returns. Read more

[src]

fn seq_packed(&self, features: &dyn PackedHistoryFeaturesView) -> Tensor

Provide values for a packed sequence of steps. Read more

[src]

fn loss(&self, features: &dyn PackedHistoryFeaturesView) -> Option<Tensor>

The loss of any trainable internal variables given the observed history features. Read more

[src]

impl<V: Debug> Debug for Gae<V>

[src]

fn fmt(&self, f: &mut Formatter<'_>) -> Result

Formats the value using the given formatter. Read more

[src]

impl<V: PartialEq> PartialEq<Gae<V>> for Gae<V>

[src]

fn eq(&self, other: &Gae<V>) -> bool

This method tests for self and other values to be equal, and is used by ==. Read more

[src]

fn ne(&self, other: &Gae<V>) -> bool

This method tests for !=.

[src]

impl<V: Copy> Copy for Gae<V>

[src]

impl<V> StructuralPartialEq for Gae<V>

Auto Trait Implementations

impl<V> RefUnwindSafe for Gae<V> where
V: RefUnwindSafe,

impl<V> Send for Gae<V> where
V: Send,

impl<V> Sync for Gae<V> where
V: Sync,

impl<V> Unpin for Gae<V> where
V: Unpin,

impl<V> UnwindSafe for Gae<V> where
V: UnwindSafe,

Blanket Implementations

[src]

impl<T> Any for T where
T: 'static + ?Sized,

[src]

pub fn type_id(&self) -> TypeId

Gets the TypeId of self. Read more

[src]

impl<T> Borrow<T> for T where
T: ?Sized,

[src]

pub fn borrow(&self) -> &T

Immutably borrows from an owned value. Read more

[src]

impl<T> BorrowMut<T> for T where
T: ?Sized,

[src]

pub fn borrow_mut(&mut self) -> &mut T

Mutably borrows from an owned value. Read more

[src]

impl<T> From<T> for T

pub fn from(t: T) -> T

Performs the conversion.

[src]

impl<T, U> Into<U> for T where
U: From<T>,

[src]

pub fn into(self) -> U

Performs the conversion.

[src]

impl<T> ToOwned for T where
T: Clone,

type Owned = T

The resulting type after obtaining ownership.

[src]

pub fn to_owned(&self) -> T

Creates owned data from borrowed data, usually by cloning. Read more

[src]

pub fn clone_into(&self, target: &mut T)

🔬 This is a nightly-only experimental API. (toowned_clone_into)

recently added

Uses borrowed data to replace owned data, usually by cloning. Read more

[src]

impl<T, U> TryFrom<U> for T where
U: Into<T>,

type Error = Infallible

The type returned in the event of a conversion error.

[src]

pub fn try_from(value: U) -> Result<T, <T as TryFrom<U>>::Error>

Performs the conversion.

[src]

impl<T, U> TryInto<U> for T where
U: TryFrom<T>,

type Error = <U as TryFrom<T>>::Error

The type returned in the event of a conversion error.

[src]

pub fn try_into(self) -> Result<U, <U as TryFrom<T>>::Error>

Performs the conversion.

Struct relearn::torch::critic::Gae[−][src]

Note

Reference

Fields

Trait Implementations

impl<V: Clone> Clone for Gae<V>

fn clone(&self) -> Gae<V>

fn clone_from(&mut self, source: &Self)

impl<V> Critic for Gae<V> where V: SequenceModule,

fn trainable(&self) -> bool

fn discount_factor(&self, env_discount_factor: f64) -> f64

fn seq_packed(&self, features: &dyn PackedHistoryFeaturesView) -> Tensor

fn loss(&self, features: &dyn PackedHistoryFeaturesView) -> Option<Tensor>

impl<V: Debug> Debug for Gae<V>

fn fmt(&self, f: &mut Formatter<'_>) -> Result

impl<V: PartialEq> PartialEq<Gae<V>> for Gae<V>

fn eq(&self, other: &Gae<V>) -> bool

fn ne(&self, other: &Gae<V>) -> bool

impl<V: Copy> Copy for Gae<V>

impl<V> StructuralPartialEq for Gae<V>

Auto Trait Implementations

impl<V> RefUnwindSafe for Gae<V> where V: RefUnwindSafe,

impl<V> Send for Gae<V> where V: Send,

impl<V> Sync for Gae<V> where V: Sync,

impl<V> Unpin for Gae<V> where V: Unpin,

impl<V> UnwindSafe for Gae<V> where V: UnwindSafe,

Blanket Implementations

impl<T> Any for T where T: 'static + ?Sized,

pub fn type_id(&self) -> TypeId

impl<T> Borrow<T> for T where T: ?Sized,

pub fn borrow(&self) -> &T

impl<T> BorrowMut<T> for T where T: ?Sized,

pub fn borrow_mut(&mut self) -> &mut T

impl<T> CastInto<T> for T

pub fn cast_into(Self) -> T

impl<T> From<T> for T

pub fn from(t: T) -> T

impl<T, U> Into<U> for T where U: From<T>,

pub fn into(self) -> U

impl<T> ToOwned for T where T: Clone,

type Owned = T

pub fn to_owned(&self) -> T

pub fn clone_into(&self, target: &mut T)

impl<T, U> TryFrom<U> for T where U: Into<T>,

type Error = Infallible

pub fn try_from(value: U) -> Result<T, <T as TryFrom<U>>::Error>

impl<T, U> TryInto<U> for T where U: TryFrom<T>,

type Error = <U as TryFrom<T>>::Error

pub fn try_into(self) -> Result<U, <U as TryFrom<T>>::Error>

impl<V, T> VZip<V> for T where V: MultiLane<T>,

pub fn vzip(self) -> V

impl<V> Critic for Gae<V> where
V: SequenceModule,

impl<V> RefUnwindSafe for Gae<V> where
V: RefUnwindSafe,

impl<V> Send for Gae<V> where
V: Send,

impl<V> Sync for Gae<V> where
V: Sync,

impl<V> Unpin for Gae<V> where
V: Unpin,

impl<V> UnwindSafe for Gae<V> where
V: UnwindSafe,

impl<T> Any for T where
T: 'static + ?Sized,

impl<T> Borrow<T> for T where
T: ?Sized,

impl<T> BorrowMut<T> for T where
T: ?Sized,

impl<T, U> Into<U> for T where
U: From<T>,

impl<T> ToOwned for T where
T: Clone,

impl<T, U> TryFrom<U> for T where
U: Into<T>,

impl<T, U> TryInto<U> for T where
U: TryFrom<T>,

impl<V, T> VZip<V> for T where
V: MultiLane<T>,