Struct relearn::envs::UniformBernoulliBandits[−][src]

pub struct UniformBernoulliBandits {
    pub num_arms: usize,
}

Expand description

A distribution over Bernoulli bandit environments with uniformly sampled means.

The mean of each arm is sampled uniformly from [0, 1].

Reference

This environment distribution is used in the paper “RL^2: Fast Reinforcement Learning via Slow Reinforcement Learning” by Duan et al.

Fields

num_arms: usize

Number of bandit arms.

Implementations

[src]

impl UniformBernoulliBandits

[src]

pub const fn new(num_arms: usize) -> Self

Trait Implementations

[src]

impl Clone for UniformBernoulliBandits

[src]

fn clone(&self) -> UniformBernoulliBandits

Returns a copy of the value. Read more

1.0.0[src]

fn clone_from(&mut self, source: &Self)

Performs copy-assignment from source. Read more

[src]

impl Debug for UniformBernoulliBandits

[src]

fn fmt(&self, f: &mut Formatter<'_>) -> Result

Formats the value using the given formatter. Read more

[src]

impl Default for UniformBernoulliBandits

[src]

fn default() -> Self

Returns the “default value” for a type. Read more

[src]

impl EnvStructure for UniformBernoulliBandits

type ObservationSpace = SingletonSpace

type ActionSpace = IndexSpace

[src]

fn observation_space(&self) -> Self::ObservationSpace

Space containing all possible observations. Read more

[src]

fn action_space(&self) -> Self::ActionSpace

The space of all possible actions. Read more

[src]

fn reward_range(&self) -> (f64, f64)

A lower and upper bound on possible reward values. Read more

[src]

fn discount_factor(&self) -> f64

A discount factor applied to future rewards. Read more

[src]

impl From<&'_ Options> for UniformBernoulliBandits

[src]

fn from(opts: &Options) -> Self

Performs the conversion.

[src]

impl Hash for UniformBernoulliBandits

[src]

fn hash<H: Hasher>(&self, state: &mut H)

Feeds this value into the given Hasher. Read more

1.3.0[src]

fn hash_slice<H>(data: &[Self], state: &mut H) where
H: Hasher,

Feeds a slice of this type into the given Hasher. Read more

[src]

impl PartialEq<UniformBernoulliBandits> for UniformBernoulliBandits

[src]

fn eq(&self, other: &UniformBernoulliBandits) -> bool

This method tests for self and other values to be equal, and is used by ==. Read more

[src]

fn ne(&self, other: &UniformBernoulliBandits) -> bool

This method tests for !=.

[src]

impl PomdpDistribution for UniformBernoulliBandits

type Pomdp = BernoulliBandit

[src]

fn sample_pomdp(&self, rng: &mut StdRng) -> Self::Pomdp

Sample a POMDP from the distribution. Read more

[src]

impl Update<&'_ Options> for UniformBernoulliBandits

[src]

fn update(&mut self, opts: &Options)

Update in-place from the given source value.

[src]

impl StructuralPartialEq for UniformBernoulliBandits

Auto Trait Implementations

impl RefUnwindSafe for UniformBernoulliBandits

impl Send for UniformBernoulliBandits

impl Sync for UniformBernoulliBandits

impl Unpin for UniformBernoulliBandits

impl UnwindSafe for UniformBernoulliBandits

Blanket Implementations

[src]

impl<T> Any for T where
T: 'static + ?Sized,

[src]

pub fn type_id(&self) -> TypeId

Gets the TypeId of self. Read more

[src]

impl<T> Borrow<T> for T where
T: ?Sized,

[src]

pub fn borrow(&self) -> &T

Immutably borrows from an owned value. Read more

[src]

impl<T> BorrowMut<T> for T where
T: ?Sized,

[src]

pub fn borrow_mut(&mut self) -> &mut T

Mutably borrows from an owned value. Read more

[src]

impl<T> CastInto<T> for T

[src]

pub fn cast_into(Self) -> T

[src]

impl<T> EnvDistribution for T where
T: PomdpDistribution,

type Environment = PomdpEnv<<T as PomdpDistribution>::Pomdp>

[src]

pub fn sample_environment(
&Self,
&mut StdRng
) -> <T as EnvDistribution>::Environment

Sample an environment from the distribution. Read more

[src]

impl<Q, K> Equivalent<K> for Q where
Q: Eq + ?Sized,
K: Borrow<Q> + ?Sized,

[src]

pub fn equivalent(&self, key: &K) -> bool

Compare self to key and return true if they are equal.

[src]

impl<T> From<T> for T

[src]

pub fn from(t: T) -> T

Performs the conversion.

[src]

impl<T, U> Into<U> for T where
U: From<T>,

[src]

pub fn into(self) -> U

Performs the conversion.

[src]

impl<T> ToOwned for T where
T: Clone,

type Owned = T

The resulting type after obtaining ownership.

[src]

pub fn to_owned(&self) -> T

Creates owned data from borrowed data, usually by cloning. Read more

[src]

pub fn clone_into(&self, target: &mut T)

🔬 This is a nightly-only experimental API. (toowned_clone_into)

recently added

Uses borrowed data to replace owned data, usually by cloning. Read more

[src]

impl<T, U> TryFrom<U> for T where
U: Into<T>,

type Error = Infallible

The type returned in the event of a conversion error.

[src]

pub fn try_from(value: U) -> Result<T, <T as TryFrom<U>>::Error>

Performs the conversion.

[src]

impl<T, U> TryInto<U> for T where
U: TryFrom<T>,

type Error = <U as TryFrom<T>>::Error

The type returned in the event of a conversion error.

[src]

pub fn try_into(self) -> Result<U, <U as TryFrom<T>>::Error>

Performs the conversion.

impl<V, T> VZip<V> for T where
V: MultiLane<T>,

pub fn vzip(self) -> V

[src]

impl<T, U> WithUpdate<T> for U where
U: Update<T>,

[src]

pub fn with_update(Self, T) -> U

Apply an update from the given source value.

Struct relearn::envs::UniformBernoulliBandits[−][src]

Reference

Fields

Implementations

impl UniformBernoulliBandits

pub const fn new(num_arms: usize) -> Self

Trait Implementations

impl Clone for UniformBernoulliBandits

fn clone(&self) -> UniformBernoulliBandits

fn clone_from(&mut self, source: &Self)

impl Debug for UniformBernoulliBandits

fn fmt(&self, f: &mut Formatter<'_>) -> Result

impl Default for UniformBernoulliBandits

fn default() -> Self

impl EnvStructure for UniformBernoulliBandits

type ObservationSpace = SingletonSpace

type ActionSpace = IndexSpace

fn observation_space(&self) -> Self::ObservationSpace

fn action_space(&self) -> Self::ActionSpace

fn reward_range(&self) -> (f64, f64)

fn discount_factor(&self) -> f64

impl From<&'_ Options> for UniformBernoulliBandits

fn from(opts: &Options) -> Self

impl Hash for UniformBernoulliBandits

fn hash<__H: Hasher>(&self, state: &mut __H)

fn hash_slice<H>(data: &[Self], state: &mut H) where H: Hasher,

impl PartialEq<UniformBernoulliBandits> for UniformBernoulliBandits

fn eq(&self, other: &UniformBernoulliBandits) -> bool

fn ne(&self, other: &UniformBernoulliBandits) -> bool

impl PomdpDistribution for UniformBernoulliBandits

type Pomdp = BernoulliBandit

fn sample_pomdp(&self, rng: &mut StdRng) -> Self::Pomdp

impl Update<&'_ Options> for UniformBernoulliBandits

fn update(&mut self, opts: &Options)

impl CloneBuild for UniformBernoulliBandits

impl Copy for UniformBernoulliBandits

impl Eq for UniformBernoulliBandits

impl StructuralEq for UniformBernoulliBandits

impl StructuralPartialEq for UniformBernoulliBandits

Auto Trait Implementations

impl RefUnwindSafe for UniformBernoulliBandits

impl Send for UniformBernoulliBandits

impl Sync for UniformBernoulliBandits

impl Unpin for UniformBernoulliBandits

impl UnwindSafe for UniformBernoulliBandits

Blanket Implementations

impl<T> Any for T where T: 'static + ?Sized,

pub fn type_id(&self) -> TypeId

impl<T> Borrow<T> for T where T: ?Sized,

pub fn borrow(&self) -> &T

impl<T> BorrowMut<T> for T where T: ?Sized,

pub fn borrow_mut(&mut self) -> &mut T

impl<T> CastInto<T> for T

pub fn cast_into(Self) -> T

impl<T> EnvDistribution for T where T: PomdpDistribution,

type Environment = PomdpEnv<<T as PomdpDistribution>::Pomdp>

pub fn sample_environment( &Self, &mut StdRng) -> <T as EnvDistribution>::Environment

impl<Q, K> Equivalent<K> for Q where Q: Eq + ?Sized, K: Borrow<Q> + ?Sized,

pub fn equivalent(&self, key: &K) -> bool

impl<T> From<T> for T

pub fn from(t: T) -> T

impl<T, U> Into<U> for T where U: From<T>,

pub fn into(self) -> U

impl<T> ToOwned for T where T: Clone,

type Owned = T

pub fn to_owned(&self) -> T

pub fn clone_into(&self, target: &mut T)

impl<T, U> TryFrom<U> for T where U: Into<T>,

type Error = Infallible

pub fn try_from(value: U) -> Result<T, <T as TryFrom<U>>::Error>

impl<T, U> TryInto<U> for T where U: TryFrom<T>,

type Error = <U as TryFrom<T>>::Error

pub fn try_into(self) -> Result<U, <U as TryFrom<T>>::Error>

impl<V, T> VZip<V> for T where V: MultiLane<T>,

pub fn vzip(self) -> V

impl<T, U> WithUpdate<T> for U where U: Update<T>,

pub fn with_update(Self, T) -> U

fn reward_range(&self) -> (f64, f64)

fn hash<H: Hasher>(&self, state: &mut H)

fn hash_slice<H>(data: &[Self], state: &mut H) where
H: Hasher,

impl<T> Any for T where
T: 'static + ?Sized,

impl<T> Borrow<T> for T where
T: ?Sized,

impl<T> BorrowMut<T> for T where
T: ?Sized,

impl<T> EnvDistribution for T where
T: PomdpDistribution,

pub fn sample_environment(
&Self,
&mut StdRng
) -> <T as EnvDistribution>::Environment

impl<Q, K> Equivalent<K> for Q where
Q: Eq + ?Sized,
K: Borrow<Q> + ?Sized,

impl<T, U> Into<U> for T where
U: From<T>,

impl<T> ToOwned for T where
T: Clone,

impl<T, U> TryFrom<U> for T where
U: Into<T>,

impl<T, U> TryInto<U> for T where
U: TryFrom<T>,

impl<V, T> VZip<V> for T where
V: MultiLane<T>,

impl<T, U> WithUpdate<T> for U where
U: Update<T>,