Struct relearn::envs::UniformBernoulliBandits

source · [−]

pub struct UniformBernoulliBandits {
    pub num_arms: usize,
}

Expand description

A distribution over Bernoulli bandit environments with uniformly sampled means.

The mean of each arm is sampled uniformly from [0, 1].

Reference

This environment distribution is used in the paper “RL^2: Fast Reinforcement Learning via Slow Reinforcement Learning” by Duan et al.

Fields

num_arms: usize

Number of bandit arms.

Implementations

source

impl UniformBernoulliBandits

source

pub const fn new(num_arms: usize) -> Self

Trait Implementations

source

impl Clone for UniformBernoulliBandits

source

fn clone(&self) -> UniformBernoulliBandits

Returns a copy of the value. Read more

1.0.0 · source

fn clone_from(&mut self, source: &Self)

Performs copy-assignment from source. Read more

source

impl Debug for UniformBernoulliBandits

source

fn fmt(&self, f: &mut Formatter<'_>) -> Result

Formats the value using the given formatter. Read more

source

impl Default for UniformBernoulliBandits

source

fn default() -> Self

Returns the “default value” for a type. Read more

source

impl<'de> Deserialize<'de> for UniformBernoulliBandits

source

fn deserialize<__D>(__deserializer: __D) -> Result<Self, __D::Error> where
__D: Deserializer<'de>,

Deserialize this value from the given Serde deserializer. Read more

source

impl EnvDistribution for UniformBernoulliBandits

type State = <<UniformBernoulliBandits as EnvDistribution>::Environment as Environment>::State

type Observation = <<UniformBernoulliBandits as EnvDistribution>::Environment as Environment>::Observation

type Action = <<UniformBernoulliBandits as EnvDistribution>::Environment as Environment>::Action

type Feedback = <<UniformBernoulliBandits as EnvDistribution>::Environment as Environment>::Feedback

type Environment = Bandit<Bernoulli>

source

fn sample_environment(&self, rng: &mut Prng) -> Self::Environment

Sample an environment from the distribution. Read more

source

impl EnvStructure for UniformBernoulliBandits

type ObservationSpace = SingletonSpace

type ActionSpace = IndexSpace

type FeedbackSpace = IntervalSpace<Reward>

source

fn observation_space(&self) -> Self::ObservationSpace

Space containing all possible observations. Read more

source

fn action_space(&self) -> Self::ActionSpace

The space of all possible actions. Read more

source

fn feedback_space(&self) -> Self::FeedbackSpace

The space of all possible feedback. Read more

source

fn discount_factor(&self) -> f64

A discount factor applied to future feedback. Read more

source

impl Hash for UniformBernoulliBandits

source

fn hash<H: Hasher>(&self, state: &mut H)

Feeds this value into the given Hasher. Read more

1.3.0 · source

fn hash_slice<H>(data: &[Self], state: &mut H) where
H: Hasher,

Feeds a slice of this type into the given Hasher. Read more

source

impl PartialEq<UniformBernoulliBandits> for UniformBernoulliBandits

source

fn eq(&self, other: &UniformBernoulliBandits) -> bool

This method tests for self and other values to be equal, and is used by ==. Read more

source

fn ne(&self, other: &UniformBernoulliBandits) -> bool

This method tests for !=.

source

impl Serialize for UniformBernoulliBandits

source

fn serialize<S>(&self, serializer: S) -> Result<S::Ok, S::Error> where
S: Serializer,

Serialize this value into the given Serde serializer. Read more

source

impl StructuralPartialEq for UniformBernoulliBandits

Auto Trait Implementations

impl RefUnwindSafe for UniformBernoulliBandits

impl Send for UniformBernoulliBandits

impl Sync for UniformBernoulliBandits

impl Unpin for UniformBernoulliBandits

impl UnwindSafe for UniformBernoulliBandits

Blanket Implementations

source

impl<T> Any for T where
T: 'static + ?Sized,

source

fn type_id(&self) -> TypeId

Gets the TypeId of self. Read more

source

impl<T> AsAny for T where
T: Any,

source

fn as_any(&self) -> &(dyn Any + 'static)

Convert into an Any trait reference.

source

impl<T> Borrow<T> for T where
T: ?Sized,

const: unstable · source

fn borrow(&self) -> &T

Immutably borrows from an owned value. Read more

source

impl<T> BorrowMut<T> for T where
T: ?Sized,

const: unstable · source

fn borrow_mut(&mut self) -> &mut T

Mutably borrows from an owned value. Read more

source

impl<Q, K> Equivalent<K> for Q where
Q: Eq + ?Sized,
K: Borrow<Q> + ?Sized,

source

fn equivalent(&self, key: &K) -> bool

Compare self to key and return true if they are equal.

source

impl<T> From<T> for T

const: unstable · source

fn from(t: T) -> T

Returns the argument unchanged.

source

impl<T, U> Into<U> for T where
U: From<T>,

const: unstable · source

fn into(self) -> U

Calls U::from(self).

That is, this conversion is whatever the implementation of From<T> for U chooses to do.

impl<T> Pointable for T

const ALIGN: usize = mem::align_of::<T>()

The alignment of pointer.

type Init = T

The type for initializers.

unsafe fn init(init: <T as Pointable>::Init) -> usize

Initializes a with the given initializer. Read more

unsafe fn deref<'a>(ptr: usize) -> &'a T

Dereferences the given pointer. Read more

unsafe fn deref_mut<'a>(ptr: usize) -> &'a mut T

Mutably dereferences the given pointer. Read more

unsafe fn drop(ptr: usize)

Drops the object pointed to by the given pointer. Read more

source

impl<T> Same<T> for T

type Output = T

Should always be Self

source

impl<T> ToOwned for T where
T: Clone,

type Owned = T

The resulting type after obtaining ownership.

source

fn to_owned(&self) -> T

Creates owned data from borrowed data, usually by cloning. Read more

source

fn clone_into(&self, target: &mut T)

Uses borrowed data to replace owned data, usually by cloning. Read more

source

impl<T, U> TryFrom<U> for T where
U: Into<T>,

type Error = Infallible

The type returned in the event of a conversion error.

const: unstable · source

fn try_from(value: U) -> Result<T, <T as TryFrom<U>>::Error>

Performs the conversion.

source

impl<T, U> TryInto<U> for T where
U: TryFrom<T>,

type Error = <U as TryFrom<T>>::Error

The type returned in the event of a conversion error.

const: unstable · source

fn try_into(self) -> Result<U, <U as TryFrom<T>>::Error>

Performs the conversion.

impl<V, T> VZip<V> for T where
V: MultiLane<T>,

fn vzip(self) -> V

source

impl<T> DeserializeOwned for T where
T: for<'de> Deserialize<'de>,

source

Struct relearn::envs::UniformBernoulliBandits

Fields

Implementations

impl UniformBernoulliBandits

pub const fn new(num_arms: usize) -> Self

Trait Implementations

impl Clone for UniformBernoulliBandits

fn clone(&self) -> UniformBernoulliBandits

fn clone_from(&mut self, source: &Self)

impl Debug for UniformBernoulliBandits

fn fmt(&self, f: &mut Formatter<'_>) -> Result

impl Default for UniformBernoulliBandits

fn default() -> Self

impl<'de> Deserialize<'de> for UniformBernoulliBandits

fn deserialize<__D>(__deserializer: __D) -> Result<Self, __D::Error> where __D: Deserializer<'de>,

impl EnvDistribution for UniformBernoulliBandits

type State = <<UniformBernoulliBandits as EnvDistribution>::Environment as Environment>::State

type Observation = <<UniformBernoulliBandits as EnvDistribution>::Environment as Environment>::Observation

type Action = <<UniformBernoulliBandits as EnvDistribution>::Environment as Environment>::Action

type Feedback = <<UniformBernoulliBandits as EnvDistribution>::Environment as Environment>::Feedback

type Environment = Bandit<Bernoulli>

fn sample_environment(&self, rng: &mut Prng) -> Self::Environment

impl EnvStructure for UniformBernoulliBandits

type ObservationSpace = SingletonSpace

type ActionSpace = IndexSpace

type FeedbackSpace = IntervalSpace<Reward>

fn observation_space(&self) -> Self::ObservationSpace

fn action_space(&self) -> Self::ActionSpace

fn feedback_space(&self) -> Self::FeedbackSpace

fn discount_factor(&self) -> f64

impl Hash for UniformBernoulliBandits

fn hash<__H: Hasher>(&self, state: &mut __H)

fn hash_slice<H>(data: &[Self], state: &mut H) where H: Hasher,

impl PartialEq<UniformBernoulliBandits> for UniformBernoulliBandits

fn eq(&self, other: &UniformBernoulliBandits) -> bool

fn ne(&self, other: &UniformBernoulliBandits) -> bool

impl Serialize for UniformBernoulliBandits

fn serialize<__S>(&self, __serializer: __S) -> Result<__S::Ok, __S::Error> where __S: Serializer,

impl CloneBuild for UniformBernoulliBandits

impl Copy for UniformBernoulliBandits

impl Eq for UniformBernoulliBandits

impl StructuralEq for UniformBernoulliBandits

impl StructuralPartialEq for UniformBernoulliBandits

Auto Trait Implementations

impl RefUnwindSafe for UniformBernoulliBandits

impl Send for UniformBernoulliBandits

impl Sync for UniformBernoulliBandits

impl Unpin for UniformBernoulliBandits

impl UnwindSafe for UniformBernoulliBandits

Blanket Implementations

impl<T> Any for T where T: 'static + ?Sized,

fn type_id(&self) -> TypeId

impl<T> AsAny for T where T: Any,

fn as_any(&self) -> &(dyn Any + 'static)

impl<T> Borrow<T> for T where T: ?Sized,

fn borrow(&self) -> &T

impl<T> BorrowMut<T> for T where T: ?Sized,

fn borrow_mut(&mut self) -> &mut T

impl<Q, K> Equivalent<K> for Q where Q: Eq + ?Sized, K: Borrow<Q> + ?Sized,

fn equivalent(&self, key: &K) -> bool

impl<T> From<T> for T

fn from(t: T) -> T

impl<T, U> Into<U> for T where U: From<T>,

fn into(self) -> U

impl<T> Pointable for T

const ALIGN: usize = mem::align_of::<T>()

type Init = T

unsafe fn init(init: <T as Pointable>::Init) -> usize

unsafe fn deref<'a>(ptr: usize) -> &'a T

unsafe fn deref_mut<'a>(ptr: usize) -> &'a mut T

unsafe fn drop(ptr: usize)

impl<T> Same<T> for T

type Output = T

impl<T> ToOwned for T where T: Clone,

type Owned = T

fn to_owned(&self) -> T

fn clone_into(&self, target: &mut T)

impl<T, U> TryFrom<U> for T where U: Into<T>,

type Error = Infallible

fn try_from(value: U) -> Result<T, <T as TryFrom<U>>::Error>

fn deserialize<__D>(__deserializer: __D) -> Result<Self, __D::Error> where
__D: Deserializer<'de>,

fn hash<H: Hasher>(&self, state: &mut H)

fn hash_slice<H>(data: &[Self], state: &mut H) where
H: Hasher,

fn serialize<S>(&self, serializer: S) -> Result<S::Ok, S::Error> where
S: Serializer,

impl<T> Any for T where
T: 'static + ?Sized,

impl<T> AsAny for T where
T: Any,

impl<T> Borrow<T> for T where
T: ?Sized,

impl<T> BorrowMut<T> for T where
T: ?Sized,

impl<Q, K> Equivalent<K> for Q where
Q: Eq + ?Sized,
K: Borrow<Q> + ?Sized,

impl<T, U> Into<U> for T where
U: From<T>,

impl<T> ToOwned for T where
T: Clone,

impl<T, U> TryFrom<U> for T where
U: Into<T>,

impl<T, U> TryInto<U> for T where
U: TryFrom<T>,

impl<V, T> VZip<V> for T where
V: MultiLane<T>,

impl<T> DeserializeOwned for T where
T: for<'de> Deserialize<'de>,

impl<T> PomdpStructure for T where
T: EnvStructure<FeedbackSpace = IntervalSpace<Reward>>,