Struct gym_rs::envs::classical_control::cartpole::CartPoleEnv

source ·

pub struct CartPoleEnv {
    pub action_space: Discrete,
    pub observation_space: BoxR<CartPoleObservation>,
    pub render_mode: RenderMode,
    pub state: CartPoleObservation,
    pub metadata: Metadata<Self>,
    pub gravity: O64,
    pub masscart: O64,
    pub masspole: O64,
    pub length: O64,
    pub force_mag: O64,
    pub tau: O64,
    pub kinematics_integrator: KinematicsIntegrator,
    pub theta_threshold_radians: O64,
    pub x_threshold: O64,
    pub steps_beyond_terminated: Option<usize>,
    /* private fields */
}

Expand description

An environment which implements the cart pole problem described in "Neuronlike adaptive elements that can solve difficult learning control problems".

The problem involves applying the correct forces onto a cart with a pole hinged onto it, in order to ensure the pole remains within the preconfigured regions. The agent starts by being assigned random values between (-0.05, 0.05) for all fields available in the state structure. The agent is rewarded ‘+1’ for every step taken until the episode ends.

The episode ends when any of the following conditions occur:

Termination: The magnitude of [CartPoleObservation.theta] exceeds 12 degrees (pole has fallen).
Termination: The magnitude of [CartPoleObservation.x] exceeds 2.4 (cart is outside bounds).
Truncation: Episode length is greater than 500.

Fields§

§action_space: Discrete

The available actions that can be taken.

§observation_space: BoxR<CartPoleObservation>

The range of values that can be observed.

§render_mode: RenderMode

The type of renders produced.

§state: CartPoleObservation

The current state of the environment.

§metadata: Metadata<Self>

Additional pieces of information provided by the environment.

§gravity: O64

The gravity constant applied to the environment.

§masscart: O64

The mass of the cart.

§masspole: O64

The mass of the pole.

§length: O64

Half the length of the pole.

§force_mag: O64

The default magnitude of the force applied to the cart.

§tau: O64

The number of seconds between state updates.

§kinematics_integrator: KinematicsIntegrator

The type of integration done on the differential equations found in the paper.

§theta_threshold_radians: O64

The angle, in radians, that the pole can lean to before an episode is considered terminated.

§x_threshold: O64

The x value that the cart can be at before an episode is considered terminated.

§steps_beyond_terminated: Option<usize>

The number of steps taken after the episode was terminated.

Struct gym_rs::envs::classical_control::cartpole::CartPoleEnv

Fields§

Implementations§

impl CartPoleEnv

pub fn new(render_mode: RenderMode) -> Self

Trait Implementations§

impl Clone for CartPoleEnv

fn clone(&self) -> CartPoleEnv

fn clone_from(&mut self, source: &Self)

impl Debug for CartPoleEnv

fn fmt(&self, f: &mut Formatter<'_>) -> Result

impl Env for CartPoleEnv

type Action = usize

type Observation = CartPoleObservation

type Info = ()

type ResetInfo = ()

fn step( &mut self, action: Self::Action ) -> ActionReward<Self::Observation, Self::Info>

fn reset( &mut self, seed: Option<u64>, return_info: bool, options: Option<BoxR<Self::Observation>> ) -> (Self::Observation, Option<Self::ResetInfo>)

fn render(&mut self, mode: RenderMode) -> Renders

fn close(&mut self)

impl EnvProperties for CartPoleEnv

type ActionSpace = Discrete

type ObservationSpace = BoxR<CartPoleObservation>

fn metadata(&self) -> &Metadata<Self>

fn rand_random(&self) -> &Pcg64

fn action_space(&self) -> &Self::ActionSpace

fn observation_space(&self) -> &Self::ObservationSpace

fn render_mode(&self) -> &RenderMode

fn reward_range(&self) -> &RewardRange

impl Serialize for CartPoleEnv

fn serialize<__S>(&self, __serializer: __S) -> Result<__S::Ok, __S::Error> where __S: Serializer,

Auto Trait Implementations§

impl RefUnwindSafe for CartPoleEnv

impl !Send for CartPoleEnv

impl !Sync for CartPoleEnv

impl Unpin for CartPoleEnv

impl UnwindSafe for CartPoleEnv

Blanket Implementations§

impl<T> Any for T where T: 'static + ?Sized,

fn type_id(&self) -> TypeId

impl<T> Borrow<T> for T where T: ?Sized,

fn borrow(&self) -> &T

impl<T> BorrowMut<T> for T where T: ?Sized,

fn borrow_mut(&mut self) -> &mut T

impl<T> From<T> for T

fn from(t: T) -> T

impl<T, U> Into<U> for T where U: From<T>,

fn into(self) -> U

impl<T> Same<T> for T

type Output = T

impl<SS, SP> SupersetOf<SS> for SP where SS: SubsetOf<SP>,

fn to_subset(&self) -> Option<SS>

fn is_in_subset(&self) -> bool

fn to_subset_unchecked(&self) -> SS

fn from_subset(element: &SS) -> SP

impl<T> ToOwned for T where T: Clone,

type Owned = T

fn to_owned(&self) -> T

fn clone_into(&self, target: &mut T)

impl<T, U> TryFrom<U> for T where U: Into<T>,

type Error = Infallible

fn try_from(value: U) -> Result<T, <T as TryFrom<U>>::Error>

impl<T, U> TryInto<U> for T where U: TryFrom<T>,

type Error = <U as TryFrom<T>>::Error

fn try_into(self) -> Result<U, <U as TryFrom<T>>::Error>

impl<V, T> VZip<V> for T where V: MultiLane<T>,

fn vzip(self) -> V

fn serialize<S>(&self, serializer: S) -> Result<S::Ok, S::Error> where S: Serializer,