Trait RLComponentsTypes

Source

pub trait RLComponentsTypes {
Show 13 associated items
    type Backend: AutodiffBackend;
    type Env: Environment<State = Self::State, Action = Self::Action> + 'static;
    type EnvInit: EnvironmentInit<Self::Env> + Send + 'static;
    type State: Into<<Self::Policy as Policy<Self::Backend>>::Observation> + Clone + Send + 'static;
    type Action: From<<Self::Policy as Policy<Self::Backend>>::Action> + Into<<Self::Policy as Policy<Self::Backend>>::Action> + Clone + Send + 'static;
    type Policy: Policy<Self::Backend, Observation = Self::PolicyObs, ActionDistribution = Self::PolicyAD, Action = Self::PolicyAction, ActionContext = Self::ActionContext, PolicyState = Self::PolicyState> + Send + 'static;
    type PolicyObs: Clone + Send + Batchable + 'static;
    type PolicyAD: Clone + Send + Batchable;
    type PolicyAction: Clone + Send + Batchable;
    type ActionContext: ItemLazy + Clone + Send + 'static;
    type PolicyState: Clone + Send + PolicyState<Self::Backend> + 'static;
    type LearningAgent: PolicyLearner<Self::Backend, TrainContext = Self::TrainingOutput, InnerPolicy = Self::Policy> + Send + 'static;
    type TrainingOutput: ItemLazy + Clone + Send;
}

Available on crate feature rl only.

Expand description

All components used by the reinforcement learning paradigm, grouped in one trait.

Required Associated Types§

Source

type Backend: AutodiffBackend

The backend used for training.

Source

type Env: Environment<State = Self::State, Action = Self::Action> + 'static

The learning environment.

Source

type EnvInit: EnvironmentInit<Self::Env> + Send + 'static

Specifies how to initialize the environment.

Source

type State: Into<<Self::Policy as Policy<Self::Backend>>::Observation> + Clone + Send + 'static

The type of the environment state.

Source

type Action: From<<Self::Policy as Policy<Self::Backend>>::Action> + Into<<Self::Policy as Policy<Self::Backend>>::Action> + Clone + Send + 'static

The type of the environment action.

Source

type Policy: Policy<Self::Backend, Observation = Self::PolicyObs, ActionDistribution = Self::PolicyAD, Action = Self::PolicyAction, ActionContext = Self::ActionContext, PolicyState = Self::PolicyState> + Send + 'static

The policy used to take actions in the environment.

Source

type PolicyObs: Clone + Send + Batchable + 'static

The policy’s observation type.

Source

type PolicyAD: Clone + Send + Batchable

The policy’s action distribution type.

Source

type PolicyAction: Clone + Send + Batchable

The policy’s action type.

Source

type ActionContext: ItemLazy + Clone + Send + 'static

Additional data as context for an agent’s action.

Source

type PolicyState: Clone + Send + PolicyState<Self::Backend> + 'static

The state of the parameterized policy.

Source

type LearningAgent: PolicyLearner<Self::Backend, TrainContext = Self::TrainingOutput, InnerPolicy = Self::Policy> + Send + 'static

The learning agent.

Source

type TrainingOutput: ItemLazy + Clone + Send

The output data of a training step.

Implementors§

Source §

impl<B, E, EI, A> RLComponentsTypes for RLComponentsMarker<B, E, EI, A>
where B: AutodiffBackend, E: Environment + 'static, EI: EnvironmentInit<E> + Send + 'static, A: PolicyLearner<B> + Send + 'static, A::TrainContext: ItemLazy + Clone + Send, A::InnerPolicy: Policy<B> + Send, <A::InnerPolicy as Policy<B>>::Observation: Batchable + Clone + Send, <A::InnerPolicy as Policy<B>>::ActionDistribution: Batchable + Clone + Send, <A::InnerPolicy as Policy<B>>::Action: Batchable + Clone + Send, <A::InnerPolicy as Policy<B>>::ActionContext: ItemLazy + Clone + Send + 'static, <A::InnerPolicy as Policy<B>>::PolicyState: Clone + Send, E::State: Into<<A::InnerPolicy as Policy<B>>::Observation> + Clone + Send + 'static, E::Action: From<<A::InnerPolicy as Policy<B>>::Action> + Into<<A::InnerPolicy as Policy<B>>::Action> + Clone + Send + 'static,

Source §

type PolicyAD = <<A as PolicyLearner<B>>::InnerPolicy as Policy<B>>::ActionDistribution

Source §

type PolicyAction = <<A as PolicyLearner<B>>::InnerPolicy as Policy<B>>::Action

Source §

type ActionContext = <<A as PolicyLearner<B>>::InnerPolicy as Policy<B>>::ActionContext

Source §

type PolicyState = <<A as PolicyLearner<B>>::InnerPolicy as Policy<B>>::PolicyState

Source §

type TrainingOutput = <A as PolicyLearner<B>>::TrainContext

Source §

type State = <E as Environment>::State

Source §

RLComponentsTypes

Trait RLComponentsTypes

Required Associated Types§

type Backend: AutodiffBackend

type Env: Environment<State = Self::State, Action = Self::Action> + 'static

type EnvInit: EnvironmentInit<Self::Env> + Send + 'static

type State: Into<<Self::Policy as Policy<Self::Backend>>::Observation> + Clone + Send + 'static

type Action: From<<Self::Policy as Policy<Self::Backend>>::Action> + Into<<Self::Policy as Policy<Self::Backend>>::Action> + Clone + Send + 'static

type Policy: Policy<Self::Backend, Observation = Self::PolicyObs, ActionDistribution = Self::PolicyAD, Action = Self::PolicyAction, ActionContext = Self::ActionContext, PolicyState = Self::PolicyState> + Send + 'static

type PolicyObs: Clone + Send + Batchable + 'static

type PolicyAD: Clone + Send + Batchable

type PolicyAction: Clone + Send + Batchable

type ActionContext: ItemLazy + Clone + Send + 'static

type PolicyState: Clone + Send + PolicyState<Self::Backend> + 'static

type LearningAgent: PolicyLearner<Self::Backend, TrainContext = Self::TrainingOutput, InnerPolicy = Self::Policy> + Send + 'static

type TrainingOutput: ItemLazy + Clone + Send

Implementors§

type Backend = B

type Env = E

type EnvInit = EI

type LearningAgent = A

type Policy = <A as PolicyLearner<B>>::InnerPolicy

type PolicyObs = <<A as PolicyLearner<B>>::InnerPolicy as Policy<B>>::Observation

type PolicyAD = <<A as PolicyLearner<B>>::InnerPolicy as Policy<B>>::ActionDistribution

type PolicyAction = <<A as PolicyLearner<B>>::InnerPolicy as Policy<B>>::Action

type ActionContext = <<A as PolicyLearner<B>>::InnerPolicy as Policy<B>>::ActionContext

type PolicyState = <<A as PolicyLearner<B>>::InnerPolicy as Policy<B>>::PolicyState

type TrainingOutput = <A as PolicyLearner<B>>::TrainContext

type State = <E as Environment>::State

type Action = <E as Environment>::Action

RLComponentsTypes

Trait RLComponentsTypes Copy item path

Required Associated Types§

type Backend: AutodiffBackend

type Env: Environment<State = Self::State, Action = Self::Action> + 'static

type EnvInit: EnvironmentInit<Self::Env> + Send + 'static

type State: Into<<Self::Policy as Policy<Self::Backend>>::Observation> + Clone + Send + 'static

type Action: From<<Self::Policy as Policy<Self::Backend>>::Action> + Into<<Self::Policy as Policy<Self::Backend>>::Action> + Clone + Send + 'static

type Policy: Policy<Self::Backend, Observation = Self::PolicyObs, ActionDistribution = Self::PolicyAD, Action = Self::PolicyAction, ActionContext = Self::ActionContext, PolicyState = Self::PolicyState> + Send + 'static

type PolicyObs: Clone + Send + Batchable + 'static

type PolicyAD: Clone + Send + Batchable

type PolicyAction: Clone + Send + Batchable

type ActionContext: ItemLazy + Clone + Send + 'static

type PolicyState: Clone + Send + PolicyState<Self::Backend> + 'static

type LearningAgent: PolicyLearner<Self::Backend, TrainContext = Self::TrainingOutput, InnerPolicy = Self::Policy> + Send + 'static

type TrainingOutput: ItemLazy + Clone + Send

Implementors§

type Backend = B

type Env = E

type EnvInit = EI

type LearningAgent = A

type Policy = <A as PolicyLearner<B>>::InnerPolicy

type PolicyObs = <<A as PolicyLearner<B>>::InnerPolicy as Policy<B>>::Observation

type PolicyAD = <<A as PolicyLearner<B>>::InnerPolicy as Policy<B>>::ActionDistribution

type PolicyAction = <<A as PolicyLearner<B>>::InnerPolicy as Policy<B>>::Action

type ActionContext = <<A as PolicyLearner<B>>::InnerPolicy as Policy<B>>::ActionContext

type PolicyState = <<A as PolicyLearner<B>>::InnerPolicy as Policy<B>>::PolicyState

type TrainingOutput = <A as PolicyLearner<B>>::TrainContext

type State = <E as Environment>::State

type Action = <E as Environment>::Action

Trait RLComponentsTypes