Struct TrainingSession

Source

pub struct TrainingSession<E: Environment, A> { /* private fields */ }

Expand description

A self-contained, loop-agnostic training coordinator.

TrainingSession wires together a LearningAgent, an optional TrainingRun, and a StatsTracker. It is driven purely by incoming data – it does not own a training loop. Feed it experiences and episode boundaries from wherever your loop lives: a plain for loop, Bevy’s ECS, or anything else.

§Usage

let mut session = TrainingSession::new(agent)
    .with_run(TrainingRun::create("cartpole", "v1")?)
    .with_max_steps(200_000)
    .with_checkpoint_freq(10_000);

// Each environment step:
session.observe(experience);

// Each episode end:
session.on_episode(total_reward, steps, status, env_extras);

if session.is_done() { break; }

TrainingSession

Struct TrainingSession Copy item path

§Usage

Implementations§

impl<E, A> TrainingSession<E, A> where E: Environment, E::Observation: Clone + Send + Sync + 'static, E::Action: Clone + Send + Sync + 'static, A: LearningAgent<E>,

pub fn new(agent: A) -> Self

pub fn with_run(self, run: TrainingRun) -> Self

pub fn with_max_steps(self, n: usize) -> Self

pub fn with_checkpoint_freq(self, freq: usize) -> Self

pub fn with_keep_checkpoints(self, keep: usize) -> Self

pub fn with_stats(self, stats: StatsTracker) -> Self

pub fn act(&mut self, obs: &E::Observation, mode: ActMode) -> E::Action

pub fn observe(&mut self, experience: Experience<E::Observation, E::Action>)

pub fn on_episode( &mut self, total_reward: f64, steps: usize, status: EpisodeStatus, env_extras: HashMap<String, f64>, )

pub fn on_episode_start(&mut self)

pub fn total_steps(&self) -> usize

pub fn steps_per_sec(&self) -> f64

pub fn is_done(&self) -> bool

pub fn on_eval_episode(&self, record: &EpisodeRecord)

pub fn maybe_save_best(&mut self, mean_reward: f64)

pub fn agent(&self) -> &A

pub fn agent_mut(&mut self) -> &mut A

pub fn stats_summary(&self) -> HashMap<String, f64>

pub fn run(&self) -> Option<&TrainingRun>

pub fn into_agent(self) -> A

pub fn eval_report(&self, n_episodes: usize) -> EvalReport

Auto Trait Implementations§

impl<E, A> Freeze for TrainingSession<E, A> where A: Freeze,

impl<E, A> !RefUnwindSafe for TrainingSession<E, A>

impl<E, A> Send for TrainingSession<E, A> where A: Send, E: Send,

impl<E, A> Sync for TrainingSession<E, A> where A: Sync, E: Sync,

impl<E, A> Unpin for TrainingSession<E, A> where A: Unpin, E: Unpin,

impl<E, A> UnsafeUnpin for TrainingSession<E, A> where A: UnsafeUnpin,

impl<E, A> !UnwindSafe for TrainingSession<E, A>

Blanket Implementations§

impl<T> Any for T where T: 'static + ?Sized,

fn type_id(&self) -> TypeId

impl<T> Borrow<T> for T where T: ?Sized,

fn borrow(&self) -> &T

impl<T> BorrowMut<T> for T where T: ?Sized,

fn borrow_mut(&mut self) -> &mut T

impl<T> From<T> for T

fn from(t: T) -> T

impl<T> Instrument for T

fn instrument(self, span: Span) -> Instrumented<Self>

fn in_current_span(self) -> Instrumented<Self>

impl<T, U> Into<U> for T where U: From<T>,

fn into(self) -> U

impl<T> IntoComptime for T

fn comptime(self) -> Self

impl<T> IntoEither for T

fn into_either(self, into_left: bool) -> Either<Self, Self>

fn into_either_with<F>(self, into_left: F) -> Either<Self, Self> where F: FnOnce(&Self) -> bool,

impl<T> Pointable for T

const ALIGN: usize

type Init = T

unsafe fn init(init: <T as Pointable>::Init) -> usize

unsafe fn deref<'a>(ptr: usize) -> &'a T

unsafe fn deref_mut<'a>(ptr: usize) -> &'a mut T

unsafe fn drop(ptr: usize)

impl<T, U> TryFrom<U> for T where U: Into<T>,

type Error = Infallible

fn try_from(value: U) -> Result<T, <T as TryFrom<U>>::Error>

impl<T, U> TryInto<U> for T where U: TryFrom<T>,

type Error = <U as TryFrom<T>>::Error

fn try_into(self) -> Result<U, <U as TryFrom<T>>::Error>

impl<V, T> VZip<V> for T where V: MultiLane<T>,

fn vzip(self) -> V

impl<T> WithSubscriber for T

fn with_subscriber<S>(self, subscriber: S) -> WithDispatch<Self> where S: Into<Dispatch>,

fn with_current_subscriber(self) -> WithDispatch<Self>

Struct TrainingSession

impl<E, A> TrainingSession<E, A>
where E: Environment, E::Observation: Clone + Send + Sync + 'static, E::Action: Clone + Send + Sync + 'static, A: LearningAgent<E>,

impl<E, A> Freeze for TrainingSession<E, A>
where A: Freeze,

impl<E, A> Send for TrainingSession<E, A>
where A: Send, E: Send,

impl<E, A> Sync for TrainingSession<E, A>
where A: Sync, E: Sync,

impl<E, A> Unpin for TrainingSession<E, A>
where A: Unpin, E: Unpin,

impl<E, A> UnsafeUnpin for TrainingSession<E, A>
where A: UnsafeUnpin,

impl<T> Any for T
where T: 'static + ?Sized,

impl<T> Borrow<T> for T
where T: ?Sized,

impl<T> BorrowMut<T> for T
where T: ?Sized,

impl<T, U> Into<U> for T
where U: From<T>,

fn into_either_with<F>(self, into_left: F) -> Either<Self, Self>
where F: FnOnce(&Self) -> bool,

impl<T, U> TryFrom<U> for T
where U: Into<T>,

impl<T, U> TryInto<U> for T
where U: TryFrom<T>,

impl<V, T> VZip<V> for T
where V: MultiLane<T>,

fn with_subscriber<S>(self, subscriber: S) -> WithDispatch<Self>
where S: Into<Dispatch>,