pub struct RLOptimizer { /* private fields */ }
Expand description
Reinforcement Learning optimizer with specialized features
Implementations§
Source§impl RLOptimizer
impl RLOptimizer
pub fn new( policy_lr: f32, value_lr: f32, entropy_coeff: f32, value_loss_coeff: f32, max_grad_norm: f32, ) -> Self
pub fn step_policy( &mut self, params: &mut [Tensor], grads: &[Tensor], ) -> Result<()>
pub fn step_value( &mut self, params: &mut [Tensor], grads: &[Tensor], ) -> Result<()>
Auto Trait Implementations§
impl Freeze for RLOptimizer
impl RefUnwindSafe for RLOptimizer
impl Send for RLOptimizer
impl Sync for RLOptimizer
impl Unpin for RLOptimizer
impl UnwindSafe for RLOptimizer
Blanket Implementations§
Source§impl<T> BorrowMut<T> for T
where
    T: ?Sized,
impl<T> BorrowMut<T> for T
where
    T: ?Sized,
Source§fn borrow_mut(&mut self) -> &mut T
fn borrow_mut(&mut self) -> &mut T
Mutably borrows from an owned value. Read more
Source§impl<T> Instrument for T
impl<T> Instrument for T
Source§fn instrument(self, span: Span) -> Instrumented<Self>
fn instrument(self, span: Span) -> Instrumented<Self>
Source§fn in_current_span(self) -> Instrumented<Self>
fn in_current_span(self) -> Instrumented<Self>
Source§impl<T> IntoEither for T
impl<T> IntoEither for T
Source§fn into_either(self, into_left: bool) -> Either<Self, Self>
fn into_either(self, into_left: bool) -> Either<Self, Self>
Converts self into a Left variant of Either<Self, Self> if into_left is true.
Converts self into a Right variant of Either<Self, Self> otherwise. Read more
Source§fn into_either_with<F>(self, into_left: F) -> Either<Self, Self>
fn into_either_with<F>(self, into_left: F) -> Either<Self, Self>
Converts self into a Left variant of Either<Self, Self> if into_left(&self) returns true.
Converts self into a Right variant of Either<Self, Self> otherwise. Read more