pub struct PAL<Q> {
pub q_func: Q,
pub alpha: f64,
pub gamma: f64,
}
Expand description
Persistent Advantage Learning
§References
- Bellemare, Marc G., et al. “Increasing the Action Gap: New Operators for Reinforcement Learning.” AAAI. 2016.
Fields§
§q_func: Q
§alpha: f64
§gamma: f64
Trait Implementations§
Source§impl<'m, S, Q> Handler<&'m Transition<S, usize>> for PAL<Q> where
Q: Enumerable<(&'m S,), Output = Vec<f64>> + Handler<StateActionUpdate<&'m S, usize, f64>>,
<Q as Function<(&'m S,)>>::Output: Index<usize, Output = f64> + IntoIterator,
<<Q as Function<(&'m S,)>>::Output as IntoIterator>::IntoIter: ExactSizeIterator,
impl<'m, S, Q> Handler<&'m Transition<S, usize>> for PAL<Q> where
Q: Enumerable<(&'m S,), Output = Vec<f64>> + Handler<StateActionUpdate<&'m S, usize, f64>>,
<Q as Function<(&'m S,)>>::Output: Index<usize, Output = f64> + IntoIterator,
<<Q as Function<(&'m S,)>>::Output as IntoIterator>::IntoIter: ExactSizeIterator,
type Response = <Q as Handler<StateActionUpdate<&'m S, usize>>>::Response
type Error = <Q as Handler<StateActionUpdate<&'m S, usize>>>::Error
fn handle( &mut self, t: &'m Transition<S, usize>, ) -> Result<Self::Response, Self::Error>
fn handle_unchecked(&mut self, msg: M) -> Self::Response
Source§impl<Q> Parameterised for PAL<Q> where
Q: Parameterised,
impl<Q> Parameterised for PAL<Q> where
Q: Parameterised,
Source§fn weights_dim(&self) -> (usize, usize)
fn weights_dim(&self) -> (usize, usize)
Return the dimensions of the weight matrix.
Source§fn weights_view(&self) -> WeightsView<'_>
fn weights_view(&self) -> WeightsView<'_>
Return a read-only view of the weights.
Source§fn weights_view_mut(&mut self) -> WeightsViewMut<'_>
fn weights_view_mut(&mut self) -> WeightsViewMut<'_>
Return a mutable view of the weights.
fn n_weights(&self) -> usize
Auto Trait Implementations§
impl<Q> Freeze for PAL<Q> where
Q: Freeze,
impl<Q> RefUnwindSafe for PAL<Q> where
Q: RefUnwindSafe,
impl<Q> Send for PAL<Q> where
Q: Send,
impl<Q> Sync for PAL<Q> where
Q: Sync,
impl<Q> Unpin for PAL<Q> where
Q: Unpin,
impl<Q> UnsafeUnpin for PAL<Q> where
Q: UnsafeUnpin,
impl<Q> UnwindSafe for PAL<Q> where
Q: UnwindSafe,
Blanket Implementations§
Source§impl<T> BorrowMut<T> for T where
T: ?Sized,
impl<T> BorrowMut<T> for T where
T: ?Sized,
Source§fn borrow_mut(&mut self) -> &mut T
fn borrow_mut(&mut self) -> &mut T
Mutably borrows from an owned value. Read more