Struct DeterministicPolicy

Source

pub struct DeterministicPolicy { /* private fields */ }

Expand description

Deterministic policy wrapper for DDPG/TD3.

Holds only the action bounds and exploration noise configuration; the network parameters (μ_θ(s)) are managed externally.

Implementations§

Source §

impl DeterministicPolicy

Source

pub fn new(action_dim: usize) -> Self

Create a policy with symmetric action bounds [-1, 1].

Source

pub fn with_bounds(action_dim: usize, action_low: f32, action_high: f32) -> Self

Create a policy with custom action bounds.

Source

pub fn action_dim(&self) -> usize

Number of action dimensions.

Source

pub fn clip_action(&self, action: &[f32]) -> RlResult<Vec<f32>>

Clip action to [action_low, action_high].

§Errors

RlError::DimensionMismatch if action.len() != action_dim.

Source

pub fn exploration_action( &self, action: &[f32], sigma: f32, handle: &mut RlHandle, ) -> RlResult<Vec<f32>>

Add Gaussian exploration noise and clip.

Returns clip(action + N(0, σ²), low, high).

§Errors

RlError::DimensionMismatch if action.len() != action_dim.

Source

pub fn smooth_target_action( &self, action: &[f32], sigma: f32, clip_c: f32, handle: &mut RlHandle, ) -> RlResult<Vec<f32>>

TD3 target policy smoothing: add clipped noise to target actions.

ã = clip(action + clip(N(0, σ²), -c, c), low, high)

§Errors

RlError::DimensionMismatch if action.len() != action_dim.

Trait Implementations§

Source §

impl Clone for DeterministicPolicy

Source §

fn clone(&self) -> DeterministicPolicy

Returns a duplicate of the value. Read more

1.0.0 · Source§

fn clone_from(&mut self, source: &Self)

Performs copy-assignment from source. Read more

Source §

impl Debug for DeterministicPolicy

Source §

fn fmt(&self, f: &mut Formatter<'_>) -> Result

Formats the value using the given formatter. Read more

Auto Trait Implementations§

§

impl UnwindSafe for DeterministicPolicy

Blanket Implementations§

Source §

impl<T> Any for T
where T: 'static + ?Sized,

Source §

fn type_id(&self) -> TypeId

Gets the TypeId of self. Read more

Source §

impl<T> Borrow<T> for T
where T: ?Sized,

Source §

fn borrow(&self) -> &T

Immutably borrows from an owned value. Read more

Source §

impl<T> BorrowMut<T> for T
where T: ?Sized,

Source §

fn borrow_mut(&mut self) -> &mut T

Mutably borrows from an owned value. Read more

Source §

impl<T> CloneToUninit for T
where T: Clone,

Source §

unsafe fn clone_to_uninit(&self, dest: *mut u8)

🔬This is a nightly-only experimental API. (clone_to_uninit)

Performs copy-assignment from self to dest. Read more

Source §

impl<T> From<T> for T

Source §

fn from(t: T) -> T

Returns the argument unchanged.

Source §

impl<T> Instrument for T

Source §

fn instrument(self, span: Span) -> Instrumented<Self>

Instruments this type with the provided Span, returning an Instrumented wrapper. Read more

Source §

fn in_current_span(self) -> Instrumented<Self>

Instruments this type with the current Span, returning an Instrumented wrapper. Read more

Source §

impl<T, U> Into<U> for T
where U: From<T>,

Source §

fn into(self) -> U

Calls U::from(self).

That is, this conversion is whatever the implementation of From<T> for U chooses to do.

Source §

impl<T> ToOwned for T
where T: Clone,

Source §

type Owned = T

The resulting type after obtaining ownership.

Source §

fn to_owned(&self) -> T

Creates owned data from borrowed data, usually by cloning. Read more

Source §

fn clone_into(&self, target: &mut T)

Uses borrowed data to replace owned data, usually by cloning. Read more

Source §

impl<T, U> TryFrom<U> for T
where U: Into<T>,

Source §

type Error = Infallible

The type returned in the event of a conversion error.

Source §

fn try_from(value: U) -> Result<T, <T as TryFrom<U>>::Error>

Performs the conversion.

Source §

impl<T, U> TryInto<U> for T
where U: TryFrom<T>,

Source §

type Error = <U as TryFrom<T>>::Error

The type returned in the event of a conversion error.

Source §

fn try_into(self) -> Result<U, <U as TryFrom<T>>::Error>

Performs the conversion.

Source §

impl<T> WithSubscriber for T

Source §

fn with_subscriber<S>(self, subscriber: S) -> WithDispatch<Self>
where S: Into<Dispatch>,

Attaches the provided Subscriber to this type, returning a WithDispatch wrapper. Read more

Source §

fn with_current_subscriber(self) -> WithDispatch<Self>

Attaches the current default Subscriber to this type, returning a WithDispatch wrapper. Read more

Struct DeterministicPolicy Copy item path

Implementations§

impl DeterministicPolicy

pub fn new(action_dim: usize) -> Self

pub fn with_bounds(action_dim: usize, action_low: f32, action_high: f32) -> Self

pub fn action_dim(&self) -> usize

pub fn clip_action(&self, action: &[f32]) -> RlResult<Vec<f32>>

§Errors

pub fn exploration_action( &self, action: &[f32], sigma: f32, handle: &mut RlHandle, ) -> RlResult<Vec<f32>>

§Errors

pub fn smooth_target_action( &self, action: &[f32], sigma: f32, clip_c: f32, handle: &mut RlHandle, ) -> RlResult<Vec<f32>>

§Errors

Trait Implementations§

impl Clone for DeterministicPolicy

fn clone(&self) -> DeterministicPolicy

fn clone_from(&mut self, source: &Self)

impl Debug for DeterministicPolicy

fn fmt(&self, f: &mut Formatter<'_>) -> Result

Auto Trait Implementations§

impl Freeze for DeterministicPolicy

impl RefUnwindSafe for DeterministicPolicy

impl Send for DeterministicPolicy

impl Sync for DeterministicPolicy

impl Unpin for DeterministicPolicy

impl UnsafeUnpin for DeterministicPolicy

impl UnwindSafe for DeterministicPolicy

Blanket Implementations§

impl<T> Any for T where T: 'static + ?Sized,

fn type_id(&self) -> TypeId

impl<T> Borrow<T> for T where T: ?Sized,

fn borrow(&self) -> &T

impl<T> BorrowMut<T> for T where T: ?Sized,

fn borrow_mut(&mut self) -> &mut T

impl<T> CloneToUninit for T where T: Clone,

unsafe fn clone_to_uninit(&self, dest: *mut u8)

impl<T> From<T> for T

fn from(t: T) -> T

impl<T> Instrument for T

fn instrument(self, span: Span) -> Instrumented<Self>

fn in_current_span(self) -> Instrumented<Self>

impl<T, U> Into<U> for T where U: From<T>,

fn into(self) -> U

impl<T> ToOwned for T where T: Clone,

type Owned = T

fn to_owned(&self) -> T

fn clone_into(&self, target: &mut T)

impl<T, U> TryFrom<U> for T where U: Into<T>,

type Error = Infallible

fn try_from(value: U) -> Result<T, <T as TryFrom<U>>::Error>

impl<T, U> TryInto<U> for T where U: TryFrom<T>,

type Error = <U as TryFrom<T>>::Error

fn try_into(self) -> Result<U, <U as TryFrom<T>>::Error>

impl<T> WithSubscriber for T

fn with_subscriber<S>(self, subscriber: S) -> WithDispatch<Self> where S: Into<Dispatch>,

fn with_current_subscriber(self) -> WithDispatch<Self>

Struct DeterministicPolicy

impl<T> Any for T
where T: 'static + ?Sized,

impl<T> Borrow<T> for T
where T: ?Sized,

impl<T> BorrowMut<T> for T
where T: ?Sized,

impl<T> CloneToUninit for T
where T: Clone,

impl<T, U> Into<U> for T
where U: From<T>,

impl<T> ToOwned for T
where T: Clone,

impl<T, U> TryFrom<U> for T
where U: Into<T>,

impl<T, U> TryInto<U> for T
where U: TryFrom<T>,

fn with_subscriber<S>(self, subscriber: S) -> WithDispatch<Self>
where S: Into<Dispatch>,