//! Return and advantage estimators for on-policy and off-policy RL algorithms.
//!
//! * [`crate::estimator::compute_gae`] — Generalized Advantage Estimation (PPO, A3C)
//! * [`crate::estimator::compute_td_lambda`] — TD(λ) multi-step returns
//! * [`crate::estimator::compute_vtrace`] — V-trace off-policy correction (IMPALA)
//! * [`crate::estimator::compute_retrace`] — Retrace(λ) safe off-policy returns
pub use ;
pub use ;
pub use ;
pub use ;