cano 0.14.0 - Docs.rs

//! # PollTask — Wait-Until Processing Model
//!
//! A [`PollTask`] repeatedly calls `poll()` until it returns [`PollOutcome::Ready`] or until an
//! optional wall-clock timeout is exceeded. This "wait-until" pattern is the canonical way
//! to poll an external system for completion without blocking a thread.
//!
//! ## When to use `PollTask`
//!
//! - **Waiting for external jobs**: poll a job queue or long-running API until it finishes.
//! - **Adaptive backoff without retries**: the loop *is* the resilience mechanism, so the
//!   default `TaskConfig` is [`TaskConfig::minimal()`] (no outer retry wrapping).
//! - **Condition checks**: loop until a database row exists, a flag flips, etc.
//!
//! Every [`PollTask`] automatically implements [`Task`](crate::task::Task) via a
//! per-impl-site companion `impl Task<S> for T` emitted by the `#[task::poll]` macro.
//! This means you can register a `PollTask` with
//! [`Workflow::register`](crate::workflow::Workflow::register) exactly like any other task.
//!
//! ## Quick Start
//!
//! ```rust
//! use cano::prelude::*;
//! use std::sync::atomic::{AtomicU32, Ordering};
//! use std::sync::Arc;
//!
//! #[derive(Debug, Clone, PartialEq, Eq, Hash)]
//! enum Step { Wait, Done }
//!
//! struct Counter(Arc<AtomicU32>);
//!
//! #[task::poll(state = Step)]
//! impl Counter {
//!     async fn poll(&self, _res: &Resources) -> Result<PollOutcome<Step>, CanoError> {
//!         let n = self.0.fetch_add(1, Ordering::Relaxed);
//!         if n >= 2 {
//!             Ok(PollOutcome::Ready(TaskResult::Single(Step::Done)))
//!         } else {
//!             Ok(PollOutcome::Pending { delay_ms: 0 })
//!         }
//!     }
//! }
//!
//! # #[tokio::main]
//! # async fn main() -> Result<(), CanoError> {
//! let counter = Counter(Arc::new(AtomicU32::new(0)));
//! let workflow = Workflow::bare()
//!     .register(Step::Wait, counter)
//!     .add_exit_state(Step::Done);
//!
//! let result = workflow.orchestrate(Step::Wait).await?;
//! assert_eq!(result, Step::Done);
//! # Ok(())
//! # }
//! ```
//!
//! ## Bounding the poll loop by wall-clock time
//!
//! There is no built-in poll-count limit. To cap total wall-clock time, return a
//! [`TaskConfig`] with an `attempt_timeout` from [`PollTask::config`]:
//!
//! ```rust
//! use cano::prelude::*;
//! use std::time::Duration;
//!
//! #[derive(Debug, Clone, PartialEq, Eq, Hash)]
//! enum Step { Wait, Done }
//!
//! struct BoundedPoller;
//!
//! #[task::poll(state = Step)]
//! impl BoundedPoller {
//!     fn config(&self) -> TaskConfig {
//!         TaskConfig::minimal().with_attempt_timeout(Duration::from_secs(30))
//!     }
//!
//!     async fn poll(&self, _res: &Resources) -> Result<PollOutcome<Step>, CanoError> {
//!         Ok(PollOutcome::Pending { delay_ms: 100 })
//!     }
//! }
//! ```
//!
//! The timeout is enforced by the workflow engine when the task is dispatched via
//! [`Workflow::orchestrate`](crate::workflow::Workflow::orchestrate). If the entire
//! poll loop does not complete within the timeout, the workflow receives
//! [`CanoError::Timeout`].
//!
//! ## The trait-impl form
//!
//! You can also write the full `impl PollTask<S> for T` header explicitly:
//!
//! ```rust
//! use cano::prelude::*;
//!
//! #[derive(Debug, Clone, PartialEq, Eq, Hash)]
//! enum Step { Poll, Done }
//!
//! struct TraitPoller;
//!
//! #[task::poll]
//! impl PollTask<Step> for TraitPoller {
//!     async fn poll(&self, _res: &Resources) -> Result<PollOutcome<Step>, CanoError> {
//!         Ok(PollOutcome::Ready(TaskResult::Single(Step::Done)))
//!     }
//! }
//!
//! # #[tokio::main]
//! # async fn main() -> Result<(), CanoError> {
//! let workflow = Workflow::bare()
//!     .register(Step::Poll, TraitPoller)
//!     .add_exit_state(Step::Done);
//!
//! let result = workflow.orchestrate(Step::Poll).await?;
//! assert_eq!(result, Step::Done);
//! # Ok(())
//! # }
//! ```

use crate::error::CanoError;
use crate::resource::Resources;
use crate::task::{TaskConfig, TaskResult};
use std::borrow::Cow;
use std::fmt;
use std::hash::Hash;

// ---------------------------------------------------------------------------
// PollOutcome<TState> — the outcome of a single poll() call
// ---------------------------------------------------------------------------

/// The outcome returned by a single [`PollTask::poll`] call.
///
/// - [`PollOutcome::Ready`] — the condition is satisfied; carry the `TaskResult` forward to the FSM.
/// - [`PollOutcome::Pending`] — not yet ready; sleep for `delay_ms` milliseconds then poll again.
///
/// This mirrors `std::task::Poll` conceptually but carries workflow-specific data and an
/// explicit sleep duration to decouple the poller from async executor wakeup mechanics.
#[derive(Debug, Clone, PartialEq, Eq)]
pub enum PollOutcome<TState> {
    /// The poll condition is satisfied. The inner [`TaskResult`] is forwarded to the FSM.
    Ready(TaskResult<TState>),
    /// Not yet ready. Sleep `delay_ms` milliseconds before the next poll.
    Pending {
        /// Milliseconds to sleep before the next poll call. Use `0` for no delay.
        delay_ms: u64,
    },
}

// ---------------------------------------------------------------------------
// PollErrorPolicy — what to do when poll() returns Err
// ---------------------------------------------------------------------------

/// Controls how the poll loop responds when [`PollTask::poll`] returns an [`Err`].
///
/// Return a non-default policy from [`PollTask::on_poll_error`] to override the default
/// fail-fast behaviour.
#[derive(Debug, Clone, PartialEq, Eq, Default)]
pub enum PollErrorPolicy {
    /// Propagate the error immediately — the loop stops and the error is returned.
    #[default]
    FailFast,
    /// Log and retry up to `max_errors` consecutive errors before failing.
    RetryOnError {
        /// Maximum number of consecutive errors before the loop fails.
        max_errors: u32,
    },
}

// ---------------------------------------------------------------------------
// PollTask trait
// ---------------------------------------------------------------------------

/// A "wait-until" processing model that repeatedly calls [`poll`](PollTask::poll) until
/// it returns [`PollOutcome::Ready`].
///
/// # Generic Types
///
/// - **`TState`**: The state enum used by the workflow (`Clone + Debug + Send + Sync`).
/// - **`TResourceKey`**: The key type used to look up resources (defaults to
///   [`Cow<'static, str>`]).
///
/// # Default config
///
/// Unlike [`RouterTask`](crate::task::router::RouterTask), `PollTask` defaults to
/// [`TaskConfig::minimal()`] (no retries). The poll loop itself is the resilience
/// mechanism; outer retry wrapping rarely makes sense here.
///
/// # Implementing PollTask
///
/// Prefer the inherent `#[task::poll(state = S)]` form:
///
/// ```rust
/// use cano::prelude::*;
///
/// #[derive(Debug, Clone, PartialEq, Eq, Hash)]
/// enum Step { Wait, Done }
///
/// struct MyPoller;
///
/// #[task::poll(state = Step)]
/// impl MyPoller {
///     async fn poll(&self, _res: &Resources) -> Result<PollOutcome<Step>, CanoError> {
///         Ok(PollOutcome::Ready(TaskResult::Single(Step::Done)))
///     }
/// }
/// ```
#[crate::task::poll]
pub trait PollTask<TState, TResourceKey = Cow<'static, str>>: Send + Sync
where
    TState: Clone + fmt::Debug + Send + Sync + 'static,
    TResourceKey: Hash + Eq + Send + Sync + 'static,
{
    /// Get the task configuration that controls execution behaviour.
    ///
    /// Defaults to [`TaskConfig::minimal()`] (no retries, no timeout). Override to
    /// attach a circuit-breaker or per-attempt timeout if needed.
    fn config(&self) -> TaskConfig {
        TaskConfig::minimal()
    }

    /// Human-readable identifier for this poller, reported to [`WorkflowObserver`] hooks.
    ///
    /// Defaults to [`std::any::type_name`] of the implementing type. Override for a
    /// stable, friendly name.
    ///
    /// [`WorkflowObserver`]: crate::observer::WorkflowObserver
    fn name(&self) -> Cow<'static, str> {
        Cow::Borrowed(std::any::type_name::<Self>())
    }

    /// Policy for handling errors returned by [`poll`](PollTask::poll).
    ///
    /// Defaults to [`PollErrorPolicy::FailFast`] — the first error stops the loop.
    /// Override to tolerate transient errors:
    ///
    /// ```rust
    /// use cano::prelude::*;
    ///
    /// #[derive(Debug, Clone, PartialEq, Eq, Hash)]
    /// enum Step { Wait, Done }
    ///
    /// struct ResilientPoller;
    ///
    /// #[task::poll]
    /// impl PollTask<Step> for ResilientPoller {
    ///     fn on_poll_error(&self) -> PollErrorPolicy {
    ///         PollErrorPolicy::RetryOnError { max_errors: 3 }
    ///     }
    ///     async fn poll(&self, _res: &Resources) -> Result<PollOutcome<Step>, CanoError> {
    ///         Ok(PollOutcome::Ready(TaskResult::Single(Step::Done)))
    ///     }
    /// }
    /// ```
    fn on_poll_error(&self) -> PollErrorPolicy {
        PollErrorPolicy::FailFast
    }

    /// Call once per poll iteration.
    ///
    /// Return [`PollOutcome::Ready`] with the next [`TaskResult`] when the condition is met,
    /// or [`PollOutcome::Pending`] with a sleep duration when it is not yet ready.
    ///
    /// # Errors
    ///
    /// Returns [`CanoError`] on a non-recoverable error. The loop's response to the
    /// error is governed by [`on_poll_error`](PollTask::on_poll_error).
    async fn poll(&self, res: &Resources<TResourceKey>) -> Result<PollOutcome<TState>, CanoError>;
}

// ---------------------------------------------------------------------------
// run_poll_loop — the loop body called by the macro-synthesised Task::run
// ---------------------------------------------------------------------------

/// Run the [`PollTask`] poll loop for `p`.
///
/// The synthesised `Task::run` method emitted by `#[task::poll]` delegates here so
/// that the loop body (which needs `tokio::time::sleep`) lives in a single place that
/// can reference `tokio` directly.
///
/// The loop calls `p.poll(res)` repeatedly:
///
/// - `PollOutcome::Ready(result)` → return `Ok(result)`.
/// - `PollOutcome::Pending { delay_ms }` → reset the consecutive-error counter, sleep
///   `delay_ms` ms, then poll again.
/// - `Err(e)` → consult [`PollTask::on_poll_error`]:
///   - [`PollErrorPolicy::FailFast`] → return `Err(e)` immediately.
///   - [`PollErrorPolicy::RetryOnError { max_errors }`] → increment the consecutive-error
///     counter; if it exceeds `max_errors`, return `Err(e)`; otherwise continue.
///
/// There is no built-in iteration limit. To cap total wall-clock time, return
/// `TaskConfig::minimal().with_attempt_timeout(dur)` from [`PollTask::config`] and
/// dispatch the task via [`Workflow::orchestrate`](crate::workflow::Workflow::orchestrate).
pub async fn run_poll_loop<P, S, K>(p: &P, res: &Resources<K>) -> Result<TaskResult<S>, CanoError>
where
    P: PollTask<S, K> + ?Sized,
    S: Clone + fmt::Debug + Send + Sync + 'static,
    K: Hash + Eq + Send + Sync + 'static,
{
    let policy = p.on_poll_error();
    let mut consecutive_errors: u32 = 0;

    loop {
        match p.poll(res).await {
            Ok(PollOutcome::Ready(result)) => {
                #[cfg(feature = "metrics")]
                crate::metrics::poll_iteration(true);
                return Ok(result);
            }
            Ok(PollOutcome::Pending { delay_ms }) => {
                #[cfg(feature = "metrics")]
                crate::metrics::poll_iteration(false);
                consecutive_errors = 0;
                if delay_ms > 0 {
                    tokio::time::sleep(std::time::Duration::from_millis(delay_ms)).await;
                }
            }
            Err(e) => match &policy {
                PollErrorPolicy::FailFast => return Err(e),
                PollErrorPolicy::RetryOnError { max_errors } => {
                    consecutive_errors += 1;
                    if consecutive_errors > *max_errors {
                        return Err(e);
                    }
                }
            },
        }
    }
}

// ---------------------------------------------------------------------------
// Type aliases
// ---------------------------------------------------------------------------

/// Type alias for a dynamic [`PollTask`] trait object.
pub type DynPollTask<TState, TResourceKey = Cow<'static, str>> =
    dyn PollTask<TState, TResourceKey> + Send + Sync;

/// Type alias for an `Arc`-wrapped dynamic [`PollTask`] trait object.
pub type PollTaskObject<TState, TResourceKey = Cow<'static, str>> =
    std::sync::Arc<DynPollTask<TState, TResourceKey>>;

// ---------------------------------------------------------------------------
// Tests
// ---------------------------------------------------------------------------

#[cfg(test)]
mod tests {
    use super::*;
    use crate::resource::Resources;
    use crate::task;
    use crate::task::Task;
    use std::sync::Arc;
    use std::sync::atomic::{AtomicU32, Ordering};

    // Note: all `#[task::poll]` usages inside the `cano` crate itself use the
    // trait-impl form (`impl PollTask<S> for T`), because the inherent form emits
    // `::cano::PollTask<...>` paths that don't resolve inside this crate. The
    // inherent form is tested in `cano-macros/tests/poll_task_impl.rs` where
    // `::cano` resolves correctly.

    #[derive(Debug, Clone, PartialEq, Eq, Hash)]
    enum Step {
        Wait,
        Done,
        Next,
    }

    // ---------------------------------------------------------------------------
    // (a) PollTask that becomes Ready on the first call
    // ---------------------------------------------------------------------------

    struct ImmediatePoller;

    #[task::poll]
    impl PollTask<Step> for ImmediatePoller {
        async fn poll(&self, _res: &Resources) -> Result<PollOutcome<Step>, CanoError> {
            Ok(PollOutcome::Ready(TaskResult::Single(Step::Done)))
        }
    }

    #[tokio::test]
    async fn test_poll_task_immediate_via_poll() {
        let poller = ImmediatePoller;
        let res = Resources::new();
        let result = PollTask::poll(&poller, &res).await.unwrap();
        assert_eq!(result, PollOutcome::Ready(TaskResult::Single(Step::Done)));
    }

    #[tokio::test]
    async fn test_poll_task_immediate_via_task_run() {
        let poller = ImmediatePoller;
        let res = Resources::new();
        let result = Task::run(&poller, &res).await.unwrap();
        assert_eq!(result, TaskResult::Single(Step::Done));
    }

    // ---------------------------------------------------------------------------
    // (b) PollTask that takes multiple polls before becoming Ready
    // ---------------------------------------------------------------------------

    struct CountingPoller {
        target: u32,
        count: AtomicU32,
    }

    impl CountingPoller {
        fn new(target: u32) -> Self {
            Self {
                target,
                count: AtomicU32::new(0),
            }
        }
    }

    #[task::poll]
    impl PollTask<Step> for CountingPoller {
        async fn poll(&self, _res: &Resources) -> Result<PollOutcome<Step>, CanoError> {
            let n = self.count.fetch_add(1, Ordering::Relaxed) + 1;
            if n >= self.target {
                Ok(PollOutcome::Ready(TaskResult::Single(Step::Done)))
            } else {
                Ok(PollOutcome::Pending { delay_ms: 0 })
            }
        }
    }

    #[tokio::test]
    async fn test_poll_task_multiple_polls() {
        let poller = CountingPoller::new(3);
        let res = Resources::new();
        let result = Task::run(&poller, &res).await.unwrap();
        assert_eq!(result, TaskResult::Single(Step::Done));
        assert_eq!(poller.count.load(Ordering::Relaxed), 3);
    }

    // ---------------------------------------------------------------------------
    // (c) Poll error propagates immediately
    // ---------------------------------------------------------------------------

    struct ErrorPoller;

    #[task::poll]
    impl PollTask<Step> for ErrorPoller {
        async fn poll(&self, _res: &Resources) -> Result<PollOutcome<Step>, CanoError> {
            Err(CanoError::task_execution("poll failed"))
        }
    }

    #[tokio::test]
    async fn test_poll_task_error_propagates() {
        let poller = ErrorPoller;
        let res = Resources::new();
        let err = Task::run(&poller, &res).await.unwrap_err();
        assert!(matches!(err, CanoError::TaskExecution(_)));
    }

    // ---------------------------------------------------------------------------
    // (d) PollTask returning Split
    // ---------------------------------------------------------------------------

    struct SplitPoller;

    #[task::poll]
    impl PollTask<Step> for SplitPoller {
        async fn poll(&self, _res: &Resources) -> Result<PollOutcome<Step>, CanoError> {
            Ok(PollOutcome::Ready(TaskResult::Split(vec![
                Step::Wait,
                Step::Next,
            ])))
        }
    }

    #[tokio::test]
    async fn test_poll_task_split() {
        let poller = SplitPoller;
        let res = Resources::new();
        let result = Task::run(&poller, &res).await.unwrap();
        assert_eq!(result, TaskResult::Split(vec![Step::Wait, Step::Next]));
    }

    // ---------------------------------------------------------------------------
    // (e) Config + name overrides
    // ---------------------------------------------------------------------------

    struct CustomPoller;

    #[task::poll]
    impl PollTask<Step> for CustomPoller {
        fn config(&self) -> TaskConfig {
            TaskConfig::minimal()
        }
        fn name(&self) -> Cow<'static, str> {
            Cow::Borrowed("my-custom-poller")
        }
        async fn poll(&self, _res: &Resources) -> Result<PollOutcome<Step>, CanoError> {
            Ok(PollOutcome::Ready(TaskResult::Single(Step::Done)))
        }
    }

    #[test]
    fn test_poll_task_config_override() {
        let poller = CustomPoller;
        assert_eq!(
            PollTask::<Step>::config(&poller).retry_mode.max_attempts(),
            1
        );
    }

    #[test]
    fn test_poll_task_name_override() {
        let poller = CustomPoller;
        assert_eq!(PollTask::<Step>::name(&poller), "my-custom-poller");
    }

    #[test]
    fn test_companion_task_forwards_config_and_name() {
        let poller = CustomPoller;
        assert_eq!(Task::config(&poller).retry_mode.max_attempts(), 1);
        assert_eq!(Task::name(&poller), "my-custom-poller");
    }

    // ---------------------------------------------------------------------------
    // (f) Default config is minimal (no retries)
    // ---------------------------------------------------------------------------

    struct DefaultConfigPoller;

    #[task::poll]
    impl PollTask<Step> for DefaultConfigPoller {
        async fn poll(&self, _res: &Resources) -> Result<PollOutcome<Step>, CanoError> {
            Ok(PollOutcome::Ready(TaskResult::Single(Step::Done)))
        }
    }

    #[test]
    fn test_poll_task_default_config_is_minimal() {
        let poller = DefaultConfigPoller;
        assert_eq!(
            PollTask::<Step>::config(&poller).retry_mode.max_attempts(),
            1,
            "PollTask default config must be minimal (no retries)"
        );
    }

    #[test]
    fn test_poll_task_default_name_contains_type_name() {
        let poller = DefaultConfigPoller;
        let name = PollTask::<Step>::name(&poller);
        assert!(
            name.contains("DefaultConfigPoller"),
            "default name should contain the type name, got: {name}",
        );
    }

    // ---------------------------------------------------------------------------
    // (g) Dynamic dispatch: Arc<dyn Task<S>>
    // ---------------------------------------------------------------------------

    #[tokio::test]
    async fn test_poll_task_as_dyn_task() {
        let poller: Arc<dyn Task<Step>> = Arc::new(ImmediatePoller);
        let res = Resources::new();
        let result = Task::run(poller.as_ref(), &res).await.unwrap();
        assert_eq!(result, TaskResult::Single(Step::Done));
    }

    // ---------------------------------------------------------------------------
    // (h) Workflow integration
    // ---------------------------------------------------------------------------

    #[tokio::test]
    async fn test_poll_task_in_workflow() {
        use crate::workflow::Workflow;

        struct NextTask;

        #[task]
        impl Task<Step> for NextTask {
            async fn run_bare(&self) -> Result<TaskResult<Step>, CanoError> {
                Ok(TaskResult::Single(Step::Done))
            }
        }

        let poller = CountingPoller::new(2);

        let workflow = Workflow::bare()
            .register(Step::Wait, poller)
            .register(Step::Next, NextTask)
            .add_exit_state(Step::Done);

        // CountingPoller::new(2) -> first poll returns Pending, second returns Ready(Next)
        // But wait: poll 1 => count becomes 1, 1 < 2 => Pending; poll 2 => count becomes 2, 2 >= 2 => Ready(Done)
        // But we registered Step::Done as exit state so Done is the final state
        // Actually CountingPoller returns Single(Step::Done) when ready, so we skip Next entirely
        let result = workflow.orchestrate(Step::Wait).await.unwrap();
        assert_eq!(result, Step::Done);
    }

    // ---------------------------------------------------------------------------
    // (i) run_poll_loop with dyn PollTask (?Sized)
    // ---------------------------------------------------------------------------

    #[tokio::test]
    async fn test_run_poll_loop_dyn_dispatch() {
        let poller: &dyn PollTask<Step> = &ImmediatePoller;
        let res = Resources::new();
        let result = run_poll_loop(poller, &res).await.unwrap();
        assert_eq!(result, TaskResult::Single(Step::Done));
    }

    // ---------------------------------------------------------------------------
    // (j) PollErrorPolicy — RetryOnError succeeds when errors < max_errors
    // ---------------------------------------------------------------------------

    // Emits `count` errors then PollOutcome::Ready.
    struct ErrorThenReadyPoller {
        errors_before_ready: u32,
        count: AtomicU32,
    }

    impl ErrorThenReadyPoller {
        fn new(errors_before_ready: u32) -> Self {
            Self {
                errors_before_ready,
                count: AtomicU32::new(0),
            }
        }
    }

    #[task::poll]
    impl PollTask<Step> for ErrorThenReadyPoller {
        fn on_poll_error(&self) -> PollErrorPolicy {
            PollErrorPolicy::RetryOnError { max_errors: 2 }
        }

        async fn poll(&self, _res: &Resources) -> Result<PollOutcome<Step>, CanoError> {
            let n = self.count.fetch_add(1, Ordering::Relaxed);
            if n < self.errors_before_ready {
                Err(CanoError::task_execution("transient"))
            } else {
                Ok(PollOutcome::Ready(TaskResult::Single(Step::Done)))
            }
        }
    }

    #[tokio::test]
    async fn test_retry_on_error_within_budget_succeeds() {
        // 2 errors then Ready — max_errors = 2 so both errors are tolerated.
        let poller = ErrorThenReadyPoller::new(2);
        let res = Resources::new();
        let result = Task::run(&poller, &res).await.unwrap();
        assert_eq!(result, TaskResult::Single(Step::Done));
        assert_eq!(poller.count.load(Ordering::Relaxed), 3); // 2 errors + 1 Ready
    }

    // ---------------------------------------------------------------------------
    // (k) PollErrorPolicy — RetryOnError fails when consecutive errors exceed max
    // ---------------------------------------------------------------------------

    #[tokio::test]
    async fn test_retry_on_error_exceeds_budget_fails() {
        // 3 consecutive errors with max_errors = 2 → should fail on the 3rd error.
        let poller = ErrorThenReadyPoller::new(3);
        let res = Resources::new();
        let err = Task::run(&poller, &res).await.unwrap_err();
        assert!(matches!(err, CanoError::TaskExecution(_)));
        // poll called exactly 3 times: errors 1, 2, 3 (third exceeds max_errors=2)
        assert_eq!(poller.count.load(Ordering::Relaxed), 3);
    }

    // ---------------------------------------------------------------------------
    // (l) PollErrorPolicy — Pending resets the consecutive-error counter
    // ---------------------------------------------------------------------------

    // Sequence: error → Pending → error → Ready (Pending resets counter)
    struct ErrorPendingErrorReadyPoller {
        count: AtomicU32,
    }

    impl ErrorPendingErrorReadyPoller {
        fn new() -> Self {
            Self {
                count: AtomicU32::new(0),
            }
        }
    }

    #[task::poll]
    impl PollTask<Step> for ErrorPendingErrorReadyPoller {
        fn on_poll_error(&self) -> PollErrorPolicy {
            PollErrorPolicy::RetryOnError { max_errors: 1 }
        }

        async fn poll(&self, _res: &Resources) -> Result<PollOutcome<Step>, CanoError> {
            match self.count.fetch_add(1, Ordering::Relaxed) {
                0 => Err(CanoError::task_execution("first error")),
                1 => Ok(PollOutcome::Pending { delay_ms: 0 }),
                2 => Err(CanoError::task_execution("second error after reset")),
                _ => Ok(PollOutcome::Ready(TaskResult::Single(Step::Done))),
            }
        }
    }

    #[tokio::test]
    async fn test_retry_on_error_pending_resets_counter() {
        // error(1) → Pending resets → error(1) → Ready: should succeed, 4 polls
        let poller = ErrorPendingErrorReadyPoller::new();
        let res = Resources::new();
        let result = Task::run(&poller, &res).await.unwrap();
        assert_eq!(result, TaskResult::Single(Step::Done));
        assert_eq!(poller.count.load(Ordering::Relaxed), 4);
    }

    // ---------------------------------------------------------------------------
    // (m) Default on_poll_error is FailFast
    // ---------------------------------------------------------------------------

    #[tokio::test]
    async fn test_default_on_poll_error_is_fail_fast() {
        // ErrorPoller has no on_poll_error override — default is FailFast.
        // First error should propagate immediately (1 poll call).
        let poller = ErrorPoller;
        let res = Resources::new();
        let err = Task::run(&poller, &res).await.unwrap_err();
        assert!(matches!(err, CanoError::TaskExecution(_)));
        // Verify the default method itself
        assert_eq!(
            PollTask::<Step>::on_poll_error(&poller),
            PollErrorPolicy::FailFast
        );
    }

    // ---------------------------------------------------------------------------
    // (n) attempt_timeout bounds the poll loop when dispatched via Workflow::orchestrate
    // ---------------------------------------------------------------------------

    struct InfinitePendingPoller;

    #[task::poll]
    impl PollTask<Step> for InfinitePendingPoller {
        fn config(&self) -> TaskConfig {
            TaskConfig::minimal().with_attempt_timeout(std::time::Duration::from_millis(20))
        }

        async fn poll(&self, _res: &Resources) -> Result<PollOutcome<Step>, CanoError> {
            Ok(PollOutcome::Pending { delay_ms: 1 })
        }
    }

    #[tokio::test]
    async fn test_attempt_timeout_bounds_infinite_pending_loop() {
        use crate::workflow::Workflow;

        let workflow = Workflow::bare()
            .register(Step::Wait, InfinitePendingPoller)
            .add_exit_state(Step::Done);

        let start = std::time::Instant::now();
        let err = workflow.orchestrate(Step::Wait).await.unwrap_err();
        let elapsed = start.elapsed();

        // The FSM wraps the failure with state context; `.inner()` peels one layer.
        assert!(
            matches!(err.inner(), CanoError::Timeout(_)),
            "expected CanoError::Timeout, got: {err:?}"
        );
        // Should complete well within 500ms even with scheduling jitter
        assert!(
            elapsed < std::time::Duration::from_millis(500),
            "timeout took too long: {elapsed:?}"
        );
    }
}

#[cfg(all(test, feature = "metrics"))]
mod metrics_tests {
    use super::*;
    use crate::metrics::test_support::*;
    use crate::task::Task;
    use std::sync::Arc;
    use std::sync::atomic::{AtomicU32, Ordering};

    #[derive(Debug, Clone, PartialEq, Eq, Hash)]
    enum St {
        Done,
    }

    // PollTask returning Pending twice then Ready(Single(Done))
    struct TwicePendingPoller {
        count: Arc<AtomicU32>,
    }

    // Use the trait-impl form: inside cano the inherent form emits ::cano:: paths
    // that don't resolve; trait-impl form works everywhere.
    #[crate::task::poll]
    impl PollTask<St> for TwicePendingPoller {
        async fn poll(&self, _res: &Resources) -> Result<PollOutcome<St>, CanoError> {
            let n = self.count.fetch_add(1, Ordering::Relaxed);
            if n < 2 {
                Ok(PollOutcome::Pending { delay_ms: 0 })
            } else {
                Ok(PollOutcome::Ready(TaskResult::Single(St::Done)))
            }
        }
    }

    /// Test via run_poll_loop (the free fn used when registered via Workflow::register
    /// with the inherent macro form, and directly exercising the loop body in poll.rs).
    ///
    /// Note: inside `cano`, the trait-impl form of `#[task::poll]` inlines the loop body
    /// rather than delegating to `run_poll_loop`; so we call `run_poll_loop` directly here.
    /// External callers using the inherent `#[task::poll(state = S)]` form always
    /// delegate to `run_poll_loop`.
    #[test]
    fn poll_iterations_counted_pending_twice_ready_once() {
        let (result, rows) = run_with_recorder(|| async {
            let poller = TwicePendingPoller {
                count: Arc::new(AtomicU32::new(0)),
            };
            let res = crate::resource::Resources::new();
            run_poll_loop(&poller, &res).await
        });
        assert!(result.is_ok(), "poll loop should succeed: {result:?}");
        assert_eq!(
            counter(
                &rows,
                "cano_poll_iterations_total",
                &[("outcome", "pending")]
            ),
            2,
            "expected 2 pending iterations"
        );
        assert_eq!(
            counter(&rows, "cano_poll_iterations_total", &[("outcome", "ready")]),
            1,
            "expected 1 ready iteration"
        );
    }
}