kryst 3.2.1 - Docs.rs

//! Flexible GMRES (FGMRES) over the scalar-generic [`KLinOp`] interface with optional
//! mutable preconditioning support.

#[allow(unused_imports)]
use crate::algebra::blas::{dot_conj, nrm2};
use crate::solver::MonitorCallback;
#[allow(unused_imports)]
use crate::algebra::prelude::*;
use crate::algebra::scalar::{copy_real_to_scalar_in, copy_scalar_to_real_in};
use crate::context::ksp_context::{GmresSpec, ReorthPolicy, Workspace};
use crate::error::KError;
use crate::matrix::op::LinOp;
use crate::ops::klinop::KLinOp;
use crate::ops::kpc::KPreconditioner;
use crate::ops::wrap::{as_s_op, as_s_pc_mut};
use crate::parallel::UniverseComm;
use crate::preconditioner::{PcSide, Preconditioner};
use crate::solver::common::{call_monitors, recompute_true_residual_norm_s, ReductCtx};
use crate::solver::LinearSolver;
#[cfg(feature = "metrics")]
use crate::utils::convergence::SolveMetrics;
use crate::utils::convergence::{ConvergedReason, SolveStats};
use crate::utils::monitor::{
    log_krylov_stagnation, log_residuals, stagnation_detected, ResidualSnapshot,
};
use smallvec::SmallVec;
use std::any::Any;

/// Orthogonalization flavor
#[derive(Clone, Copy, Debug, PartialEq, Eq)]
pub enum Orthog {
    Classical,
    Modified,
}

#[derive(Clone, Copy, Debug, PartialEq, Eq)]
pub enum FgmresVariant {
    Classical,
    Pipelined,
}

pub struct FgmresSolver {
    pub rtol: f64,
    pub atol: f64,
    pub dtol: f64,
    pub maxits: usize,
    pub restart: usize,
    pub orthog: Orthog,
    pub haptol: f64,
    /// If true, size basis/H for maxits; otherwise per-restart sizing.
    pub preallocate: bool,
    /// Optional hook called once per restart (after backsolve) so caller can adapt the PC.
    pub on_restart: Option<Box<dyn FnMut(usize, f64) -> Result<(), KError> + Send + Sync>>,
    /// Whether to treat near-zero residual as a happy breakdown
    pub happy_breakdown: bool,
    pub variant: FgmresVariant,
    /// Strategy for the second orthogonalization pass
    pub reorth: ReorthPolicy,
    /// Threshold used by the "if-needed" reorthogonalization strategy
    pub reorth_tol: f64,
}

impl FgmresSolver {
    pub fn new(rtol: f64, maxits: usize, restart: usize) -> Self {
        Self {
            rtol,
            atol: 1e-12,
            dtol: 1e3,
            maxits,
            restart: restart.max(1),
            orthog: Orthog::Classical,
            haptol: 1e-12,
            preallocate: false,
            on_restart: None,
            happy_breakdown: true,
            variant: FgmresVariant::Classical,
            reorth: ReorthPolicy::IfNeeded,
            reorth_tol: 0.7,
        }
    }

    fn ensure_workspace(&self, w: &mut Workspace, n: usize, m: usize) {
        w.acquire_gmres(GmresSpec {
            n,
            m,
            need_z: true,
            block_s: 0,
        });
    }

    // legacy helpers for in-place Givens rotations removed; Workspace now handles
    // orthogonalization and updating of the Hessenberg system.

    #[allow(clippy::too_many_arguments)]
    pub fn solve_k<A>(
        &mut self,
        a: &A,
        mut pc: Option<&mut dyn KPreconditioner<Scalar = S>>,
        b: &[S],
        x: &mut [S],
        pc_side: PcSide,
        comm: &UniverseComm,
        monitors: Option<&[Box<MonitorCallback<R>>]>,
        work: Option<&mut Workspace>,
    ) -> Result<SolveStats<R>, KError>
    where
        A: KLinOp<Scalar = S> + ?Sized,
    {
        let (m, n) = a.dims();
        if m != n {
            return Err(KError::InvalidInput(
                "FGMRES requires a square operator".to_string(),
            ));
        }
        if b.len() != n || x.len() != n {
            return Err(KError::InvalidInput(
                "FGMRES: vector size mismatch".to_string(),
            ));
        }

        let pc_apply_side = match pc_side {
            PcSide::Right => PcSide::Right,
            PcSide::Left | PcSide::Symmetric => PcSide::Right,
        };

        let block_m = if self.preallocate {
            self.restart.min(self.maxits)
        } else {
            self.restart
        };

        let mut owned_ws;
        let ws = if let Some(w) = work {
            w
        } else {
            owned_ws = Workspace::new(n);
            &mut owned_ws
        };
        self.ensure_workspace(ws, n, block_m);
        let red = ReductCtx::new(comm, Some(&*ws));

        let mons = monitors.unwrap_or(&[]);
        #[cfg(feature = "metrics")]
        let mut metrics = SolveMetrics::default();

        #[cfg(feature = "metrics")]
        let matvec_start = std::time::Instant::now();
        a.matvec_s(x, &mut ws.tmp1[..n], &mut ws.bridge);
        #[cfg(feature = "metrics")]
        {
            metrics.matvec_nanos += matvec_start.elapsed().as_nanos() as u64;
        }
        for i in 0..n {
            ws.tmp1[i] = b[i] - ws.tmp1[i];
        }

        let mut norms = [R::zero(); 2];
        red.norm2_many_into(&[&ws.tmp1[..n], b], &mut norms);
        #[cfg(feature = "metrics")]
        {
            metrics.bytes_reduced += 2 * std::mem::size_of::<R>();
        }
        let mut beta0 = norms[0];
        let bnorm = norms[1].max(1e-32);
        let thr = self.atol.max(self.rtol * bnorm);

        ws.h_mem.fill(S::zero());
        ws.cs.fill(R::default());
        ws.sn.fill(S::zero());
        ws.g.fill(S::zero());
        ws.g[0] = S::from_real(beta0);

        if beta0 > R::default() {
            let inv = S::from_real(1.0 / beta0);
            for (dst, &src) in ws.tmp2[..n].iter_mut().zip(&ws.tmp1[..n]) {
                *dst = src * inv;
            }
            ws.copy_tmp2_into_vcol(0);
        } else {
            ws.v_col(0).fill(S::zero());
        }

        let mut total_iters = 0usize;
        let mut res = beta0;
        let mut stats = SolveStats::new(0, res, ConvergedReason::Continued);
        let red_engine = ws
            .reduction_engine()
            .cloned()
            .unwrap_or_else(|| comm.reduction_engine(ws.reduction_options()));
        let mut pipeline_reductions = 0usize;
        let start_reduct = crate::utils::reduction::test_hooks::wait_counters();

        if call_monitors(mons, 0, res, pipeline_reductions) {
            let counters = crate::utils::convergence::SolverCounters {
                num_global_reductions: pipeline_reductions,
                residual_replacements: 0,
            };
            return Ok(
                SolveStats::new(0, res, ConvergedReason::StoppedByMonitor)
                    .with_counters(counters),
            );
        }
        let true_res = recompute_true_residual_norm_s(
            a,
            b,
            x,
            comm,
            red.engine(),
            &mut ws.tmp1[..n],
            &mut ws.bridge,
        );
        let precond_res = if let Some(pc) = pc.as_deref_mut() {
            pc.apply_mut_s(
                pc_apply_side,
                &ws.tmp1[..n],
                &mut ws.tmp2[..n],
                &mut ws.bridge,
            )?;
            red.norm2(&ws.tmp2[..n])
        } else {
            red.norm2(&ws.tmp1[..n])
        };
        log_residuals(
            0,
            "FGMRES",
            ResidualSnapshot {
                true_residual: true_res,
                preconditioned_residual: precond_res,
                recurrence_residual: Some(res),
            },
        );
        if res <= thr {
            stats.final_residual = res;
            stats.reason = if res <= self.atol {
                ConvergedReason::ConvergedAtol
            } else {
                ConvergedReason::ConvergedRtol
            };
            let true_res = recompute_true_residual_norm_s(
                a,
                b,
                x,
                comm,
                red.engine(),
                &mut ws.tmp1[..n],
                &mut ws.bridge,
            );
            stats.final_residual = true_res;
            let end_reduct = crate::utils::reduction::test_hooks::wait_counters();
            let reductions =
                end_reduct.0 + end_reduct.1 - start_reduct.0 - start_reduct.1 + pipeline_reductions;
            let counters = crate::utils::convergence::SolverCounters {
                num_global_reductions: reductions,
                residual_replacements: 0,
            };
            let mut stats = stats.with_counters(counters);
            #[cfg(feature = "metrics")]
            {
                metrics.reductions = reductions;
                stats.metrics = metrics;
            }
            return Ok(stats);
        }

        let mut stagnation_residuals: Vec<R> = Vec::with_capacity(6);
        let stagnation_threshold = S::from_real(0.95).real();

        while total_iters < self.maxits {
            let m_this = if self.preallocate {
                block_m.min(self.maxits - total_iters)
            } else {
                self.restart.min(self.maxits - total_iters)
            };

            let mut arnoldi_steps = 0usize;
            let mut converged = false;

            for j in 0..m_this {
                match self.variant {
                    FgmresVariant::Classical => {
                        let base = j * n;
                        ws.tmp1[..n].copy_from_slice(&ws.v_mem[base..base + n]);
                        if let Some(pc_ref) = pc.as_deref_mut() {
                            #[cfg(feature = "metrics")]
                            let pc_start = std::time::Instant::now();
                            pc_ref.apply_mut_s(
                                pc_apply_side,
                                &ws.tmp1[..n],
                                &mut ws.tmp2[..n],
                                &mut ws.bridge,
                            )?;
                            #[cfg(feature = "metrics")]
                            {
                                metrics.pc_apply_nanos += pc_start.elapsed().as_nanos() as u64;
                            }
                            ws.z_mem[base..base + n].copy_from_slice(&ws.tmp2[..n]);
                        } else {
                            ws.z_mem[base..base + n].copy_from_slice(&ws.tmp1[..n]);
                        }

                        ws.tmp1[..n].copy_from_slice(&ws.z_mem[base..base + n]);
                        #[cfg(feature = "metrics")]
                        let matvec_start = std::time::Instant::now();
                        a.matvec_s(&ws.tmp1[..n], &mut ws.tmp2[..n], &mut ws.bridge);
                        #[cfg(feature = "metrics")]
                        {
                            metrics.matvec_nanos += matvec_start.elapsed().as_nanos() as u64;
                        }

                        let mut hvals: SmallVec<[S; 32]> = SmallVec::with_capacity(j + 1);
                        hvals.resize(j + 1, S::zero());
                        {
                            let tmp2_slice: &[S] = &ws.tmp2[..n];
                            let mut pairs: SmallVec<[(&[S], &[S]); 32]> =
                                SmallVec::with_capacity(j + 1);
                            for i in 0..=j {
                                let vi = &ws.v_mem[i * n..(i + 1) * n];
                                pairs.push((vi, tmp2_slice));
                            }
                            red.dot_many_into(pairs.as_slice(), hvals.as_mut_slice());
                            #[cfg(feature = "metrics")]
                            {
                                metrics.bytes_reduced += (j + 1) * std::mem::size_of::<R>();
                            }
                        }
                        {
                            let tmp2 = &mut ws.tmp2[..n];
                            for (i, hij) in hvals.iter().copied().enumerate() {
                                let vi = &ws.v_mem[i * n..(i + 1) * n];
                                for (w_i, &vi_val) in tmp2.iter_mut().zip(vi) {
                                    *w_i -= hij * vi_val;
                                }
                            }
                        }
                        if matches!(self.orthog, Orthog::Modified) {
                            let mut corr: SmallVec<[S; 32]> = SmallVec::with_capacity(j + 1);
                            corr.resize(j + 1, S::zero());
                            {
                                let tmp2_slice: &[S] = &ws.tmp2[..n];
                                let mut pairs: SmallVec<[(&[S], &[S]); 32]> =
                                    SmallVec::with_capacity(j + 1);
                                for i in 0..=j {
                                    let vi = &ws.v_mem[i * n..(i + 1) * n];
                                    pairs.push((vi, tmp2_slice));
                                }
                                red.dot_many_into(pairs.as_slice(), corr.as_mut_slice());
                                #[cfg(feature = "metrics")]
                                {
                                    metrics.bytes_reduced += (j + 1) * std::mem::size_of::<R>();
                                }
                            }
                            {
                                let tmp2 = &mut ws.tmp2[..n];
                                for (i, corr_val) in corr.into_iter().enumerate() {
                                    if corr_val.abs() > 1e-12 {
                                        let vi = &ws.v_mem[i * n..(i + 1) * n];
                                        for (w_i, &vi_val) in tmp2.iter_mut().zip(vi) {
                                            *w_i -= corr_val * vi_val;
                                        }
                                        hvals[i] += corr_val;
                                    }
                                }
                            }
                        }
                        for i in 0..=j {
                            *ws.h_at_mut(i, j) = hvals[i];
                        }

                        let hij1 = red.norm2(&ws.tmp2[..n]);
                        #[cfg(feature = "metrics")]
                        {
                            metrics.bytes_reduced += std::mem::size_of::<R>();
                        }
                        *ws.h_at_mut(j + 1, j) = S::from_real(hij1);

                        if hij1 > R::default() {
                            let inv = S::from_real(1.0 / hij1);
                            for val in &mut ws.tmp2[..n] {
                                *val *= inv;
                            }
                            ws.copy_tmp2_into_vcol(j + 1);
                        } else {
                            ws.v_col(j + 1).fill(S::zero());
                        }
                    }
                    FgmresVariant::Pipelined => {
                        let base = j * n;
                        ws.tmp1[..n].copy_from_slice(&ws.v_mem[base..base + n]);
                        if let Some(pc_ref) = pc.as_deref_mut() {
                            #[cfg(feature = "metrics")]
                            let pc_start = std::time::Instant::now();
                            pc_ref.apply_mut_s(
                                pc_apply_side,
                                &ws.tmp1[..n],
                                &mut ws.tmp2[..n],
                                &mut ws.bridge,
                            )?;
                            #[cfg(feature = "metrics")]
                            {
                                metrics.pc_apply_nanos += pc_start.elapsed().as_nanos() as u64;
                            }
                            ws.z_mem[base..base + n].copy_from_slice(&ws.tmp2[..n]);
                        } else {
                            ws.z_mem[base..base + n].copy_from_slice(&ws.tmp1[..n]);
                        }

                        ws.tmp1[..n].copy_from_slice(&ws.z_mem[base..base + n]);
                        #[cfg(feature = "metrics")]
                        let matvec_start = std::time::Instant::now();
                        a.matvec_s(&ws.tmp1[..n], &mut ws.tmp2[..n], &mut ws.bridge);
                        #[cfg(feature = "metrics")]
                        {
                            metrics.matvec_nanos += matvec_start.elapsed().as_nanos() as u64;
                        }

                        ws.pipelined_w[..n].copy_from_slice(&ws.tmp2[..n]);
                        let pipe = ws.pipelined_arnoldi_step(
                            j,
                            n,
                            red_engine.as_ref(),
                            self.reorth,
                            self.reorth_tol,
                        )?;
                        let reductions = match pipe {
                            crate::context::ksp_context::PipeReduct::Sync { reductions } => {
                                reductions
                            }
                            crate::context::ksp_context::PipeReduct::Async { handle } => {
                                #[cfg(feature = "metrics")]
                                let wait_start = std::time::Instant::now();
                                let glob = handle.wait();
                                #[cfg(feature = "metrics")]
                                {
                                    metrics.reduction_wait_nanos +=
                                        wait_start.elapsed().as_nanos() as u64;
                                }
                                ws.finish_pipelined_arnoldi(
                                    j,
                                    n,
                                    red_engine.as_ref(),
                                    self.reorth,
                                    self.reorth_tol,
                                    glob,
                                )?
                            }
                        };
                        pipeline_reductions += reductions;
                        #[cfg(feature = "metrics")]
                        {
                            let payload_len = ws.pipelined_payload.len();
                            metrics.bytes_reduced +=
                                payload_len * std::mem::size_of::<R>() * reductions;
                        }
                    }
                }

                ws.apply_prev_givens_to_col(j, j);
                ws.apply_final_givens_and_update_g(j);

                res = ws.g[j + 1].abs();
                total_iters += 1;
                arnoldi_steps = j + 1;

                if call_monitors(mons, total_iters, res, pipeline_reductions) {
                    let counters = crate::utils::convergence::SolverCounters {
                        num_global_reductions: pipeline_reductions,
                        residual_replacements: 0,
                    };
                    return Ok(
                        SolveStats::new(total_iters, res, ConvergedReason::StoppedByMonitor)
                            .with_counters(counters),
                    );
                }
                let true_res = recompute_true_residual_norm_s(
                    a,
                    b,
                    x,
                    comm,
                    red.engine(),
                    &mut ws.tmp1[..n],
                    &mut ws.bridge,
                );
                let precond_res = if let Some(pc) = pc.as_deref_mut() {
                    pc.apply_mut_s(
                        pc_apply_side,
                        &ws.tmp1[..n],
                        &mut ws.tmp2[..n],
                        &mut ws.bridge,
                    )?;
                    red.norm2(&ws.tmp2[..n])
                } else {
                    red.norm2(&ws.tmp1[..n])
                };
                log_residuals(
                    total_iters,
                    "FGMRES",
                    ResidualSnapshot {
                        true_residual: true_res,
                        preconditioned_residual: precond_res,
                        recurrence_residual: Some(res),
                    },
                );

                stagnation_residuals.push(res);
                if stagnation_residuals.len() > 6 {
                    stagnation_residuals.remove(0);
                }
                if stagnation_detected(&stagnation_residuals, stagnation_threshold) {
                    let action = match self.variant {
                        FgmresVariant::Pipelined => {
                            self.variant = FgmresVariant::Classical;
                            "switching to classical restart"
                        }
                        _ => "restarting FGMRES",
                    };
                    log_krylov_stagnation("FGMRES", total_iters, res, action);
                    stagnation_residuals.clear();
                    break;
                }

                let res0 = beta0;
                let (reason, sstats) = crate::utils::convergence::Convergence {
                    rtol: self.rtol,
                    atol: self.atol,
                    dtol: self.dtol,
                    max_iters: self.maxits,
                }
                .check(res, res0, total_iters);
                stats = sstats;
                if matches!(
                    reason,
                    ConvergedReason::ConvergedRtol | ConvergedReason::ConvergedAtol
                ) {
                    stats.final_residual = res;
                    stats.iterations = total_iters;
                    converged = true;
                    break;
                }
            }

            let k = arnoldi_steps;
            let mut y = vec![S::zero(); k];
            for i in (0..k).rev() {
                let mut sum = ws.g[i];
                for l in (i + 1)..k {
                    sum -= ws.h_at(i, l) * y[l];
                }
                y[i] = sum / ws.h_at(i, i);
            }

            for i in 0..k {
                let zi = &ws.z_mem[i * n..(i + 1) * n];
                for (xj, &zij) in x.iter_mut().zip(zi) {
                    *xj += y[i] * zij;
                }
            }

            if converged {
                stats.reason = if res <= self.atol {
                    ConvergedReason::ConvergedAtol
                } else {
                    ConvergedReason::ConvergedRtol
                };
                stats.final_residual = res;
                break;
            }

            if total_iters >= self.maxits {
                break;
            }

            #[cfg(feature = "metrics")]
            let matvec_start = std::time::Instant::now();
            a.matvec_s(x, &mut ws.tmp1[..n], &mut ws.bridge);
            #[cfg(feature = "metrics")]
            {
                metrics.matvec_nanos += matvec_start.elapsed().as_nanos() as u64;
            }
            for i in 0..n {
                ws.tmp1[i] = b[i] - ws.tmp1[i];
            }
            beta0 = red.norm2(&ws.tmp1[..n]);
            #[cfg(feature = "metrics")]
            {
                metrics.bytes_reduced += std::mem::size_of::<R>();
            }

            ws.h_mem.fill(S::zero());
            ws.cs.fill(R::default());
            ws.sn.fill(S::zero());
            ws.g.fill(S::zero());
            ws.g[0] = S::from_real(beta0);
            if beta0 > R::default() {
                let inv = S::from_real(1.0 / beta0);
                for (dst, &src) in ws.tmp2[..n].iter_mut().zip(&ws.tmp1[..n]) {
                    *dst = src * inv;
                }
                ws.copy_tmp2_into_vcol(0);
            } else {
                ws.v_col(0).fill(S::zero());
            }

            if let Some(hook) = self.on_restart.as_mut() {
                hook(total_iters, beta0)?;
            }
            if let Some(pc_ref) = pc.as_deref_mut() {
                pc_ref.on_restart_s(total_iters, beta0)?;
            }
        }

        stats.iterations = total_iters;

        let true_res = recompute_true_residual_norm_s(
            a,
            b,
            x,
            comm,
            red.engine(),
            &mut ws.tmp1[..n],
            &mut ws.bridge,
        );
        stats.final_residual = true_res;

        if matches!(stats.reason, ConvergedReason::Continued) {
            stats.reason = if true_res <= self.atol {
                ConvergedReason::ConvergedAtol
            } else if true_res <= self.rtol * bnorm {
                ConvergedReason::ConvergedRtol
            } else {
                ConvergedReason::DivergedMaxIts
            };
        }
        let end_reduct = crate::utils::reduction::test_hooks::wait_counters();
        let reductions =
            end_reduct.0 + end_reduct.1 - start_reduct.0 - start_reduct.1 + pipeline_reductions;
        let counters = crate::utils::convergence::SolverCounters {
            num_global_reductions: reductions,
            residual_replacements: 0,
        };
        let mut stats = stats.with_counters(counters);
        #[cfg(feature = "metrics")]
        {
            metrics.reductions = reductions;
            stats.metrics = metrics;
        }
        Ok(stats)
    }

    #[allow(clippy::too_many_arguments)]
    pub fn solve_f64(
        &mut self,
        a: &dyn LinOp<S = f64>,
        pc: Option<&mut dyn Preconditioner>,
        b: &[f64],
        x: &mut [f64],
        pc_side: PcSide,
        comm: &UniverseComm,
        monitors: Option<&[Box<MonitorCallback<f64>>]>,
        work: Option<&mut Workspace>,
    ) -> Result<SolveStats<f64>, KError> {
        let (_, n) = a.dims();
        if b.len() != n || x.len() != n {
            return Err(KError::InvalidInput(
                "FGMRES: vector size mismatch".to_string(),
            ));
        }

        let mut x_s = vec![S::zero(); n];
        copy_real_to_scalar_in(x, &mut x_s);
        let mut b_s = vec![S::zero(); n];
        copy_real_to_scalar_in(b, &mut b_s);

        let op = as_s_op(a);
        let mut pc_storage = pc.map(as_s_pc_mut);
        let stats = self.solve_k(
            &op,
            pc_storage
                .as_mut()
                .map(|w| w as &mut dyn KPreconditioner<Scalar = S>),
            &b_s,
            &mut x_s,
            pc_side,
            comm,
            monitors,
            work,
        )?;

        copy_scalar_to_real_in(&x_s, x);
        Ok(stats)
    }
}

impl LinearSolver for FgmresSolver {
    type Error = KError;

    fn as_any_mut(&mut self) -> &mut dyn Any {
        self
    }

    fn setup_workspace(&mut self, w: &mut Workspace) {
        // Pre-size the GMRES-family buffers during KSP setup using the workspace dimension.
        // FGMRES uses right-preconditioned Arnoldi; left/symmetric inputs map to right.
        let n = w.n();
        if n == 0 {
            return;
        }
        self.ensure_workspace(w, n, self.restart);
    }

    fn solve(
        &mut self,
        a: &dyn LinOp<S = f64>,
        pc: Option<&mut dyn Preconditioner>,
        b: &[f64],
        x: &mut [f64],
        pc_side: PcSide,
        comm: &UniverseComm,
        monitors: Option<&[Box<MonitorCallback<f64>>]>,
        work: Option<&mut Workspace>,
    ) -> Result<SolveStats<f64>, Self::Error> {
        self.solve_f64(a, pc, b, x, pc_side, comm, monitors, work)
    }
}

impl FgmresSolver {
    pub fn set_restart(&mut self, restart: usize) {
        self.restart = restart.max(1);
    }
    pub fn set_orthog(&mut self, o: Orthog) {
        self.orthog = o;
    }
    pub fn set_reorthog(&mut self, flag: bool) {
        self.reorth = if flag {
            ReorthPolicy::Always
        } else {
            ReorthPolicy::Never
        };
    }

    pub fn set_reorth_policy(&mut self, policy: ReorthPolicy) {
        self.reorth = policy;
    }

    pub fn set_reorth_tol(&mut self, tol: f64) {
        self.reorth_tol = tol.max(0.0);
    }
    pub fn set_happy_breakdown(&mut self, flag: bool) {
        self.happy_breakdown = flag;
    }
    pub fn set_variant(&mut self, variant: FgmresVariant) {
        self.variant = variant;
    }

    #[cfg(test)]
    pub fn debug_config(&self) -> (usize, Orthog, bool, bool) {
        (
            self.restart,
            self.orthog,
            !matches!(self.reorth, ReorthPolicy::Never),
            self.happy_breakdown,
        )
    }
}