d5/d0e/BiCGStabLSolver_8h_source.html

// -*- tab-width: 2; indent-tabs-mode: nil; coding: utf-8-with-signature -*-

//-----------------------------------------------------------------------------

// Copyright 2000-2026 CEA (www.cea.fr) IFPEN (www.ifpenergiesnouvelles.com)

// See the top-level COPYRIGHT file for details.

// SPDX-License-Identifier: Apache-2.0

//-----------------------------------------------------------------------------

/*---------------------------------------------------------------------------*/

/* BiCGStabLSolver.h                                           (C) 2000-2026 */

/*                                                                           */

/* BiCGStab(L) iterative method.                                             */

/*---------------------------------------------------------------------------*/

#ifndef ARCCORE_ALINA_BICGSTABL_H

#define ARCCORE_ALINA_BICGSTABL_H

/*---------------------------------------------------------------------------*/

/*---------------------------------------------------------------------------*/

/*

 * This file is based on the AMGCL library (version of March 2026),

 * which can be found at https://github.com/ddemidov/amgcl.

 *

 * Copyright (c) 2012-2022 Denis Demidov <dennis.demidov@gmail.com>

 * SPDX-License-Identifier: MIT

 */

/*---------------------------------------------------------------------------*/

/*---------------------------------------------------------------------------*/

/*

 *

 * The code is ported from PETSC BCGSL [1] and is based on [2].

 *

 * [1] http://www.mcs.anl.gov/petsc/petsc-current/docs/manualpages/KSP/KSPBCGSL.html

 * [2] Fokkema, Diederik R. Enhanced implementation of BiCGstab (l) for solving

 *     linear systems of equations. Universiteit Utrecht. Mathematisch Instituut,

 *     1996.


 The original code came with the following license:


 Copyright (c) 1991-2014, UChicago Argonne, LLC and the PETSc Development Team

 All rights reserved.


 Redistribution and use in source and binary forms, with or without modification,

 are permitted provided that the following conditions are met:


 * Redistributions of source code must retain the above copyright notice, this

 list of conditions and the following disclaimer.

 * Redistributions in binary form must reproduce the above copyright notice, this

 list of conditions and the following disclaimer in the documentation and/or

 other materials provided with the distribution.


 THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS" AND

 ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED

 WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE

 DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT HOLDER OR CONTRIBUTORS BE LIABLE FOR

 ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES

 (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES;

 LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON

 ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT

 (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS

 SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.

*/

/*---------------------------------------------------------------------------*/

/*---------------------------------------------------------------------------*/


#include "arccore/alina/ValueTypeInterface.h"

#include "arccore/alina/SolverUtils.h"

#include "arccore/alina/QRFactorizationImpl.h"

#include "arccore/alina/SolverBase.h"


/*---------------------------------------------------------------------------*/

/*---------------------------------------------------------------------------*/


namespace Arcane::Alina

{


/*---------------------------------------------------------------------------*/

/*---------------------------------------------------------------------------*/


/*!
 * \brief Parameters for BiCGStab(L) solver.
 *
 * Every field has a default value; the PropertyTree constructor imports each
 * field by name and rejects any key outside the list passed to
 * check_params(). get() exports the same fields under \p path.
 */
struct BiCGStabLSolverParams
{
  using params = BiCGStabLSolverParams;

  // Order L of the BiCGStab(L) method.
  int L{ 2 };

  // Threshold deciding when the computed residuals are refreshed
  // (the refresh logic is only entered when this value is > 0).
  double delta{ 0.0 };

  // Use a convex function of the MinRes and OR polynomials
  // after the BiCG step instead of the default MinRes.
  bool convex{ true };

  // Side on which the preconditioner is applied (left/right).
  ePreconditionerSideType pside{ ePreconditionerSideType::right };

  // Upper bound on the number of iterations.
  Int32 maxiter{ 100 };

  // Target relative residual error.
  double tol{ 1e-8 };

  // Target absolute residual error.
  double abstol{ std::numeric_limits<double>::min() };

  // Ignore the trivial solution x=0 when rhs is zero.
  bool ns_search{ false };

  // Verbose output (show iterations and error).
  bool verbose{ false };

  BiCGStabLSolverParams() = default;

  // Imports every parameter from the property tree \a p, then validates
  // that \a p only holds the keys listed below.
  BiCGStabLSolverParams(const PropertyTree& p)
  : ARCCORE_ALINA_PARAMS_IMPORT_VALUE(p, L)
  , ARCCORE_ALINA_PARAMS_IMPORT_VALUE(p, delta)
  , ARCCORE_ALINA_PARAMS_IMPORT_VALUE(p, convex)
  , ARCCORE_ALINA_PARAMS_IMPORT_VALUE(p, pside)
  , ARCCORE_ALINA_PARAMS_IMPORT_VALUE(p, maxiter)
  , ARCCORE_ALINA_PARAMS_IMPORT_VALUE(p, tol)
  , ARCCORE_ALINA_PARAMS_IMPORT_VALUE(p, abstol)
  , ARCCORE_ALINA_PARAMS_IMPORT_VALUE(p, ns_search)
  , ARCCORE_ALINA_PARAMS_IMPORT_VALUE(p, verbose)
  {
    p.check_params({ "L", "delta", "convex", "pside", "maxiter", "tol", "abstol", "ns_search", "verbose" });
  }

  // Exports every parameter into the property tree \a p under \a path.
  void get(PropertyTree& p, const std::string& path) const
  {
    ARCCORE_ALINA_PARAMS_EXPORT_VALUE(p, path, L);
    ARCCORE_ALINA_PARAMS_EXPORT_VALUE(p, path, delta);
    ARCCORE_ALINA_PARAMS_EXPORT_VALUE(p, path, convex);
    ARCCORE_ALINA_PARAMS_EXPORT_VALUE(p, path, pside);
    ARCCORE_ALINA_PARAMS_EXPORT_VALUE(p, path, maxiter);
    ARCCORE_ALINA_PARAMS_EXPORT_VALUE(p, path, tol);
    ARCCORE_ALINA_PARAMS_EXPORT_VALUE(p, path, abstol);
    ARCCORE_ALINA_PARAMS_EXPORT_VALUE(p, path, ns_search);
    ARCCORE_ALINA_PARAMS_EXPORT_VALUE(p, path, verbose);
  }
};


/*---------------------------------------------------------------------------*/

/*---------------------------------------------------------------------------*/

/*!
 * \brief BiCGStab(L) method.
 *
 * Iterative solver parameterized by a \a Backend (which provides the vector
 * type, the value type, the backend parameters and create_vector()) and by an
 * \a InnerProduct functor used for every dot product and norm.
 *
 * All work vectors and small dense work arrays are allocated once in the
 * constructor and declared \c mutable so that the const call operators can
 * reuse them. As a consequence the call operators write to shared state of
 * the solver object.
 * NOTE(review): concurrent calls on the same instance therefore look unsafe;
 * confirm against the intended usage.
 */
template <class Backend, class InnerProduct = detail::default_inner_product>


class BiCGStabLSolver

: public SolverBase

{

 public:


  using backend_type = Backend;

  using BackendType = Backend;


  typedef typename Backend::vector vector;

  typedef typename Backend::value_type value_type;

  typedef typename Backend::params backend_params;


  // Scalar type associated with value_type; used for norms and tolerances.
  typedef typename math::scalar_of<value_type>::type scalar_type;


  // Type returned by the inner product of two right-hand-side values; used
  // for all recurrence coefficients (alpha, beta, rho, omega, ...).
  typedef typename math::inner_product_impl<

  typename math::rhs_of<value_type>::type>::return_type coef_type;


  using params = BiCGStabLSolverParams;


  /*!
   * \brief Preallocates necessary data structures for the system of size n.
   *
   * Allocates the four work vectors Rt, X, B and T, the prm.L + 1 vectors of
   * each of R and U, the two (prm.L + 1) x (prm.L + 1) arrays MZa and MZb and
   * the two coefficient arrays Y0 and YL of prm.L + 1 entries.
   *
   * \param n size of the system (number of unknowns).
   * \param prm solver parameters; prm.L must be > 0.
   * \param backend_prm parameters forwarded to Backend::create_vector().
   * \param inner_product functor used for dot products.
   *
   * The check on prm.L is executed in the constructor body, i.e. after the
   * member initializers have already sized R, U, MZa, MZb, Y0 and YL with
   * prm.L + 1.
   */
  BiCGStabLSolver(size_t n,

                  const params& prm = params(),

                  const backend_params& backend_prm = backend_params(),

                  const InnerProduct& inner_product = InnerProduct())

  : prm(prm)

  , n(n)

  , Rt(Backend::create_vector(n, backend_prm))

  , X(Backend::create_vector(n, backend_prm))

  , B(Backend::create_vector(n, backend_prm))

  , T(Backend::create_vector(n, backend_prm))

  , R(prm.L + 1)

  , U(prm.L + 1)

  , MZa(prm.L + 1, prm.L + 1)

  , MZb(prm.L + 1, prm.L + 1)

  , Y0(prm.L + 1)

  , YL(prm.L + 1)

  , inner_product(inner_product)

  {

    precondition(prm.L > 0, "L in BiCGStab(L) should be >=1");


    // R and U were only sized above; allocate the actual backend vectors.
    for (int i = 0; i <= prm.L; ++i) {

      R[i] = Backend::create_vector(n, backend_prm);

      U[i] = Backend::create_vector(n, backend_prm);

    }

  }


  /*!
   * \brief Computes the solution for the given system matrix.
   *
   * Computes the solution for the given system matrix \p A and the
   * right-hand side \p rhs, using \p P as preconditioner on the side
   * selected by prm.pside. The solution vector \p x provides the initial
   * approximation on input and holds the computed solution on output.
   *
   * \return a SolverResult built from the number of iterations made and the
   * achieved residual norm divided by the norm of \p rhs. When the norm of
   * \p rhs is below the trivial-solution threshold and prm.ns_search is
   * false, \p x is cleared and SolverResult(0, norm_rhs) is returned.
   *
   * Iteration stops when the residual norm drops below
   * max(prm.tol * norm_rhs, prm.abstol) or when the iteration counter
   * reaches prm.maxiter. The counter advances by L for each full outer pass.
   *
   * The three precondition() checks report a breakdown when rho, sigma or
   * omega is zero.
   * NOTE(review): precondition() is defined elsewhere; it presumably throws
   * on failure - confirm.
   *
   * The system matrix may differ from the matrix used during
   * initialization. This may be used for the solution of non-stationary
   * problems with slowly changing coefficients. There is a strong chance
   * that a preconditioner built for a time step will act as a reasonably
   * good preconditioner for several subsequent time steps [DeSh12]_.
   */

  template <class Matrix, class Precond, class Vec1, class Vec2>

  SolverResult operator()(const Matrix& A, const Precond& P, const Vec1& rhs, Vec2&& x) const

  {

    static const coef_type one = math::identity<coef_type>();

    static const coef_type zero = math::zero<coef_type>();


    const int L = prm.L;


    // Saves the std::cout formatting flags; they are restored when ss goes
    // out of scope (the verbose output below switches to std::scientific).
    ScopedStreamModifier ss(std::cout);


    scalar_type norm_rhs = norm(rhs);


    // Check if there is a trivial solution: with a (numerically) zero rhs,
    // either keep iterating with a unit reference norm (ns_search) or
    // return x = 0 immediately.
    if (norm_rhs < Alina::detail::eps<scalar_type>(1)) {

      if (prm.ns_search) {

        norm_rhs = math::identity<scalar_type>();

      }

      else {

        backend::clear(x);

        return SolverResult(0, norm_rhs);

      }

    }


    // Initial residual stored in B; with left preconditioning the residual
    // is first computed into T and then passed through P.
    // NOTE(review): backend::residual(rhs, A, x, r) presumably computes
    // r = rhs - A * x - confirm against the backend.
    if (prm.pside == ePreconditionerSideType::left) {

      backend::residual(rhs, A, x, *T);

      P.apply(*T, *B);

    }

    else {

      backend::residual(rhs, A, x, *B);

    }


    // zeta0: norm of the initial residual; eps: absolute stopping threshold.
    scalar_type zeta0 = norm(*B);

    scalar_type eps = std::max(prm.tol * norm_rhs, prm.abstol);


    coef_type alpha = zero;

    coef_type rho0 = one;

    coef_type omega = one;


    // Initial state: R[0] and the shadow residual Rt both start as B, while
    // the correction X and the search direction U[0] start at zero.
    backend::copy(*B, *R[0]);

    backend::copy(*B, *Rt);

    backend::clear(*X);

    backend::clear(*U[0]);


    // zeta tracks the current residual norm; the two rnmax_* values track the
    // largest residual norms seen and are only read by the "accurate update"
    // logic below.
    scalar_type zeta = zeta0;

    scalar_type rnmax_computed = zeta0;

    scalar_type rnmax_true = zeta0;


    size_t iter = 0;

    for (; iter < prm.maxiter && zeta >= eps; iter += L) {

      // BiCG part: L inner steps, each extending the R and U sequences by
      // one more application of the (preconditioned) operator.
      // NOTE(review): the comments below assume backend::axpby(a, x, b, y)
      // computes y = a * x + b * y - confirm against the backend.

      rho0 = -omega * rho0;


      for (int j = 0; j < L; ++j) {

        coef_type rho1 = inner_product(*R[j], *Rt);

        precondition(!math::is_zero(rho1), "BiCGStab(L) breakdown: diverged (zero rho)");


        coef_type beta = alpha * (rho1 / rho0);

        rho0 = rho1;


        // U[i] = R[i] - beta * U[i] for i = 0..j (under the axpby assumption).
        for (int i = 0; i <= j; ++i)

          backend::axpby(one, *R[i], -beta, *U[i]);


        // U[j + 1] receives the preconditioned operator applied to U[j];
        // T is passed as scratch space.
        preconditioner_spmv(prm.pside, P, A, *U[j], *U[j + 1], *T);


        coef_type sigma = inner_product(*U[j + 1], *Rt);

        precondition(!math::is_zero(sigma), "BiCGStab(L) breakdown: diverged (zero sigma)");

        alpha = rho1 / sigma;


        // X += alpha * U[0] (under the axpby assumption).
        backend::axpby(alpha, *U[0], one, *X);


        // R[i] -= alpha * U[i + 1] for i = 0..j (under the axpby assumption).
        for (int i = 0; i <= j; ++i)

          backend::axpby(-alpha, *U[i + 1], one, *R[i]);


        preconditioner_spmv(prm.pside, P, A, *R[j], *R[j + 1], *T);


        zeta = norm(*R[0]);


        rnmax_computed = std::max(zeta, rnmax_computed);

        rnmax_true = std::max(zeta, rnmax_true);


        // Check for early exit: converged in the middle of the BiCG part, so
        // only the j + 1 inner steps actually performed are counted.
        if (zeta < eps) {

          iter += j + 1;

          goto done;

        }

      }


      // Polynomial part: fill the lower triangle of MZa with the inner
      // products of the residual sequence R[0..L].
      for (int i = 0; i <= L; ++i) {

        for (int j = 0; j <= i; ++j) {

          MZa(i, j) = inner_product(*R[i], *R[j]);

        }

      }


      // Symmetrize MZa: each lower-triangle entry (j, i) is replaced by its
      // adjoint and the same value is stored in the upper entry (i, j).
      for (int i = 0; i <= L; ++i) {

        for (int j = i + 1; j <= L; ++j) {

          MZa(i, j) = MZa(j, i) = math::adjoint(MZa(j, i));

        }

      }


      // MZb keeps a copy of MZa; MZa is handed to qr.solve() below, MZb is
      // used for the right-hand sides and for the quadratic forms.
      std::copy(MZa.data(), MZa.data() + MZa.size(), MZb.data());


      // NOTE(review): qr.solve() is defined elsewhere. From the call sites it
      // takes a row/column count, the two strides of MZa, the sub-matrix
      // starting at MZa(1, 1), a right-hand side taken from MZb and an output
      // pointer; the optional last flag presumably reuses the previously
      // computed factorization - confirm.
      if (prm.convex || L == 1) {

        Y0[0] = -one;


        qr.solve(L, L, MZa.stride(0), MZa.stride(1),

                 &MZa(1, 1), &MZb(0, 1), &Y0[1]);

      }

      else {

        // Two solves on the (L - 1) x (L - 1) inner system: Y0 with fixed
        // ends (-1, 0) and YL with fixed ends (0, -1).
        Y0[0] = -one;

        Y0[L] = zero;

        qr.solve(L - 1, L - 1, MZa.stride(0), MZa.stride(1),

                 &MZa(1, 1), &MZb(0, 1), &Y0[1]);


        YL[0] = zero;

        YL[L] = -one;

        qr.solve(L - 1, L - 1, MZa.stride(0), MZa.stride(1),

                 &MZa(1, 1), &MZb(L, 1), &YL[1], /*computed=*/true);


        // Quadratic forms with MZb: dot0 = Y0.(MZb Y0), dotA = YL.(MZb Y0),
        // dot1 = YL.(MZb YL).
        coef_type dot0 = zero;

        coef_type dot1 = zero;

        coef_type dotA = zero;

        for (int i = 0; i <= L; ++i) {

          coef_type s0 = zero;

          coef_type sL = zero;


          for (int j = 0; j <= L; ++j) {

            coef_type M = MZb(i, j);

            s0 += M * Y0[j];

            sL += M * YL[j];

          }


          dot0 += Y0[i] * s0;

          dotA += YL[i] * s0;

          dot1 += YL[i] * sL;

        }


        scalar_type kappa0 = sqrt(std::abs(std::real(dot0)));

        scalar_type kappa1 = sqrt(std::abs(std::real(dot1)));

        scalar_type kappaA = std::real(dotA);


        // Combine the two coefficient sets: Y0 -= ghat * YL. When kappaA is
        // below 0.7 * kappa0 * kappa1, ghat is set to +/- 0.7 * kappa0 / kappa1
        // (sign of kappaA); otherwise ghat = kappaA / kappa1^2.
        if (!math::is_zero(kappa0) && !math::is_zero(kappa1)) {

          scalar_type ghat;

          if (kappaA < 0.7 * kappa0 * kappa1) {

            ghat = (kappaA < 0) ? -0.7 * kappa0 / kappa1 : 0.7 * kappa0 / kappa1;

          }

          else {

            ghat = kappaA / (kappa1 * kappa1);

          }


          for (int i = 0; i <= L; ++i)

            Y0[i] -= ghat * YL[i];

        }

      }


      // omega is Y0[L]; if that is zero, scan Y0[L], Y0[L-1], ... and stop at
      // the first non-zero entry. A zero omega after the scan is a breakdown.
      omega = Y0[L];

      for (int h = L; h > 0 && math::is_zero(omega); --h)

        omega = Y0[h];

      precondition(!math::is_zero(omega), "BiCGStab(L) breakdown: diverged (zero omega)");


      // NOTE(review): backend::lin_comb(n, c, v, b, y) presumably computes
      // y = b * y + sum_{k < n} c[k] * v[k] - confirm against the backend.
      // Under that assumption: X += sum_{k=1..L} Y0[k] * R[k - 1].
      backend::lin_comb(L, &Y0[1], &R[0], one, *X);


      // Temporarily negate Y0[1..L] so the same lin_comb call subtracts the
      // combination from U[0] and R[0].
      for (int i = 1; i <= L; ++i)

        Y0[i] = -one * Y0[i];


      backend::lin_comb(L, &Y0[1], &U[1], one, *U[0]);

      backend::lin_comb(L, &Y0[1], &R[1], one, *R[0]);


      // Restore the original sign of Y0[1..L].
      for (int i = 1; i <= L; ++i)

        Y0[i] = -one * Y0[i];


      zeta = norm(*R[0]);


      // Accurate update (only when prm.delta > 0): when the residual norm has
      // dropped far enough below the largest norms seen so far, recompute
      // R[0] from X and B instead of trusting the recurrence.
      if (prm.delta > 0) {

        rnmax_computed = std::max(zeta, rnmax_computed);

        rnmax_true = std::max(zeta, rnmax_true);


        bool update_x = zeta < prm.delta * zeta0 && zeta0 <= rnmax_computed;


        if ((zeta < prm.delta * rnmax_true && zeta <= rnmax_true) || update_x) {

          // R[0] = B - op(X) (under the axpby assumption), where op is the
          // preconditioned operator applied by preconditioner_spmv().
          preconditioner_spmv(prm.pside, P, A, *X, *R[0], *T);

          backend::axpby(one, *B, -one, *R[0]);

          rnmax_true = zeta;


          // Flush the accumulated correction into x and restart from X = 0
          // with B replaced by the recomputed residual.
          if (update_x) {

            if (prm.pside == ePreconditionerSideType::left) {

              backend::axpby(one, *X, one, x);

            }

            else {

              // NOTE(review): relies on T still holding the intermediate
              // result left by the preconditioner_spmv() call above
              // (presumably P applied to X) - confirm.
              backend::axpby(one, *T, one, x);

            }

            backend::clear(*X);

            backend::copy(*R[0], *B);


            rnmax_computed = zeta;

          }

        }

      }

      // Progress line: iteration counter and relative residual, printed only
      // when the counter is a multiple of 5.
      if (prm.verbose && iter % 5 == 0)

        std::cout << iter << "\t" << std::scientific << zeta / norm_rhs << std::endl;

    }


  done:

    // Add the accumulated correction to x; with right preconditioning X is
    // first passed through P.
    if (prm.pside == ePreconditionerSideType::left) {

      backend::axpby(one, *X, one, x);

    }

    else {

      P.apply(*X, *T);

      backend::axpby(one, *T, one, x);

    }


    return SolverResult(iter, zeta / norm_rhs);

  }


  /*!
   * \brief Computes the solution for the given right-hand side.
   *
   * Same as the four-argument overload, with P.system_matrix() used as the
   * system matrix.
   */
  template <class Precond, class Vec1, class Vec2>


  SolverResult operator()(const Precond& P, const Vec1& rhs, Vec2&& x) const

  {

    return (*this)(P.system_matrix(), P, rhs, x);

  }


  /*!
   * \brief Memory used in bytes.
   *
   * Sums backend::bytes() over the work vectors Rt, X, B, T and every vector
   * of R and U, adds the element storage of MZa and MZb, backend::bytes() of
   * Y0 and YL, and qr.bytes().
   */
  size_t bytes() const

  {

    size_t b = 0;


    b += backend::bytes(*Rt);

    b += backend::bytes(*X);

    b += backend::bytes(*B);

    b += backend::bytes(*T);


    for (const auto& v : R)

      b += backend::bytes(*v);

    for (const auto& v : U)

      b += backend::bytes(*v);


    b += MZa.size() * sizeof(coef_type);

    b += MZb.size() * sizeof(coef_type);


    b += backend::bytes(Y0);

    b += backend::bytes(YL);


    b += qr.bytes();


    return b;

  }


  // Prints a short description of the solver: method order, number of
  // unknowns and memory footprint (as reported by bytes()).
  friend std::ostream& operator<<(std::ostream& os, const BiCGStabLSolver& s)

  {

    return os << "Type:             BiCGStab(" << s.prm.L << ")"

              << "\nUnknowns:         " << s.n

              << "\nMemory footprint: " << human_readable_memory(s.bytes())

              << std::endl;

  }


 public:


  // Solver parameters (copied from the constructor argument).
  params prm;


 private:


  // Size of the system the work vectors were allocated for.
  size_t n;


  // Work vectors, mutable because the const call operators overwrite them:
  // Rt: copy of the initial residual used in the rho/sigma inner products,
  // X: accumulated correction, B: reference residual, T: scratch vector.
  mutable std::shared_ptr<vector> Rt;

  mutable std::shared_ptr<vector> X;

  mutable std::shared_ptr<vector> B;

  mutable std::shared_ptr<vector> T;


  // Residual (R) and search-direction (U) sequences, prm.L + 1 vectors each.
  mutable std::vector<std::shared_ptr<vector>> R;

  mutable std::vector<std::shared_ptr<vector>> U;


  // (prm.L + 1) x (prm.L + 1) arrays of residual inner products (MZa is the
  // one handed to qr.solve(), MZb is its copy), the polynomial coefficient
  // arrays Y0 / YL and the QR factorization helper.
  mutable multi_array<coef_type, 2> MZa, MZb;

  mutable std::vector<coef_type> Y0, YL;

  mutable Alina::detail::QRFactorization<coef_type> qr;


  InnerProduct inner_product;


  // Norm induced by the inner product: sqrt(math::norm(<x, x>)).
  template <class Vec>

  scalar_type norm(const Vec& x) const

  {

    return sqrt(math::norm(inner_product(x, x)));

  }

};


/*---------------------------------------------------------------------------*/

/*---------------------------------------------------------------------------*/


} // namespace Arcane::Alina


/*---------------------------------------------------------------------------*/

/*---------------------------------------------------------------------------*/


#endif

Arcane::Alina::BiCGStabLSolver
BiCGStab(L) method.
Definition BiCGStabLSolver.h:152

Arcane::Alina::BiCGStabLSolver::bytes
size_t bytes() const
Memory used in bytes.
Definition BiCGStabLSolver.h:444

Arcane::Alina::BiCGStabLSolver::BiCGStabLSolver
BiCGStabLSolver(size_t n, const params &prm=params(), const backend_params &backend_prm=backend_params(), const InnerProduct &inner_product=InnerProduct())
Preallocates necessary data structures for the system of size n.
Definition BiCGStabLSolver.h:170

Arcane::Alina::BiCGStabLSolver::operator()
SolverResult operator()(const Precond &P, const Vec1 &rhs, Vec2 &&x) const
Computes the solution for the given right-hand side.
Definition BiCGStabLSolver.h:439

Arcane::Alina::PropertyTree
Definition AlinaUtils.h:106

Arcane::Alina::ScopedStreamModifier
Save ostream flags in constructor, restore in destructor.
Definition ScopedStreamModifier.h:40

Arcane::Alina::SolverBase
Base class for solvers.
Definition SolverBase.h:31

Arcane::Alina::SolverResult
Result of a solving.
Definition AlinaUtils.h:52

Arcane::Alina::detail::QRFactorization
Definition QRFactorizationImpl.h:123

Arcane::Matrix
Matrix class, to be used by user.
Definition matrix/Matrix.h:36

Arcane::math::sqrt
__host__ __device__ double sqrt(double v)
Racine carrée de v.
Definition Math.h:135

Arcane::Int32
std::int32_t Int32
Type entier signé sur 32 bits.
Definition ArccoreGlobal.h:225

Arcane::Alina::BiCGStabLSolverParams
Parameters for BiCGStab(L) solver.
Definition BiCGStabLSolver.h:79

Arcane::Alina::BiCGStabLSolverParams::ns_search
bool ns_search
Ignore the trivial solution x=0 when rhs is zero.
Definition BiCGStabLSolver.h:109

Arcane::Alina::BiCGStabLSolverParams::verbose
bool verbose
Verbose output (show iterations and error)
Definition BiCGStabLSolver.h:112

Arcane::Alina::math::inner_product_impl
Default implementation for inner product.
Definition ValueTypeInterface.h:92