228 static const scalar_type zero = math::zero<scalar_type>();
229 static const scalar_type one = math::identity<scalar_type>();
233 if (prm.always_reset) {
237 scalar_type norm_rhs = norm(rhs);
238 if (norm_rhs < Alina::detail::eps<scalar_type>(1)) {
240 norm_rhs = math::identity<scalar_type>();
248 scalar_type norm_r = zero;
249 scalar_type eps = std::max(prm.tol * norm_rhs, prm.abstol);
252 unsigned n_outer = 0;
254 if (prm.pside == ePreconditionerSideType::left) {
255 backend::residual(rhs, A, x, *vs[0]);
259 backend::residual(rhs, A, x, *r);
264 if (norm_r < eps || iter >= prm.maxiter)
268 backend::axpby(math::inverse(norm_r), *r, zero, *vs[0]);
270 std::fill(s.begin(), s.end(), 0);
305 vector& v_new = *vs[j + 1];
307 std::shared_ptr<vector> z;
308 if (j >= M - outer_v.size()) {
309 z = outer_v[j - (M - outer_v.size())];
317 preconditioner_spmv(prm.pside, P, A, *z, v_new, *r);
319 for (
unsigned k = 0; k <= j; ++k) {
320 H0(k, j) = H(k, j) = inner_product(v_new, *vs[k]);
321 backend::axpby(-H(k, j), *vs[k], one, v_new);
323 H0(j + 1, j) = H(j + 1, j) = norm(v_new);
325 backend::axpby(math::inverse(H(j + 1, j)), v_new, zero, v_new);
327 for (
unsigned k = 0; k < j; ++k)
328 detail::apply_plane_rotation(H(k, j), H(k + 1, j), cs[k], sn[k]);
330 detail::generate_plane_rotation(H(j, j), H(j + 1, j), cs[j], sn[j]);
331 detail::apply_plane_rotation(H(j, j), H(j + 1, j), cs[j], sn[j]);
332 detail::apply_plane_rotation(s[j], s[j + 1], cs[j], sn[j]);
334 scalar_type inner_res = std::abs(s[j + 1]);
336 if (prm.verbose && iter % 5 == 0)
337 std::cout << iter <<
"\t" << std::scientific << inner_res / norm_rhs << std::endl;
341 if (iter >= prm.maxiter || j >= M || inner_res <= eps)
346 for (
unsigned i = j; i-- > 0;) {
348 for (
unsigned k = 0; k < i; ++k)
349 s[k] -= H(k, i) * s[i];
353 backend::lin_comb(j, s, ws, zero, dx);
356 if (prm.pside == ePreconditionerSideType::left) {
357 backend::axpby(one, dx, one, x);
360 vector& tmp = *ws[0];
362 backend::axpby(one, tmp, one, x);
366 scalar_type norm_dx = norm(dx);
368 if (prm.K > 0 && !math::is_zero(norm_dx)) {
369 unsigned outer_slot = n_outer % prm.K;
372 norm_dx = math::inverse(norm_dx);
373 backend::axpby(norm_dx, dx, zero, *outer_v_data[outer_slot]);
374 outer_v.push_back(outer_v_data[outer_slot]);