From 7d1f6fdae95cd758766649077ddb5e12e0659528 Mon Sep 17 00:00:00 2001 From: Christian Engwer <christi@dune-project.org> Date: Fri, 20 Nov 2015 00:53:51 +0100 Subject: [PATCH] [solvers] rewrite the solvers to work with the simd infrastructure Currently RestartedGMRes and MINRes don't work with multiple rhs, as it is not straight forward to rewrite the Givens-rotation in a vectorized way. --- dune/istl/solvers.hh | 87 +++++++++++++++++++++++--------------------- 1 file changed, 46 insertions(+), 41 deletions(-) diff --git a/dune/istl/solvers.hh b/dune/istl/solvers.hh index 38080e797..ec59f7eeb 100644 --- a/dune/istl/solvers.hh +++ b/dune/istl/solvers.hh @@ -20,6 +20,8 @@ #include "preconditioner.hh" #include <dune/common/deprecated.hh> #include <dune/common/exceptions.hh> +#include <dune/common/simd.hh> +#include <dune/common/rangeutilities.hh> #include <dune/common/timer.hh> #include <dune/common/ftraits.hh> #include <dune/common/typetraits.hh> @@ -170,7 +172,7 @@ namespace Dune { this->printOutput(std::cout,i,defnew,def); //std::cout << i << " " << defnew << " " << defnew/def << std::endl; def = defnew; // update norm - if (def<def0*_reduction || def<1E-30) // convergence check + if (all_true(def<def0*_reduction) || max_value(def)<1E-30) // convergence check { res.converged = true; break; @@ -189,7 +191,7 @@ namespace Dune { // fill statistics res.iterations = i; - res.reduction = def/def0; + res.reduction = max_value(def/def0); res.conv_rate = pow(res.reduction,1.0/i); res.elapsed = watch.elapsed(); @@ -312,7 +314,7 @@ namespace Dune { this->printOutput(std::cout,i,defnew,def); def = defnew; // update norm - if (def<def0*_reduction || def<1E-30) // convergence check + if (all_true(def<def0*_reduction) || max_value(def)<1E-30) // convergence check { res.converged = true; break; @@ -327,8 +329,8 @@ namespace Dune { _prec.post(x); // postprocess preconditioner res.iterations = i; // fill statistics - res.reduction = static_cast<double>(def/def0); - res.conv_rate = static_cast<double>(pow(res.reduction,1.0/i)); + res.reduction = static_cast<double>(max_value(def/def0)); + res.conv_rate = pow(res.reduction,1.0/i); res.elapsed = watch.elapsed(); if (_verbose>0) // final print std::cout << "=== rate=" << res.conv_rate @@ -429,7 +431,7 @@ namespace Dune { real_type def0 = _sp.norm(b); // compute norm - if (!isfinite(def0)) // check for inf or NaN + if (!all_true(isfinite(def0))) // check for inf or NaN { if (_verbose>0) std::cout << "=== CGSolver: abort due to infinite or NaN initial defect" @@ -438,7 +440,7 @@ namespace Dune { << " is infinite or NaN"); } - if (def0<1E-30) // convergence check + if (max_value(def0)<1E-30) // convergence check { res.converged = true; res.iterations = 0; // fill statistics @@ -457,7 +459,7 @@ namespace Dune { std::cout << "=== CGSolver" << std::endl; if (_verbose>1) { this->printHeader(std::cout); - this->printOutput(std::cout,real_type(0),def0); + this->printOutput(std::cout,0,def0); } } @@ -485,10 +487,10 @@ namespace Dune { real_type defnew=_sp.norm(b); // comp defect norm if (_verbose>1) // print - this->printOutput(std::cout,real_type(i),defnew,def); + this->printOutput(std::cout,i,defnew,def); def = defnew; // update norm - if (!isfinite(def)) // check for inf or NaN + if (!all_true(isfinite(def))) // check for inf or NaN { if (_verbose>0) std::cout << "=== CGSolver: abort due to infinite or NaN defect" @@ -497,7 +499,7 @@ namespace Dune { "CGSolver: defect=" << def << " is infinite or NaN"); } - if (def<def0*_reduction || def<1E-30) // convergence check + if (all_true(def<def0*_reduction) || max_value(def)<1E-30) // convergence check { res.converged = true; break; @@ -517,12 +519,12 @@ namespace Dune { i=std::min(_maxit,i); if (_verbose==1) // printing for non verbose - this->printOutput(std::cout,real_type(i),def); + this->printOutput(std::cout,i,def); _prec.post(x); // postprocess preconditioner res.iterations = i; // fill statistics - res.reduction = static_cast<double>(def/def0); - res.conv_rate = static_cast<double>(pow(res.reduction,1.0/i)); + res.reduction = static_cast<double>(max_value(max_value(def/def0))); + res.conv_rate = pow(res.reduction,1.0/i); res.elapsed = watch.elapsed(); if (_verbose>0) // final print @@ -621,6 +623,7 @@ namespace Dune { { using std::abs; const real_type EPSILON=1e-80; + using std::abs; double it; field_type rho, rho_new, alpha, beta, h, omega; real_type norm, norm_old, norm_0; @@ -668,7 +671,7 @@ namespace Dune { } } - if ( norm < (_reduction * norm_0) || norm<1E-30) + if ( all_true(norm < (_reduction * norm_0)) || max_value(norm)<1E-30) { res.converged = 1; _prec.post(x); // postprocess preconditioner @@ -693,13 +696,13 @@ namespace Dune { rho_new = _sp.dot(rt,r); // look if breakdown occurred - if (abs(rho) <= EPSILON) + if (all_true(abs(rho) <= EPSILON)) DUNE_THROW(SolverAbort,"breakdown in BiCGSTAB - rho " - << rho << " <= EPSILON " << EPSILON + << rho << " <= EPSILON " << max_value(EPSILON) << " after " << it << " iterations"); - if (abs(omega) <= EPSILON) + if (all_true(abs(omega) <= EPSILON)) DUNE_THROW(SolverAbort,"breakdown in BiCGSTAB - omega " - << omega << " <= EPSILON " << EPSILON + << omega << " <= EPSILON " << max_value(EPSILON) << " after " << it << " iterations"); @@ -723,9 +726,9 @@ namespace Dune { // alpha = rho_new / < rt, v > h = _sp.dot(rt,v); - if (abs(h) < EPSILON) + if ( all_true(abs(h) < EPSILON) ) DUNE_THROW(SolverAbort,"abs(h) < EPSILON in BiCGSTAB - abs(h) " - << abs(h) << " < EPSILON " << EPSILON + << abs(h) << " < EPSILON " << max_value(EPSILON) << " after " << it << " iterations"); alpha = rho_new / h; @@ -748,7 +751,7 @@ namespace Dune { this->printOutput(std::cout,it,norm,norm_old); } - if ( norm < (_reduction * norm_0) ) + if ( all_true(norm < (_reduction * norm_0)) ) { res.converged = 1; break; @@ -787,7 +790,7 @@ namespace Dune { this->printOutput(std::cout,it,norm,norm_old); } - if ( norm < (_reduction * norm_0) || norm<1E-30) + if ( all_true(norm < (_reduction * norm_0)) || max_value(norm)<1E-30) { res.converged = 1; break; @@ -804,8 +807,8 @@ namespace Dune { _prec.post(x); // postprocess preconditioner res.iterations = static_cast<int>(std::ceil(it)); // fill statistics - res.reduction = static_cast<double>(norm/norm_0); - res.conv_rate = static_cast<double>(pow(res.reduction,1.0/it)); + res.reduction = static_cast<double>(max_value(norm/norm_0)); + res.conv_rate = pow(res.reduction,1.0/it); res.elapsed = watch.elapsed(); if (_verbose>0) // final print std::cout << "=== rate=" << res.conv_rate @@ -918,7 +921,7 @@ namespace Dune { } // check for convergence - if(def0 < 1e-30 ) { + if( max_value(def0) < 1e-30 ) { res.converged = true; res.iterations = 0; res.reduction = 0; @@ -1045,7 +1048,8 @@ namespace Dune { this->printOutput(std::cout,i,defnew,def); def = defnew; - if(def < def0*_reduction || def < 1e-30 || i == _maxit ) { + if(all_true(def < def0*_reduction) + || max_value(def) < 1e-30 || i == _maxit ) { res.converged = true; break; } @@ -1058,8 +1062,8 @@ namespace Dune { _prec.post(x); // fill statistics res.iterations = i; - res.reduction = static_cast<double>(def/def0); - res.conv_rate = static_cast<double>(pow(res.reduction,1.0/i)); + res.reduction = static_cast<double>(max_value(def/def0)); + res.conv_rate = pow(res.reduction,1.0/i); res.elapsed = watch.elapsed(); // final print @@ -1236,7 +1240,7 @@ namespace Dune { */ virtual void apply (X& x, Y& b, InverseOperatorResult& res) { - apply(x,b,_reduction,res); + apply(x,b,max_value(_reduction),res); } /*! @@ -1289,7 +1293,7 @@ namespace Dune { } } - if(norm_0 < EPSILON) { + if(all_true(norm_0 < EPSILON)) { _W.post(x); res.converged = true; if(_verbose > 0) // final print @@ -1321,7 +1325,7 @@ namespace Dune { w.axpy(-H[k][i],v[k]); } H[i+1][i] = _sp.norm(w); - if(abs(H[i+1][i]) < EPSILON) + if(all_true(abs(H[i+1][i]) < EPSILON)) DUNE_THROW(SolverAbort, "breakdown in GMRes - |w| == 0.0 after " << j << " iterations"); @@ -1349,7 +1353,7 @@ namespace Dune { norm_old = norm; // check convergence - if(norm < reduction * norm_0) + if(all_true(norm < reduction * norm_0)) res.converged = true; } // end for @@ -1385,8 +1389,8 @@ namespace Dune { // save solver statistics res.iterations = j-1; // it has to be j-1!!! - res.reduction = static_cast<double>(norm/norm_0); - res.conv_rate = static_cast<double>(pow(res.reduction,1.0/(j-1))); + res.reduction = static_cast<double>(max_value(norm/norm_0)); + res.conv_rate = pow(res.reduction,1.0/(j-1)); res.elapsed = watch.elapsed(); if(_verbose>0) @@ -1426,12 +1430,13 @@ namespace Dune { } template<typename T> - typename std::enable_if<std::is_same<field_type,real_type>::value,T>::type conjugate(const T& t) { + typename enable_if<std::is_same<field_type,real_type>::value,T>::type conjugate(const T& t) { return t; } template<typename T> - typename std::enable_if<!std::is_same<field_type,real_type>::value,T>::type conjugate(const T& t) { + typename enable_if<!std::is_same<field_type,real_type>::value,T>::type conjugate(const T& t) { + using std::conj; return conj(t); } @@ -1566,7 +1571,7 @@ namespace Dune { p[0].reset(new X(x)); real_type def0 = _sp.norm(b); // compute norm - if (def0<1E-30) // convergence check + if ( max_value(def0) < 1E-30 ) // convergence check { res.converged = true; res.iterations = 0; // fill statistics @@ -1609,7 +1614,7 @@ namespace Dune { if (_verbose>1) // print this->printOutput(std::cout,++i,defnew,def); def = defnew; // update norm - if (def<def0*_reduction || def<1E-30) // convergence check + if (all_true(def<def0*_reduction) || max_value(def)<1E-30) // convergence check { res.converged = true; if (_verbose>0) // final print @@ -1655,7 +1660,7 @@ namespace Dune { this->printOutput(std::cout,++i,defNew,def); def = defNew; // update norm - if (def<def0*_reduction || def<1E-30) // convergence check + if (all_true(def<def0*_reduction) || max_value(def)<1E-30) // convergence check { res.converged = true; break; @@ -1674,7 +1679,7 @@ namespace Dune { // fill statistics res.iterations = i; - res.reduction = def/def0; + res.reduction = max_value(def/def0); res.conv_rate = pow(res.reduction,1.0/i); res.elapsed = watch.elapsed(); -- GitLab