doxygen/5.1.0/_nek_lin_sys_iter_c_g_8cpp_source.html

 ///////////////////////////////////////////////////////////////////////////////

 //

 // File:  NekLinSysIterCG.cpp

 //

 // For more information, please see: http://www.nektar.info

 //

 // The MIT License

 //

 // Copyright (c) 2006 Division of Applied Mathematics, Brown University (USA),

 // Department of Aeronautics, Imperial College London (UK), and Scientific

 // Computing and Imaging Institute, University of Utah (USA).

 //

 // License for the specific language governing rights and limitations under

 // Permission is hereby granted, free of charge, to any person obtaining a

 // copy of this software and associated documentation files (the "Software"),

 // to deal in the Software without restriction, including without limitation

 // the rights to use, copy, modify, merge, publish, distribute, sublicense,

 // and/or sell copies of the Software, and to permit persons to whom the

 // Software is furnished to do so, subject to the following conditions:

 //

 // The above copyright notice and this permission notice shall be included

 // in all copies or substantial portions of the Software.

 //

 // THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS

 // OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,

 // FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL

 // THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER

 // LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING

 // FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER

 // DEALINGS IN THE SOFTWARE.

 //

 // Description:  NekLinSysIterCG definition

 //

 ///////////////////////////////////////////////////////////////////////////////


 #include <LibUtilities/BasicUtils/Timer.h>

 #include <LibUtilities/LinearAlgebra/NekLinSysIterCG.h>


 using namespace std;


 namespace Nektar

 {

 namespace LibUtilities

 {

 /**

  * @class  NekLinSysIterCG

  *

  * Solves a linear system using iterative methods.

  */

 string NekLinSysIterCG::className =

     LibUtilities::GetNekLinSysIterFactory().RegisterCreatorFunction(

         "ConjugateGradient", NekLinSysIterCG::create,

         "NekLinSysIterCG solver.");


 /**
  * Construct the solver. All arguments are forwarded unchanged to the
  * NekLinSysIter base class; no additional state is set up here.
  *
  * @param       pSession    Session reader handed to the base class.
  * @param       vComm       Communicator handed to the base class.
  * @param       nDimen      Dimension argument handed to the base class.
  * @param       pKey        Solver key handed to the base class.
  */
 NekLinSysIterCG::NekLinSysIterCG(
     const LibUtilities::SessionReaderSharedPtr &pSession,
     const LibUtilities::CommSharedPtr          &vComm,
     const int                                   nDimen,
     const NekSysKey                            &pKey)
     : NekLinSysIter(pSession, vComm, nDimen, pKey)
 {
     // Nothing beyond base-class construction.
 }


 /**
  * Initialise the object. This solver adds no initialisation of its own
  * and simply delegates to NekLinSysIter::v_InitObject().
  */
 void NekLinSysIterCG::v_InitObject()
 {
     // Delegate entirely to the base-class implementation.
     NekLinSysIter::v_InitObject();
 }


 /**
  * Destructor. Performs no explicit clean-up in this class.
  */
 NekLinSysIterCG::~NekLinSysIterCG()
 {
     // Intentionally empty.
 }


 /**
  * Solve the linear system with the conjugate gradient method.
  *
  * Stores the requested tolerance (floored at 1.0E-16) in m_tolerance and
  * the preconditioner factor in m_prec_factor, then runs
  * DoConjugateGradient().
  *
  * @param       nGlobal     Length argument forwarded to
  *                          DoConjugateGradient().
  * @param       pInput      Input array forwarded to DoConjugateGradient().
  * @param       pOutput     Output array forwarded to
  *                          DoConjugateGradient().
  * @param       nDir        Offset argument forwarded to
  *                          DoConjugateGradient().
  * @param       tol         Requested tolerance; values below 1.0E-16 are
  *                          replaced by 1.0E-16.
  * @param       factor      Value stored in m_prec_factor.
  *
  * @return      The value of m_totalIterations after the solve.
  */
 int NekLinSysIterCG::v_SolveSystem(const int nGlobal,
                                    const Array<OneD, const NekDouble> &pInput,
                                    Array<OneD, NekDouble> &pOutput,
                                    const int nDir, const NekDouble tol,
                                    const NekDouble factor)
 {
     // Guard against a zero or tiny tolerance being requested.
     m_tolerance   = max(tol, 1.0E-16);
     m_prec_factor = factor;

     DoConjugateGradient(nGlobal, pInput, pOutput, nDir);

     return m_totalIterations;
 }


 /**

  * Solve a global linear system using the conjugate gradient method.

  * We solve only for the non-Dirichlet modes. The operator is evaluated

  * using an auxiliary function m_operator.DoNekSysLhsEval defined by the

  * specific solver. Distributed math routines are used to support

  * parallel execution of the solver.

  *

  * The implemented algorithm uses a reduced-communication reordering of

  * the standard PCG method (Demmel, Heath and Vorst, 1993)

  *

  * @param       pInput      Input residual  of all DOFs.

  * @param       pOutput     Solution vector of all DOFs.

  */

 void NekLinSysIterCG::DoConjugateGradient(

     const int nGlobal, const Array<OneD, const NekDouble> &pInput,

     Array<OneD, NekDouble> &pOutput, const int nDir)

 {

     // Get vector sizes

     int nNonDir = nGlobal - nDir;


     // Allocate array storage

     Array<OneD, NekDouble> w_A(nGlobal, 0.0);

     Array<OneD, NekDouble> s_A(nGlobal, 0.0);

     Array<OneD, NekDouble> p_A(nNonDir, 0.0);

     Array<OneD, NekDouble> r_A(nNonDir, 0.0);

     Array<OneD, NekDouble> q_A(nNonDir, 0.0);

     Array<OneD, NekDouble> tmp;


     // Create NekVector wrappers for linear algebra operations

     NekVector<NekDouble> in(nNonDir, pInput + nDir, eWrapper);

     NekVector<NekDouble> out(nNonDir, tmp = pOutput + nDir, eWrapper);

     NekVector<NekDouble> w(nNonDir, tmp = w_A + nDir, eWrapper);

     NekVector<NekDouble> s(nNonDir, tmp = s_A + nDir, eWrapper);

     NekVector<NekDouble> p(nNonDir, p_A, eWrapper);

     NekVector<NekDouble> r(nNonDir, r_A, eWrapper);

     NekVector<NekDouble> q(nNonDir, q_A, eWrapper);


     int k;

     NekDouble alpha;

     NekDouble beta;

     NekDouble rho;

     NekDouble rho_new;

     NekDouble mu;

     NekDouble eps;

     NekDouble min_resid;

     Array<OneD, NekDouble> vExchange(3, 0.0);


     // Copy initial residual from input

     r = in;

     // zero homogeneous out array ready for solution updates

     // Should not be earlier in case input vector is same as

     // output and above copy has been peformed

     Vmath::Zero(nNonDir, tmp = pOutput + nDir, 1);


     // evaluate initial residual error for exit check

     vExchange[2] = Vmath::Dot2(nNonDir, r_A, r_A, m_map + nDir);


     m_Comm->AllReduce(vExchange, Nektar::LibUtilities::ReduceSum);


     eps = vExchange[2];


     if (m_rhs_magnitude == NekConstants::kNekUnsetDouble)

     {

         NekVector<NekDouble> inGlob(nGlobal, pInput, eWrapper);

         Set_Rhs_Magnitude(inGlob);

     }


     m_totalIterations = 0;


     // If input residual is less than tolerance skip solve.

     if (eps < m_tolerance * m_tolerance * m_rhs_magnitude)

     {

         if (m_verbose && m_root)

         {

             cout << "CG iterations made = " << m_totalIterations

                  << " using tolerance of " << m_tolerance

                  << " (error = " << sqrt(eps / m_rhs_magnitude)

                  << ", rhs_mag = " << sqrt(m_rhs_magnitude) << ")" << endl;

         }

         return;

     }


     m_operator.DoNekSysPrecon(r_A, tmp = w_A + nDir);


     m_operator.DoNekSysLhsEval(w_A, s_A);


     k = 0;


     vExchange[0] = Vmath::Dot2(nNonDir, r_A, w_A + nDir, m_map + nDir);


     vExchange[1] = Vmath::Dot2(nNonDir, s_A + nDir, w_A + nDir, m_map + nDir);


     m_Comm->AllReduce(vExchange, Nektar::LibUtilities::ReduceSum);


     rho               = vExchange[0];

     mu                = vExchange[1];

     min_resid         = m_rhs_magnitude;

     beta              = 0.0;

     alpha             = rho / mu;

     m_totalIterations = 1;


     // Continue until convergence

     while (true)

     {

         if (k >= m_maxiter)

         {

             if (m_root)

             {

                 cout << "CG iterations made = " << m_totalIterations

                      << " using tolerance of " << m_tolerance

                      << " (error = " << sqrt(eps / m_rhs_magnitude)

                      << ", rhs_mag = " << sqrt(m_rhs_magnitude) << ")" << endl;

             }

             ROOTONLY_NEKERROR(ErrorUtil::efatal,

                               "Exceeded maximum number of iterations");

         }


         // Compute new search direction p_k, q_k

         Vmath::Svtvp(nNonDir, beta, &p_A[0], 1, &w_A[nDir], 1, &p_A[0], 1);

         Vmath::Svtvp(nNonDir, beta, &q_A[0], 1, &s_A[nDir], 1, &q_A[0], 1);


         // Update solution x_{k+1}

         Vmath::Svtvp(nNonDir, alpha, &p_A[0], 1, &pOutput[nDir], 1,

                      &pOutput[nDir], 1);


         // Update residual vector r_{k+1}

         Vmath::Svtvp(nNonDir, -alpha, &q_A[0], 1, &r_A[0], 1, &r_A[0], 1);


         // Apply preconditioner

         m_operator.DoNekSysPrecon(r_A, tmp = w_A + nDir);


         // Perform the method-specific matrix-vector multiply operation.

         m_operator.DoNekSysLhsEval(w_A, s_A);


         // <r_{k+1}, w_{k+1}>

         vExchange[0] = Vmath::Dot2(nNonDir, r_A, w_A + nDir, m_map + nDir);

         // <s_{k+1}, w_{k+1}>

         vExchange[1] =

             Vmath::Dot2(nNonDir, s_A + nDir, w_A + nDir, m_map + nDir);


         // <r_{k+1}, r_{k+1}>

         vExchange[2] = Vmath::Dot2(nNonDir, r_A, r_A, m_map + nDir);


         // Perform inner-product exchanges

         m_Comm->AllReduce(vExchange, Nektar::LibUtilities::ReduceSum);


         rho_new = vExchange[0];

         mu      = vExchange[1];

         eps     = vExchange[2];


         m_totalIterations++;


         // Test if norm is within tolerance

         if (eps < m_tolerance * m_tolerance * m_rhs_magnitude)

         {

             if (m_verbose && m_root)

             {

                 cout << "CG iterations made = " << m_totalIterations

                      << " using tolerance of " << m_tolerance

                      << " (error = " << sqrt(eps / m_rhs_magnitude)

                      << ", rhs_mag = " << sqrt(m_rhs_magnitude) << ")" << endl;

             }

             break;

         }

         min_resid = min(min_resid, eps);


         // Compute search direction and solution coefficients

         beta  = rho_new / rho;

         alpha = rho_new / (mu - rho_new * beta / alpha);

         rho   = rho_new;

         k++;

     }

 }

 } // namespace LibUtilities

 } // namespace Nektar

ROOTONLY_NEKERROR
#define ROOTONLY_NEKERROR(type, msg)
Definition: ErrorUtil.hpp:213

NekLinSysIterCG.h

Timer.h

Nektar::Array
Definition: SharedArray.hpp:54

Nektar::ErrorUtil::efatal
@ efatal
Definition: ErrorUtil.hpp:69

Nektar::LibUtilities::NekFactory::RegisterCreatorFunction
tKey RegisterCreatorFunction(tKey idKey, CreatorFunction classCreator, std::string pDesc="")
Register a class with the factory.
Definition: NekFactory.hpp:200

Nektar::LibUtilities::NekLinSysIterCG::DoConjugateGradient
void DoConjugateGradient(const int pNumRows, const Array< OneD, const NekDouble > &pInput, Array< OneD, NekDouble > &pOutput, const int pNumDir)
Actual iterative solve.
Definition: NekLinSysIterCG.cpp:104

Nektar::LibUtilities::NekLinSysIterCG::v_InitObject
virtual void v_InitObject()
Definition: NekLinSysIterCG.cpp:63

Nektar::LibUtilities::NekLinSysIterCG::~NekLinSysIterCG
~NekLinSysIterCG()
Definition: NekLinSysIterCG.cpp:68

Nektar::LibUtilities::NekLinSysIterCG::v_SolveSystem
virtual int v_SolveSystem(const int nGlobal, const Array< OneD, const NekDouble > &pInput, Array< OneD, NekDouble > &pOutput, const int nDir, const NekDouble tol, const NekDouble factor)
Definition: NekLinSysIterCG.cpp:75

Nektar::LibUtilities::NekLinSysIter
Definition: NekLinSysIter.h:58

Nektar::LibUtilities::NekLinSysIter::m_prec_factor
NekDouble m_prec_factor
Definition: NekLinSysIter.h:109

Nektar::LibUtilities::NekLinSysIter::m_totalIterations
int m_totalIterations
Definition: NekLinSysIter.h:106

Nektar::LibUtilities::NekLinSysIter::m_rhs_magnitude
NekDouble m_rhs_magnitude
Dot product of rhs to normalise stopping criterion.
Definition: NekLinSysIter.h:104

Nektar::LibUtilities::NekLinSysIter::Set_Rhs_Magnitude
void Set_Rhs_Magnitude(const NekVector< NekDouble > &pIn)
Definition: NekLinSysIter.cpp:128

Nektar::LibUtilities::NekLinSysIter::v_InitObject
virtual void v_InitObject()
Definition: NekLinSysIter.cpp:103

Nektar::LibUtilities::NekLinSysIter::m_map
Array< OneD, int > m_map
Global to universal unique map.
Definition: NekLinSysIter.h:101

Nektar::LibUtilities::NekSys::m_root
bool m_root
Root if parallel.
Definition: NekSys.h:289

Nektar::LibUtilities::NekSys::m_verbose
bool m_verbose
Verbose.
Definition: NekSys.h:291

Nektar::LibUtilities::NekSys::m_tolerance
NekDouble m_tolerance
Tolerance of iterative solver.
Definition: NekSys.h:283

Nektar::LibUtilities::NekSys::m_operator
NekSysOperators m_operator
Operators.
Definition: NekSys.h:294

Nektar::LibUtilities::NekSys::m_Comm
LibUtilities::CommSharedPtr m_Comm
Communicate.
Definition: NekSys.h:285

Nektar::LibUtilities::NekSys::m_maxiter
int m_maxiter
Maximum iterations.
Definition: NekSys.h:281

Nektar::LibUtilities::NekSysKey
Definition: NekSys.h:188

Nektar::LibUtilities::NekSysOperators::DoNekSysPrecon
void DoNekSysPrecon(InArrayType &inarray, OutArrayType &outarray, const bool &flag=false) const
Definition: NekSys.h:142

Nektar::LibUtilities::NekSysOperators::DoNekSysLhsEval
void DoNekSysLhsEval(InArrayType &inarray, OutArrayType &outarray, const bool &flag=false) const
Definition: NekSys.h:135

Nektar::NekVector
Definition: NekVector.hpp:57

CellMLToNektar.cellml_metadata.p
p
Definition: cellml_metadata.py:350

Nektar::LibUtilities::SessionReaderSharedPtr
std::shared_ptr< SessionReader > SessionReaderSharedPtr
Definition: SessionReader.h:120

Nektar::LibUtilities::GetNekLinSysIterFactory
NekLinSysIterFactory & GetNekLinSysIterFactory()
Definition: NekLinSysIter.cpp:50

Nektar::LibUtilities::ReduceSum
@ ReduceSum
Definition: Comm.h:68

Nektar::LibUtilities::CommSharedPtr
std::shared_ptr< Comm > CommSharedPtr
Pointer to a Communicator object.
Definition: Comm.h:54

Nektar::NekConstants::kNekUnsetDouble
static const NekDouble kNekUnsetDouble
Definition: NektarUnivConsts.hpp:47

Nektar
The above copyright notice and this permission notice shall be included.
Definition: CoupledSolver.h:1

Nektar::NekDouble
double NekDouble
Definition: NektarUnivTypeDefs.hpp:43

Nektar::eWrapper
@ eWrapper
Definition: PointerWrapper.h:44

Vmath::Svtvp
void Svtvp(int n, const T alpha, const T *x, const int incx, const T *y, const int incy, T *z, const int incz)
svtvp (scalar times vector plus vector): z = alpha*x + y
Definition: Vmath.cpp:565

Vmath::Dot2
T Dot2(int n, const T *w, const T *x, const int *y)
dot2 (masked dot product): returns the scalar sum of w[i]*x[i] over the n entries, weighted by the integer map y[i]
Definition: Vmath.cpp:1084

Vmath::Zero
void Zero(int n, T *x, const int incx)
Zero vector.
Definition: Vmath.cpp:436

tinysimd::sqrt
scalarT< T > sqrt(scalarT< T > in)
Definition: scalar.hpp:267