doxygen/5.4.0/_nek_lin_sys_iter_c_g_8cpp_source.html

///////////////////////////////////////////////////////////////////////////////

//

// File: NekLinSysIterCG.cpp

//

// For more information, please see: http://www.nektar.info

//

// The MIT License

//

// Copyright (c) 2006 Division of Applied Mathematics, Brown University (USA),

// Department of Aeronautics, Imperial College London (UK), and Scientific

// Computing and Imaging Institute, University of Utah (USA).

//

// License for the specific language governing rights and limitations under

// Permission is hereby granted, free of charge, to any person obtaining a

// copy of this software and associated documentation files (the "Software"),

// to deal in the Software without restriction, including without limitation

// the rights to use, copy, modify, merge, publish, distribute, sublicense,

// and/or sell copies of the Software, and to permit persons to whom the

// Software is furnished to do so, subject to the following conditions:

//

// The above copyright notice and this permission notice shall be included

// in all copies or substantial portions of the Software.

//

// THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS

// OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,

// FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL

// THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER

// LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING

// FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER

// DEALINGS IN THE SOFTWARE.

//

// Description: NekLinSysIterCG definition

//

///////////////////////////////////////////////////////////////////////////////


#include <LibUtilities/BasicUtils/Timer.h>

#include <LibUtilities/LinearAlgebra/NekLinSysIterCG.h>


using namespace std;


namespace Nektar

{

namespace LibUtilities

{

/**

 * @class  NekLinSysIterCG

 *

 * Solves a linear system using iterative methods.

 */

string NekLinSysIterCG::className =

    LibUtilities::GetNekLinSysIterFactory().RegisterCreatorFunction(

        "ConjugateGradient", NekLinSysIterCG::create,

        "NekLinSysIterCG solver.");


/**
 * Construct the conjugate gradient solver.
 *
 * All arguments are passed unchanged to the NekLinSysIter base-class
 * constructor; no additional state is set up here.
 *
 * @param       pSession    Session reader handed to the base class.
 * @param       vRowComm    Row communicator handed to the base class.
 * @param       nDimen      Dimension argument handed to the base class.
 * @param       pKey        Solver key handed to the base class.
 */
NekLinSysIterCG::NekLinSysIterCG(
    const LibUtilities::SessionReaderSharedPtr &pSession,
    const LibUtilities::CommSharedPtr &vRowComm,
    const int nDimen,
    const NekSysKey &pKey)
    : NekLinSysIter(pSession, vRowComm, nDimen, pKey)
{
    // Nothing beyond base-class construction is required.
}


void NekLinSysIterCG::v_InitObject()

{

    NekLinSysIter::v_InitObject();

}


/**
 * Destructor. The class releases nothing explicitly, so the
 * compiler-generated body is sufficient.
 */
NekLinSysIterCG::~NekLinSysIterCG() = default;


/**
 * Solve the linear system with the conjugate gradient method.
 *
 * Stores the solver tolerance and preconditioner factor on the object and
 * then runs DoConjugateGradient().
 *
 * @param       nGlobal     Total number of entries in the vectors.
 * @param       pInput      Input vector, forwarded to DoConjugateGradient().
 * @param       pOutput     Output vector, forwarded to DoConjugateGradient().
 * @param       nDir        Number of leading entries excluded from the
 *                          solve.
 * @param       tol         Requested tolerance; values below 1.0E-16 are
 *                          raised to 1.0E-16.
 * @param       factor      Value stored in m_prec_factor.
 *
 * @return      The value of m_totalIterations after the solve.
 */
int NekLinSysIterCG::v_SolveSystem(const int nGlobal,
                                   const Array<OneD, const NekDouble> &pInput,
                                   Array<OneD, NekDouble> &pOutput,
                                   const int nDir, const NekDouble tol,
                                   const NekDouble factor)
{
    // Record solve parameters; the tolerance is floored at 1.0E-16.
    m_prec_factor = factor;
    m_tolerance   = std::max(tol, 1.0E-16);

    DoConjugateGradient(nGlobal, pInput, pOutput, nDir);

    return m_totalIterations;
}


/**

 * Solve a global linear system using the conjugate gradient method.

 * We solve only for the non-Dirichlet modes. The operator is evaluated

 * using an auxiliary function m_operator.DoNekSysLhsEval defined by the

 * specific solver. Distributed math routines are used to support

 * parallel execution of the solver.

 *

 * The implemented algorithm uses a reduced-communication reordering of

 * the standard PCG method (Demmel, Heath and Vorst, 1993)

 *

 * @param       pInput      Input residual  of all DOFs.

 * @param       pOutput     Solution vector of all DOFs.

 */

void NekLinSysIterCG::DoConjugateGradient(

    const int nGlobal, const Array<OneD, const NekDouble> &pInput,

    Array<OneD, NekDouble> &pOutput, const int nDir)

{

    // Get vector sizes

    int nNonDir = nGlobal - nDir;


    // Allocate array storage

    Array<OneD, NekDouble> w_A(nGlobal, 0.0);

    Array<OneD, NekDouble> s_A(nGlobal, 0.0);

    Array<OneD, NekDouble> p_A(nNonDir, 0.0);

    Array<OneD, NekDouble> r_A(nNonDir, 0.0);

    Array<OneD, NekDouble> q_A(nNonDir, 0.0);

    Array<OneD, NekDouble> tmp;


    NekDouble alpha;

    NekDouble beta;

    NekDouble rho;

    NekDouble rho_new;

    NekDouble mu;

    NekDouble eps;

    Array<OneD, NekDouble> vExchange(3, 0.0);


    // Copy initial residual from input

    Vmath::Vcopy(nNonDir, pInput + nDir, 1, r_A, 1);


    // Zero homogeneous out array ready for solution updates

    // Should not be earlier in case input vector is same as

    // output and above copy has been peformed

    Vmath::Zero(nNonDir, tmp = pOutput + nDir, 1);


    // Evaluate initial residual error for exit check

    vExchange[2] = Vmath::Dot2(nNonDir, r_A, r_A, m_map + nDir);


    m_rowComm->AllReduce(vExchange[2], Nektar::LibUtilities::ReduceSum);


    eps = vExchange[2];


    if (m_rhs_magnitude == NekConstants::kNekUnsetDouble)

    {

        NekVector<NekDouble> inGlob(nGlobal, pInput, eWrapper);

        Set_Rhs_Magnitude(inGlob);

    }


    m_totalIterations = 0;


    // If input residual is less than tolerance skip solve.

    if (eps < m_tolerance * m_tolerance * m_rhs_magnitude)

    {

        if (m_verbose && m_root)

        {

            cout << "CG iterations made = " << m_totalIterations

                 << " using tolerance of " << m_tolerance

                 << " (error = " << sqrt(eps / m_rhs_magnitude)

                 << ", rhs_mag = " << sqrt(m_rhs_magnitude) << ")" << endl;

        }

        return;

    }


    m_operator.DoNekSysPrecon(r_A, tmp = w_A + nDir);


    m_operator.DoNekSysLhsEval(w_A, s_A);


    vExchange[0] = Vmath::Dot2(nNonDir, r_A, w_A + nDir, m_map + nDir);


    vExchange[1] = Vmath::Dot2(nNonDir, s_A + nDir, w_A + nDir, m_map + nDir);


    m_rowComm->AllReduce(vExchange, Nektar::LibUtilities::ReduceSum);


    rho               = vExchange[0];

    mu                = vExchange[1];

    beta              = 0.0;

    alpha             = rho / mu;

    m_totalIterations = 1;


    // Continue until convergence

    while (true)

    {

        if (m_totalIterations > m_maxiter)

        {

            if (m_root)

            {

                cout << "CG iterations made = " << m_totalIterations

                     << " using tolerance of " << m_tolerance

                     << " (error = " << sqrt(eps / m_rhs_magnitude)

                     << ", rhs_mag = " << sqrt(m_rhs_magnitude) << ")" << endl;

            }

            ROOTONLY_NEKERROR(ErrorUtil::efatal,

                              "Exceeded maximum number of iterations");

        }


        // Compute new search direction p_k, q_k

        Vmath::Svtvp(nNonDir, beta, &p_A[0], 1, &w_A[nDir], 1, &p_A[0], 1);

        Vmath::Svtvp(nNonDir, beta, &q_A[0], 1, &s_A[nDir], 1, &q_A[0], 1);


        // Update solution x_{k+1}

        Vmath::Svtvp(nNonDir, alpha, &p_A[0], 1, &pOutput[nDir], 1,

                     &pOutput[nDir], 1);


        // Update residual vector r_{k+1}

        Vmath::Svtvp(nNonDir, -alpha, &q_A[0], 1, &r_A[0], 1, &r_A[0], 1);


        // Apply preconditioner

        m_operator.DoNekSysPrecon(r_A, tmp = w_A + nDir);


        // Perform the method-specific matrix-vector multiply operation.

        m_operator.DoNekSysLhsEval(w_A, s_A);


        // <r_{k+1}, w_{k+1}>

        vExchange[0] = Vmath::Dot2(nNonDir, r_A, w_A + nDir, m_map + nDir);


        // <s_{k+1}, w_{k+1}>

        vExchange[1] =

            Vmath::Dot2(nNonDir, s_A + nDir, w_A + nDir, m_map + nDir);


        // <r_{k+1}, r_{k+1}>

        vExchange[2] = Vmath::Dot2(nNonDir, r_A, r_A, m_map + nDir);


        // Perform inner-product exchanges

        m_rowComm->AllReduce(vExchange, Nektar::LibUtilities::ReduceSum);


        rho_new = vExchange[0];

        mu      = vExchange[1];

        eps     = vExchange[2];


        m_totalIterations++;


        // Test if norm is within tolerance

        if (eps < m_tolerance * m_tolerance * m_rhs_magnitude)

        {

            if (m_verbose && m_root)

            {

                cout << "CG iterations made = " << m_totalIterations

                     << " using tolerance of " << m_tolerance

                     << " (error = " << sqrt(eps / m_rhs_magnitude)

                     << ", rhs_mag = " << sqrt(m_rhs_magnitude) << ")" << endl;

            }

            break;

        }


        // Compute search direction and solution coefficients

        beta  = rho_new / rho;

        alpha = rho_new / (mu - rho_new * beta / alpha);

        rho   = rho_new;

    }

}

} // namespace LibUtilities

} // namespace Nektar

ROOTONLY_NEKERROR
#define ROOTONLY_NEKERROR(type, msg)
Definition: ErrorUtil.hpp:212

NekLinSysIterCG.h

Timer.h

Nektar::Array
Definition: SharedArray.hpp:53

Nektar::ErrorUtil::efatal
@ efatal
Definition: ErrorUtil.hpp:69

Nektar::LibUtilities::NekFactory::RegisterCreatorFunction
tKey RegisterCreatorFunction(tKey idKey, CreatorFunction classCreator, std::string pDesc="")
Register a class with the factory.
Definition: NekFactory.hpp:198

Nektar::LibUtilities::NekLinSysIterCG::v_InitObject
virtual void v_InitObject() override
Definition: NekLinSysIterCG.cpp:63

Nektar::LibUtilities::NekLinSysIterCG::DoConjugateGradient
void DoConjugateGradient(const int pNumRows, const Array< OneD, const NekDouble > &pInput, Array< OneD, NekDouble > &pOutput, const int pNumDir)
Actual iterative solve.
Definition: NekLinSysIterCG.cpp:102

Nektar::LibUtilities::NekLinSysIterCG::className
static std::string className
Definition: NekLinSysIterCG.h:66

Nektar::LibUtilities::NekLinSysIterCG::v_SolveSystem
virtual int v_SolveSystem(const int nGlobal, const Array< OneD, const NekDouble > &pInput, Array< OneD, NekDouble > &pOutput, const int nDir, const NekDouble tol, const NekDouble factor) override
Definition: NekLinSysIterCG.cpp:75

Nektar::LibUtilities::NekLinSysIterCG::~NekLinSysIterCG
~NekLinSysIterCG()
Definition: NekLinSysIterCG.cpp:68

Nektar::LibUtilities::NekLinSysIterCG::NekLinSysIterCG
NekLinSysIterCG(const LibUtilities::SessionReaderSharedPtr &pSession, const LibUtilities::CommSharedPtr &vRowComm, const int nDimen, const NekSysKey &pKey)
Constructor for the conjugate gradient iterative solver.
Definition: NekLinSysIterCG.cpp:55

Nektar::LibUtilities::NekLinSysIterCG::create
static NekLinSysIterSharedPtr create(const LibUtilities::SessionReaderSharedPtr &pSession, const LibUtilities::CommSharedPtr &vRowComm, const int nDimen, const NekSysKey &pKey)
Definition: NekLinSysIterCG.h:55

Nektar::LibUtilities::NekLinSysIter
Definition: NekLinSysIter.h:57

Nektar::LibUtilities::NekLinSysIter::v_InitObject
virtual void v_InitObject() override
Definition: NekLinSysIter.cpp:105

Nektar::LibUtilities::NekLinSysIter::m_prec_factor
NekDouble m_prec_factor
Definition: NekLinSysIter.h:113

Nektar::LibUtilities::NekLinSysIter::m_totalIterations
int m_totalIterations
Definition: NekLinSysIter.h:110

Nektar::LibUtilities::NekLinSysIter::m_rhs_magnitude
NekDouble m_rhs_magnitude
Dot product of rhs to normalise stopping criterion.
Definition: NekLinSysIter.h:108

Nektar::LibUtilities::NekLinSysIter::Set_Rhs_Magnitude
void Set_Rhs_Magnitude(const NekVector< NekDouble > &pIn)
Definition: NekLinSysIter.cpp:130

Nektar::LibUtilities::NekLinSysIter::m_map
Array< OneD, int > m_map
Global to universal unique map.
Definition: NekLinSysIter.h:105

Nektar::LibUtilities::NekSys::m_root
bool m_root
Root if parallel.
Definition: NekSys.h:306

Nektar::LibUtilities::NekSys::m_rowComm
LibUtilities::CommSharedPtr m_rowComm
Communicate.
Definition: NekSys.h:302

Nektar::LibUtilities::NekSys::m_verbose
bool m_verbose
Verbose.
Definition: NekSys.h:308

Nektar::LibUtilities::NekSys::m_tolerance
NekDouble m_tolerance
Tolerance of iterative solver.
Definition: NekSys.h:300

Nektar::LibUtilities::NekSys::m_operator
NekSysOperators m_operator
Operators.
Definition: NekSys.h:311

Nektar::LibUtilities::NekSys::m_maxiter
int m_maxiter
Maximum iterations.
Definition: NekSys.h:298

Nektar::LibUtilities::NekSysKey
Definition: NekSys.h:210

Nektar::LibUtilities::NekSysOperators::DoNekSysPrecon
void DoNekSysPrecon(InArrayType &inarray, OutArrayType &outarray, const bool &flag=false) const
Definition: NekSys.h:150

Nektar::LibUtilities::NekSysOperators::DoNekSysLhsEval
void DoNekSysLhsEval(InArrayType &inarray, OutArrayType &outarray, const bool &flag=false) const
Definition: NekSys.h:143

Nektar::NekVector< NekDouble >

Nektar::LibUtilities::SessionReaderSharedPtr
std::shared_ptr< SessionReader > SessionReaderSharedPtr
Definition: SessionReader.h:115

Nektar::LibUtilities::GetNekLinSysIterFactory
NekLinSysIterFactory & GetNekLinSysIterFactory()
Definition: NekLinSysIter.cpp:50

Nektar::LibUtilities::ReduceSum
@ ReduceSum
Definition: Comm.h:68

Nektar::LibUtilities::beta
@ beta
Gauss Radau pinned at x=-1,.
Definition: PointsType.h:61

Nektar::LibUtilities::CommSharedPtr
std::shared_ptr< Comm > CommSharedPtr
Pointer to a Communicator object.
Definition: Comm.h:57

Nektar::NekConstants::kNekUnsetDouble
static const NekDouble kNekUnsetDouble
Definition: NektarUnivConsts.hpp:46

Nektar
The above copyright notice and this permission notice shall be included.
Definition: CoupledSolver.h:2

Nektar::NekDouble
double NekDouble
Definition: NektarUnivTypeDefs.hpp:43

Nektar::eWrapper
@ eWrapper
Definition: PointerWrapper.h:45

Vmath::Svtvp
void Svtvp(int n, const T alpha, const T *x, const int incx, const T *y, const int incy, T *z, const int incz)
svtvp (scalar times vector plus vector): z = alpha*x + y
Definition: Vmath.cpp:617

Vmath::Dot2
T Dot2(int n, const T *w, const T *x, const int *y)
dot2 (vector times vector times vector): z = w*x*y
Definition: Vmath.cpp:1142

Vmath::Zero
void Zero(int n, T *x, const int incx)
Zero vector.
Definition: Vmath.cpp:487

Vmath::Vcopy
void Vcopy(int n, const T *x, const int incx, T *y, const int incy)
Definition: Vmath.cpp:1191

tinysimd::sqrt
scalarT< T > sqrt(scalarT< T > in)
Definition: scalar.hpp:294