doxygen/5.0.1/_preconditioner_low_energy_8cpp_source.html

 ///////////////////////////////////////////////////////////////////////////////
 //
 // File PreconditionerLowEnergy.cpp
 //
 // For more information, please see: http://www.nektar.info
 //
 // The MIT License
 //
 // Copyright (c) 2006 Division of Applied Mathematics, Brown University (USA),
 // Department of Aeronautics, Imperial College London (UK), and Scientific
 // Computing and Imaging Institute, University of Utah (USA).
 //
 // Permission is hereby granted, free of charge, to any person obtaining a
 // copy of this software and associated documentation files (the "Software"),
 // to deal in the Software without restriction, including without limitation
 // the rights to use, copy, modify, merge, publish, distribute, sublicense,
 // and/or sell copies of the Software, and to permit persons to whom the
 // Software is furnished to do so, subject to the following conditions:
 //
 // The above copyright notice and this permission notice shall be included
 // in all copies or substantial portions of the Software.
 //
 // THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS
 // OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
 // FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
 // THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
 // LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
 // FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
 // DEALINGS IN THE SOFTWARE.
 //
 // Description: Low energy preconditioner definition
 //
 ///////////////////////////////////////////////////////////////////////////////

 #include <LibUtilities/BasicUtils/VDmathArray.hpp>
 #include <MultiRegions/PreconditionerLowEnergy.h>
 #include <MultiRegions/GlobalMatrixKey.h>
 #include <MultiRegions/GlobalLinSysIterativeStaticCond.h>
 #include <MultiRegions/GlobalLinSys.h>
 #include <LocalRegions/MatrixKey.h>
 #include <math.h>

 using namespace std;

 namespace Nektar
 {
     using namespace LibUtilities;

     namespace MultiRegions
     {
         /**
          * Registers the class with the Factory.
          */
         string PreconditionerLowEnergy::className
                 = GetPreconFactory().RegisterCreatorFunction(
                     "LowEnergyBlock",
                     PreconditionerLowEnergy::create,
                     "LowEnergy Preconditioning");

        /**
          * @class PreconditionerLowEnergy
          *
          * This class implements low energy preconditioning for the conjugate
      * gradient matrix solver.
      */

         /**
          * Constructor. Hands the linear system and the local-to-global
          * assembly map straight to the Preconditioner base class; no
          * other work is done here.
          *
          * @param plinsys       Linear system passed on to Preconditioner.
          * @param pLocToGloMap  Assembly map passed on to Preconditioner.
          */
         PreconditionerLowEnergy::PreconditionerLowEnergy(
                 const std::shared_ptr<GlobalLinSys> &plinsys,
                 const AssemblyMapSharedPtr          &pLocToGloMap)
             : Preconditioner(plinsys, pLocToGloMap)
         {}

         void PreconditionerLowEnergy::v_InitObject()
         {
             GlobalSysSolnType solvertype =
                 m_locToGloMap.lock()->GetGlobalSysSolnType();

             ASSERTL0(solvertype == eIterativeStaticCond ||
                      solvertype == ePETScStaticCond, "Solver type not valid");

             std::shared_ptr<MultiRegions::ExpList>
                 expList=((m_linsys.lock())->GetLocMat()).lock();

             m_comm = expList->GetComm();

             LocalRegions::ExpansionSharedPtr locExpansion;

             locExpansion = expList->GetExp(0);

             int nDim = locExpansion->GetShapeDimension();

             ASSERTL0(nDim==3,
                      "Preconditioner type only valid in 3D");

             //Set up block transformation matrix
             SetupBlockTransformationMatrix();

             //Sets up multiplicity map for transformation from global to local
             CreateMultiplicityMap();
     }


         /**
      * \brief Construct the low energy preconditioner from
      * \f$\mathbf{S}_{2}\f$
      *
      * \f[\mathbf{M}^{-1}=\left[\begin{array}{ccc}
      *  Diag[(\mathbf{S_{2}})_{vv}] & & \\ & (\mathbf{S}_{2})_{eb} & \\ & &
      *  (\mathbf{S}_{2})_{fb} \end{array}\right] \f]
      *
      * where \f$\mathbf{R}\f$ is the transformation matrix and
      * \f$\mathbf{S}_{2}\f$ the Schur complement of the modified basis,
      * given by
      *
      * \f[\mathbf{S}_{2}=\mathbf{R}\mathbf{S}_{1}\mathbf{R}^{T}\f]
      *
      * where \f$\mathbf{S}_{1}\f$ is the local Schur complement matrix for
      * each element.
      */
        void PreconditionerLowEnergy::v_BuildPreconditioner()
         {
             std::shared_ptr<MultiRegions::ExpList>
                 expList=((m_linsys.lock())->GetLocMat()).lock();
             LocalRegions::ExpansionSharedPtr locExpansion;
             GlobalLinSysKey linSysKey=(m_linsys.lock())->GetKey();

             int i, j, k;
             int nVerts, nEdges,nFaces;
             int eid, fid, n, cnt, nmodes, nedgemodes, nfacemodes;
             int nedgemodesloc;
             NekDouble zero = 0.0;

             int vMap1, vMap2, sign1, sign2;
             int m, v, eMap1, eMap2, fMap1, fMap2;
             int offset, globalrow, globalcol, nCoeffs;

             // Periodic information
             PeriodicMap periodicVerts;
             PeriodicMap periodicEdges;
             PeriodicMap periodicFaces;
             expList->GetPeriodicEntities(periodicVerts,periodicEdges,periodicFaces);

             //matrix storage
             MatrixStorage storage = eFULL;
             MatrixStorage vertstorage = eDIAGONAL;
             MatrixStorage blkmatStorage = eDIAGONAL;

             //local element static condensed matrices
             DNekScalBlkMatSharedPtr loc_mat;
             DNekScalMatSharedPtr    bnd_mat;

             DNekMatSharedPtr    pRSRT;

             DNekMat RS;
             DNekMat RSRT;

             auto asmMap = m_locToGloMap.lock();

             int nDirBnd      = asmMap->GetNumGlobalDirBndCoeffs();
             int nNonDirVerts = asmMap->GetNumNonDirVertexModes();

         //Vertex, edge and face preconditioner matrices
             DNekMatSharedPtr VertBlk = MemoryManager<DNekMat>::
                 AllocateSharedPtr(nNonDirVerts,nNonDirVerts,zero,vertstorage);

             Array<OneD, NekDouble> vertArray(nNonDirVerts,0.0);
             Array<OneD, long> VertBlockToUniversalMap(nNonDirVerts,-1);

             //maps for different element types
             int n_exp = expList->GetNumElmts();
             int nNonDirEdgeIDs=asmMap->GetNumNonDirEdges();
             int nNonDirFaceIDs=asmMap->GetNumNonDirFaces();

             set<int> edgeDirMap;
             set<int> faceDirMap;
             map<int,int> uniqueEdgeMap;
             map<int,int> uniqueFaceMap;

             //this should be of size total number of local edges + faces
             Array<OneD, int> modeoffset(1 +  nNonDirEdgeIDs + nNonDirFaceIDs,0);
             Array<OneD, int> globaloffset(1 + nNonDirEdgeIDs + nNonDirFaceIDs,0);

             const Array<OneD, const ExpListSharedPtr>& bndCondExp = expList->GetBndCondExpansions();
             LocalRegions::Expansion2DSharedPtr bndCondFaceExp;
             const Array<OneD, const SpatialDomains::BoundaryConditionShPtr>&
         bndConditions = expList->GetBndConditions();

             int meshVertId;
             int meshEdgeId;
             int meshFaceId;

             const Array<OneD, const int> &extradiredges
                 = asmMap->GetExtraDirEdges();
             for(i=0; i<extradiredges.num_elements(); ++i)
             {
                 meshEdgeId=extradiredges[i];
                 edgeDirMap.insert(meshEdgeId);
             }

             //Determine which boundary edges and faces have dirichlet values
             for(i = 0; i < bndCondExp.num_elements(); i++)
             {
                 cnt = 0;
                 for(j = 0; j < bndCondExp[i]->GetNumElmts(); j++)
                 {
                     bndCondFaceExp = std::dynamic_pointer_cast<
                     LocalRegions::Expansion2D>(bndCondExp[i]->GetExp(j));
                     if (bndConditions[i]->GetBoundaryConditionType() ==
                         SpatialDomains::eDirichlet)
                     {
                         for(k = 0; k < bndCondFaceExp->GetNedges(); k++)
                         {
                             meshEdgeId = bndCondFaceExp->as<LocalRegions::Expansion2D>()->GetGeom2D()->GetEid(k);
                             if(edgeDirMap.count(meshEdgeId) == 0)
                             {
                                 edgeDirMap.insert(meshEdgeId);
                             }
                         }
                         meshFaceId = bndCondFaceExp->as<LocalRegions::Expansion2D>()->GetGeom2D()->GetGlobalID();
                         faceDirMap.insert(meshFaceId);
                     }
                 }
             }

             int dof=0;
             int maxFaceDof=0;
             int maxEdgeDof=0;
             int nlocalNonDirEdges=0;
             int nlocalNonDirFaces=0;
             int ntotalentries=0;

             map<int,int> EdgeSize;
             map<int,int> FaceSize;
             map<int,pair<int,int> >FaceModes;

             /// -  Count  edges, face and add up min edges and min face sizes
             for(n = 0; n < n_exp; ++n)
             {
                 locExpansion = expList->GetExp(n);

                 nEdges = locExpansion->GetNedges();
                 for(j = 0; j < nEdges; ++j)
                 {
                     int nEdgeInteriorCoeffs = locExpansion->GetEdgeNcoeffs(j) - 2;
                     meshEdgeId = locExpansion->as<LocalRegions::Expansion3D>()
                         ->GetGeom3D()->GetEid(j);
                     if(EdgeSize.count(meshEdgeId) == 0)
                     {
                         EdgeSize[meshEdgeId] = nEdgeInteriorCoeffs;
                     }
                     else
                     {
                         EdgeSize[meshEdgeId] = min(EdgeSize[meshEdgeId],
                                                    nEdgeInteriorCoeffs);
                     }
                 }

                 nFaces = locExpansion->GetNfaces();
                 for(j = 0; j < nFaces; ++j)
                 {
                     int nFaceInteriorCoeffs = locExpansion->GetFaceIntNcoeffs(j);
                     meshFaceId = locExpansion->as<LocalRegions::Expansion3D>()
                         ->GetGeom3D()->GetFid(j);
                     if(FaceSize.count(meshFaceId) == 0)
                     {
                         FaceSize[meshFaceId] = nFaceInteriorCoeffs;

                         int m0,m1;
                         locExpansion->GetFaceNumModes(j,locExpansion->GetForient(j),m0,m1);
                         FaceModes[meshFaceId] = pair<int,int>(m0,m1);
                     }
                     else
                     {
                         if(nFaceInteriorCoeffs < FaceSize[meshFaceId])
                         {
                             FaceSize[meshFaceId] =  nFaceInteriorCoeffs;
                             int m0,m1;
                             locExpansion->GetFaceNumModes(j,locExpansion->GetForient(j),m0,m1);
                             FaceModes[meshFaceId] = pair<int,int>(m0,m1);
                         }
                     }
                 }
             }

             bool verbose =
                 expList->GetSession()->DefinesCmdLineArgument("verbose");

             // For parallel runs need to check have minimum of edges and faces over
             // partition boundaries
             if(m_comm->GetSize() > 1)
             {
                 int EdgeSizeLen = EdgeSize.size();
                 int FaceSizeLen = FaceSize.size();
                 Array<OneD, long>      FacetMap(EdgeSizeLen+FaceSizeLen,-1);
                 Array<OneD, NekDouble> FacetLen(EdgeSizeLen+FaceSizeLen,-1);

                 map<int,int>::iterator it;

                 cnt = 0;
                 int maxid = 0;
                 for(it = EdgeSize.begin(); it!=EdgeSize.end(); ++it,++cnt)
                 {
                     FacetMap[cnt] = it->first;
                     maxid = max(it->first,maxid);
                     FacetLen[cnt] = it->second;
                 }
                 maxid++;

                 m_comm->AllReduce(maxid,ReduceMax);

                 for(it = FaceSize.begin(); it!=FaceSize.end(); ++it,++cnt)
                 {
                     FacetMap[cnt] = it->first + maxid;
                     FacetLen[cnt] = it->second;
                 }

                 //Exchange edge and face sizes across processes, keeping the minimum
                 Gs::gs_data *tmp = Gs::Init(FacetMap, m_comm, verbose);
                 Gs::Gather(FacetLen, Gs::gs_min, tmp);

                 cnt = 0;
                 for(it = EdgeSize.begin(); it!=EdgeSize.end(); ++it,++cnt)
                 {
                     it->second = (int) FacetLen[cnt];
                 }

                 for(it = FaceSize.begin(); it!=FaceSize.end(); ++it,++cnt)
                 {
                     it->second = (int)FacetLen[cnt];
                 }
             }

             // Loop over all the elements in the domain and compute total edge
             // DOF and set up unique ordering.
             map<int,int> nblks;
             int matrixlocation = 0;

             // First do periodic edges
             for (auto &pIt : periodicEdges)
             {
                 meshEdgeId = pIt.first;

                 if(edgeDirMap.count(meshEdgeId)==0)
                 {
                     dof = EdgeSize[meshEdgeId];
                     if(uniqueEdgeMap.count(meshEdgeId)==0 && dof > 0)
                     {
                         bool SetUpNewEdge = true;


                         for (i = 0; i < pIt.second.size(); ++i)
                         {
                             if (!pIt.second[i].isLocal)
                             {
                                 continue;
                             }

                             int meshEdgeId2 = pIt.second[i].id;
                             if(edgeDirMap.count(meshEdgeId2)==0)
                             {
                                 if(uniqueEdgeMap.count(meshEdgeId2)!=0)
                                 {
                                     // set unique map to same location
                                     uniqueEdgeMap[meshEdgeId] =
                                         uniqueEdgeMap[meshEdgeId2];
                                     SetUpNewEdge = false;
                                 }
                             }
                             else
                             {
                                 edgeDirMap.insert(meshEdgeId);
                                 SetUpNewEdge = false;
                             }
                         }

                         if(SetUpNewEdge)
                         {
                             uniqueEdgeMap[meshEdgeId]=matrixlocation;
                             globaloffset[matrixlocation]+=ntotalentries;
                             modeoffset[matrixlocation]=dof*dof;
                             ntotalentries+=dof*dof;
                             nblks [matrixlocation++]  = dof;
                         }
                     }
                 }
             }

             for(cnt=n=0; n < n_exp; ++n)
             {
                 locExpansion = expList->GetExp(n);

                 for (j = 0; j < locExpansion->GetNedges(); ++j)
                 {
                     meshEdgeId = locExpansion->as<LocalRegions::Expansion3D>()->GetGeom3D()->GetEid(j);
                     dof    = EdgeSize[meshEdgeId];
                     maxEdgeDof = (dof > maxEdgeDof ? dof : maxEdgeDof);

                     if(edgeDirMap.count(meshEdgeId)==0)
                     {
                         if(uniqueEdgeMap.count(meshEdgeId)==0 && dof > 0)

                         {
                             uniqueEdgeMap[meshEdgeId]=matrixlocation;

                             globaloffset[matrixlocation]+=ntotalentries;
                             modeoffset[matrixlocation]=dof*dof;
                             ntotalentries+=dof*dof;
                             nblks[matrixlocation++]   = dof;
                         }
                         nlocalNonDirEdges+=dof*dof;
                     }
                 }
             }

             // Loop over all the elements in the domain and compute max face
             // DOF. Reduce across all processes to get universal maximum.
             // - Periodic faces
             for (auto &pIt : periodicFaces)
             {
                 meshFaceId = pIt.first;

                 if(faceDirMap.count(meshFaceId)==0)
                 {
                     dof = FaceSize[meshFaceId];

                     if(uniqueFaceMap.count(meshFaceId) == 0 && dof > 0)
                     {
                         bool SetUpNewFace = true;

                         if(pIt.second[0].isLocal)
                         {
                             int meshFaceId2 = pIt.second[0].id;

                             if(faceDirMap.count(meshFaceId2)==0)
                             {
                                 if(uniqueFaceMap.count(meshFaceId2)!=0)
                                 {
                                     // set unique map to same location
                                     uniqueFaceMap[meshFaceId] =
                                         uniqueFaceMap[meshFaceId2];
                                     SetUpNewFace = false;
                                 }
                             }
                             else // set face to be a Dirichlet face
                             {
                                 faceDirMap.insert(meshFaceId);
                                 SetUpNewFace = false;
                             }
                         }

                         if(SetUpNewFace)
                         {
                             uniqueFaceMap[meshFaceId]=matrixlocation;

                             modeoffset[matrixlocation]=dof*dof;
                             globaloffset[matrixlocation]+=ntotalentries;
                             ntotalentries+=dof*dof;
                             nblks[matrixlocation++] = dof;
                         }
                     }
                 }
             }

             for(cnt=n=0; n < n_exp; ++n)
             {
                 locExpansion = expList->GetExp(n);

                 for (j = 0; j < locExpansion->GetNfaces(); ++j)
                 {
                     meshFaceId = locExpansion->as<LocalRegions::Expansion3D>()->
                         GetGeom3D()->GetFid(j);

                     dof        = FaceSize[meshFaceId];
                     maxFaceDof = (dof > maxFaceDof ? dof : maxFaceDof);

                     if(faceDirMap.count(meshFaceId)==0)
                     {
                         if(uniqueFaceMap.count(meshFaceId)==0 && dof > 0)
                         {
                             uniqueFaceMap[meshFaceId]=matrixlocation;
                             modeoffset[matrixlocation]=dof*dof;
                             globaloffset[matrixlocation]+=ntotalentries;
                             ntotalentries+=dof*dof;
                             nblks[matrixlocation++] = dof;
                         }
                         nlocalNonDirFaces+=dof*dof;
                     }
                 }
             }

             m_comm->AllReduce(maxEdgeDof, ReduceMax);
             m_comm->AllReduce(maxFaceDof, ReduceMax);

             //Allocate arrays for block to universal map (number of expansions * p^2)
             Array<OneD, long> BlockToUniversalMap(ntotalentries,-1);
             Array<OneD, int> localToGlobalMatrixMap(nlocalNonDirEdges +
                                                     nlocalNonDirFaces,-1);

             //Allocate arrays to store matrices (number of expansions * p^2)
             Array<OneD, NekDouble> BlockArray(nlocalNonDirEdges +
                                               nlocalNonDirFaces,0.0);

             int matrixoffset=0;
             int vGlobal;
             int uniEdgeOffset = 0;

             // Need to obtain a fixed offset for the universal number
             // of the faces which come after the edge numbering
             for(n=0; n < n_exp; ++n)
             {
                 for(j = 0; j < locExpansion->GetNedges(); ++j)
                 {
                     meshEdgeId = locExpansion->as<LocalRegions::Expansion3D>()
                         ->GetGeom3D()->GetEid(j);

                     uniEdgeOffset = max(meshEdgeId, uniEdgeOffset);
                 }
             }
             uniEdgeOffset++;

             m_comm->AllReduce(uniEdgeOffset,ReduceMax);
             uniEdgeOffset = uniEdgeOffset*maxEdgeDof*maxEdgeDof;

             for(n=0; n < n_exp; ++n)
             {
                 locExpansion = expList->GetExp(n);

                 //loop over the edges of the expansion
                 for(j = 0; j < locExpansion->GetNedges(); ++j)
                 {
                     //get mesh edge id
                     meshEdgeId = locExpansion->as<LocalRegions::Expansion3D>()
                         ->GetGeom3D()->GetEid(j);

                     nedgemodes = EdgeSize[meshEdgeId];

                     if(edgeDirMap.count(meshEdgeId)==0 && nedgemodes > 0)
                     {
                         // Determine the Global edge offset
                         int edgeOffset = globaloffset[uniqueEdgeMap[meshEdgeId]];

                         // Determine a universal map offset
                         int uniOffset = meshEdgeId;
                         auto pIt = periodicEdges.find(meshEdgeId);
                         if (pIt != periodicEdges.end())
                         {
                             for (int l = 0; l < pIt->second.size(); ++l)
                             {
                                 uniOffset = min(uniOffset, pIt->second[l].id);
                             }
                         }
                         uniOffset = uniOffset*maxEdgeDof*maxEdgeDof;

                         for(k=0; k<nedgemodes*nedgemodes; ++k)
                         {
                             vGlobal=edgeOffset+k;
                             localToGlobalMatrixMap[matrixoffset+k]=vGlobal;
                             BlockToUniversalMap[vGlobal] = uniOffset + k + 1;
                         }
                         matrixoffset+=nedgemodes*nedgemodes;
                     }
                 }

                 Array<OneD, unsigned int>           faceInteriorMap;
                 Array<OneD, int>                    faceInteriorSign;
                 //loop over the faces of the expansion
                 for(j = 0; j < locExpansion->GetNfaces(); ++j)
                 {
                     //get mesh face id
                     meshFaceId = locExpansion->as<LocalRegions::Expansion3D>()
                         ->GetGeom3D()->GetFid(j);

                     nfacemodes = FaceSize[meshFaceId];

                     //Check if face has dirichlet values
                     if(faceDirMap.count(meshFaceId)==0 && nfacemodes > 0)
                     {
                         // Determine the global face offset
                         int faceOffset = globaloffset[uniqueFaceMap[meshFaceId]];
                         // Determine a universal map offset
                         int uniOffset = meshFaceId;
                         // use minimum face id when periodic
                         auto pIt = periodicFaces.find(meshFaceId);
                         if (pIt != periodicFaces.end())
                         {
                             uniOffset = min(uniOffset, pIt->second[0].id);
                         }
                         uniOffset = uniOffset * maxFaceDof * maxFaceDof;

                         for(k=0; k<nfacemodes*nfacemodes; ++k)
                         {
                             vGlobal=faceOffset+k;

                             localToGlobalMatrixMap[matrixoffset+k]
                                 = vGlobal;

                             BlockToUniversalMap[vGlobal] = uniOffset +
                                 uniEdgeOffset + k + 1;
                         }
                         matrixoffset+=nfacemodes*nfacemodes;
                     }
                 }
             }

             matrixoffset=0;

             map<int,int>::iterator it;
             Array<OneD, unsigned int> n_blks(nblks.size()+1);
             n_blks[0] = nNonDirVerts;
             for(i =1, it = nblks.begin(); it != nblks.end(); ++it)
             {
                 n_blks[i++] = it->second;
             }

             m_BlkMat = MemoryManager<DNekBlkMat>
                 ::AllocateSharedPtr(n_blks, n_blks, blkmatStorage);

             //Here we loop over the expansion and build the block low energy
             //preconditioner as well as the block versions of the transformation
             //matrices.
             for(cnt=n=0; n < n_exp; ++n)
             {
                 locExpansion = expList->GetExp(n);
                 nCoeffs=locExpansion->NumBndryCoeffs();

                 //Get correct transformation matrix for element type
                 DNekMat &R = (*m_RBlk->GetBlock(n,n));

                 pRSRT = MemoryManager<DNekMat>::AllocateSharedPtr
                     (nCoeffs, nCoeffs, zero, storage);
                 RSRT = (*pRSRT);

                 nVerts=locExpansion->GetGeom()->GetNumVerts();
                 nEdges=locExpansion->GetGeom()->GetNumEdges();
                 nFaces=locExpansion->GetGeom()->GetNumFaces();

                 //Get statically condensed matrix
                 loc_mat = (m_linsys.lock())->GetStaticCondBlock(n);

                 //Extract boundary block (elemental S1)
                 bnd_mat=loc_mat->GetBlock(0,0);

                 //offset by number of rows
                 offset = bnd_mat->GetRows();

                 DNekScalMat &S=(*bnd_mat);

                 DNekMat Sloc(nCoeffs,nCoeffs);

                 // For variable p we need to just use the active modes
                 NekDouble mask1 = 1.0;
                 NekDouble mask2 = 1.0;
                 NekDouble val;

                 for(int i = 0; i < nCoeffs; ++i)
                 {
                     if(m_signChange)
                     {
                         mask1 = (m_locToGloSignMult[cnt+i] == 0.0)? 0.0:1.0;
                     }
                     for(int j = 0; j < nCoeffs; ++j)
                     {
                         if(m_signChange)
                         {
                             mask2 = (m_locToGloSignMult[cnt+j] == 0.0)? 0.0:1.0;
                         }
                         val = S(i,j)*mask1*mask2;
                         Sloc.SetValue(i,j,val);
                     }
                 }

                 //Calculate R*S*trans(R)
                 RSRT = R*Sloc*Transpose(R);

                 //loop over vertices of the element and return the vertex map
                 //for each vertex
                 for (v=0; v<nVerts; ++v)
                 {
                     vMap1=locExpansion->GetVertexMap(v);

                     //Get vertex map
                     globalrow = asmMap->
                         GetLocalToGlobalBndMap(cnt+vMap1)-nDirBnd;

                     if(globalrow >= 0)
                     {
                         for (m=0; m<nVerts; ++m)
                         {
                             vMap2=locExpansion->GetVertexMap(m);

                             //global matrix location (without offset due to
                             //dirichlet values)
                             globalcol = asmMap->
                                 GetLocalToGlobalBndMap(cnt+vMap2)-nDirBnd;

                             //offset for dirichlet conditions
                             if (globalcol == globalrow)
                             {
                                 //modal connectivity between elements
                                 sign1 = asmMap->
                                     GetLocalToGlobalBndSign(cnt + vMap1);
                                 sign2 = asmMap->
                                     GetLocalToGlobalBndSign(cnt + vMap2);

                                 vertArray[globalrow]
                                     += sign1*sign2*RSRT(vMap1,vMap2);


                                 meshVertId = locExpansion->as<LocalRegions::Expansion3D>()->GetGeom3D()->GetVid(v);

                                 auto pIt = periodicVerts.find(meshVertId);
                                 if (pIt != periodicVerts.end())
                                 {
                                     for (k = 0; k < pIt->second.size(); ++k)
                                     {
                                         meshVertId = min(meshVertId, pIt->second[k].id);
                                     }
                                 }

                                 VertBlockToUniversalMap[globalrow]
                                     = meshVertId + 1;
                             }
                         }
                     }
                 }

                 //loop over edges of the element and return the edge map
                 for (eid=0; eid<nEdges; ++eid)
                 {

                     meshEdgeId = locExpansion->as<LocalRegions::Expansion3D>()
                         ->GetGeom3D()->GetEid(eid);


                     nedgemodes    = EdgeSize[meshEdgeId];
                     if(nedgemodes)
                     {
                         nedgemodesloc = locExpansion->GetEdgeNcoeffs(eid)-2;
                         DNekMatSharedPtr m_locMat =
                             MemoryManager<DNekMat>::AllocateSharedPtr
                             (nedgemodes,nedgemodes,zero,storage);

                         Array<OneD, unsigned int> edgemodearray = locExpansion->GetEdgeInverseBoundaryMap(eid);

                         if(edgeDirMap.count(meshEdgeId)==0)
                         {
                             for (v=0; v<nedgemodesloc; ++v)
                             {
                                 eMap1=edgemodearray[v];
                                 sign1 = asmMap->
                                     GetLocalToGlobalBndSign(cnt + eMap1);

                                 if(sign1 == 0)
                                 {
                                     continue;
                                 }

                                 for (m=0; m<nedgemodesloc; ++m)
                                 {
                                     eMap2=edgemodearray[m];

                                     //modal connectivity between elements
                                     sign2 = asmMap->
                                         GetLocalToGlobalBndSign(cnt + eMap2);

                                     NekDouble globalEdgeValue = sign1*sign2*RSRT(eMap1,eMap2);

                                     if(sign2 != 0)
                                     {
                                         //if(eMap1 == eMap2)
                                         BlockArray[matrixoffset+v*nedgemodes+m]=globalEdgeValue;
                                     }
                                 }
                             }
                             matrixoffset+=nedgemodes*nedgemodes;
                         }
                     }
                 }

                 //loop over faces of the element and return the face map
                 for (fid=0; fid<nFaces; ++fid)
                 {
                     meshFaceId = locExpansion->as<LocalRegions::Expansion3D>()
                         ->GetGeom3D()->GetFid(fid);

                     nfacemodes   = FaceSize[meshFaceId];
                     if(nfacemodes > 0)
                     {
                         DNekMatSharedPtr m_locMat =
                             MemoryManager<DNekMat>::AllocateSharedPtr
                             (nfacemodes,nfacemodes,zero,storage);

                         if(faceDirMap.count(meshFaceId) == 0)
                         {
                             Array<OneD, unsigned int> facemodearray;
                             StdRegions::Orientation faceOrient =
                                 locExpansion->GetForient(fid);

                             auto pIt = periodicFaces.find(meshFaceId);
                             if (pIt != periodicFaces.end())
                             {
                                 if(meshFaceId == min(meshFaceId, pIt->second[0].id))
                                 {
                                     faceOrient = DeterminePeriodicFaceOrient
                                         (faceOrient,pIt->second[0].orient);
                                 }
                             }

                             facemodearray = locExpansion->GetFaceInverseBoundaryMap
                                 (fid,faceOrient,FaceModes[meshFaceId].first,
                                  FaceModes[meshFaceId].second);

                             for (v=0; v<nfacemodes; ++v)
                             {
                                 fMap1=facemodearray[v];

                                 sign1 = asmMap->
                                     GetLocalToGlobalBndSign(cnt + fMap1);

                                 ASSERTL1(sign1 != 0,"Something is wrong since we "
                                          "shoudl only be extracting modes for "
                                          "lowest order expansion");

                                 for (m=0; m<nfacemodes; ++m)
                                 {
                                     fMap2=facemodearray[m];

                                     //modal connectivity between elements
                                     sign2 = asmMap->
                                         GetLocalToGlobalBndSign(cnt + fMap2);

                                     ASSERTL1(sign2 != 0,"Something is wrong since "
                                              "we shoudl only be extracting modes for "
                                              "lowest order expansion");

                                     // Get the face-face value from the
                                     // low energy matrix (S2)
                                     NekDouble globalFaceValue = sign1*sign2*
                                         RSRT(fMap1,fMap2);

                                     //local face value to global face value
                                     //if(fMap1 == fMap2)
                                     BlockArray[matrixoffset+v*nfacemodes+m]=
                                         globalFaceValue;
                                 }
                             }
                             matrixoffset+=nfacemodes*nfacemodes;
                         }
                     }
                 }

                 //offset for the expansion
                 cnt+=nCoeffs;
             }

             if(nNonDirVerts!=0)
             {
                 //Exchange vertex data over different processes
                 Gs::gs_data *tmp = Gs::Init(VertBlockToUniversalMap, m_comm, verbose);
                 Gs::Gather(vertArray, Gs::gs_add, tmp);

             }

             Array<OneD, NekDouble> GlobalBlock(ntotalentries,0.0);
             if(ntotalentries)
             {
                 //Assemble edge matrices of each process
                 Vmath::Assmb(BlockArray.num_elements(),
                              BlockArray,
                              localToGlobalMatrixMap,
                              GlobalBlock);
             }

             //Exchange edge & face data over different processes
             Gs::gs_data *tmp1 = Gs::Init(BlockToUniversalMap, m_comm, verbose);
             Gs::Gather(GlobalBlock, Gs::gs_add, tmp1);

             // Populate vertex block
             for (int i = 0; i < nNonDirVerts; ++i)
             {
                 VertBlk->SetValue(i,i,1.0/vertArray[i]);
             }

             //Set the first block to be the diagonal of the vertex space
             m_BlkMat->SetBlock(0,0, VertBlk);

             //Build the edge and face matrices from the vector
             DNekMatSharedPtr gmat;

             offset=0;
             // -1 since we ignore vert block
             for(int loc=0; loc<n_blks.num_elements()-1; ++loc)
             {
                 nmodes = n_blks[1+loc];
                 gmat = MemoryManager<DNekMat>::AllocateSharedPtr
                     (nmodes,nmodes,zero,storage);

                 for (v=0; v<nmodes; ++v)
                 {
                     for (m=0; m<nmodes; ++m)
                     {
                         NekDouble Value = GlobalBlock[offset+v*nmodes+m];
                         gmat->SetValue(v,m,Value);

                     }
                 }
                 m_BlkMat->SetBlock(1+loc,1+loc, gmat);
                 offset+=modeoffset[loc];
             }

             // invert blocks.
             int totblks=m_BlkMat->GetNumberOfBlockRows();
             for (i=1; i< totblks; ++i)
             {
                 unsigned int nmodes=m_BlkMat->GetNumberOfRowsInBlockRow(i);
                 if(nmodes)
                 {
                     DNekMatSharedPtr tmp_mat =
                     MemoryManager<DNekMat>::AllocateSharedPtr
                     (nmodes,nmodes,zero,storage);

                     tmp_mat=m_BlkMat->GetBlock(i,i);
                     tmp_mat->Invert();

                     m_BlkMat->SetBlock(i,i,tmp_mat);
                 }
             }
         }


         /**
          * Apply the low energy preconditioner during the conjugate gradient
          * routine
          */
         void PreconditionerLowEnergy::v_DoPreconditioner(
                 const Array<OneD, NekDouble>& pInput,
                       Array<OneD, NekDouble>& pOutput)
         {
             int nDir    = m_locToGloMap.lock()->GetNumGlobalDirBndCoeffs();
             int nGlobal = m_locToGloMap.lock()->GetNumGlobalBndCoeffs();
             int nNonDir = nGlobal-nDir;
             DNekBlkMat &M = (*m_BlkMat);

             NekVector<NekDouble> r(nNonDir,pInput,eWrapper);
             NekVector<NekDouble> z(nNonDir,pOutput,eWrapper);

             z = M * r;
     }


         /**
          * Set a block transformation matrices for each element type. These are
          * needed in routines that transform the schur complement matrix to and
          * from the low energy basis.
          */
         void PreconditionerLowEnergy::SetupBlockTransformationMatrix(void)
         {
             std::shared_ptr<MultiRegions::ExpList>
                 expList=((m_linsys.lock())->GetLocMat()).lock();
             StdRegions::StdExpansionSharedPtr locExp;
             StdRegions::StdExpansionSharedPtr locExpSav;
             map<int,int> EdgeSize;

             int n;

             std::map<ShapeType, DNekScalMatSharedPtr>         maxRmat;
             map<ShapeType, LocalRegions::ExpansionSharedPtr > maxElmt;
             map<ShapeType, Array<OneD, unsigned int> >        vertMapMaxR;
             map<ShapeType, Array<OneD, Array<OneD, unsigned int> > > edgeMapMaxR;


             //Sets up reference element and builds transformation matrix for
             // maximum polynomial order meshes
             SetUpReferenceElements(maxRmat,maxElmt,vertMapMaxR,edgeMapMaxR);

             const Array<OneD,const unsigned int>& nbdry_size
                 = m_locToGloMap.lock()->GetNumLocalBndCoeffsPerPatch();

             int n_exp=expList->GetNumElmts();

             MatrixStorage blkmatStorage = eDIAGONAL;

             //Variants of R matrices required for low energy preconditioning
             m_RBlk      = MemoryManager<DNekBlkMat>
                 ::AllocateSharedPtr(nbdry_size, nbdry_size , blkmatStorage);
             m_InvRBlk      = MemoryManager<DNekBlkMat>
                 ::AllocateSharedPtr(nbdry_size, nbdry_size , blkmatStorage);

             DNekMatSharedPtr rmat, invrmat;

             int offset = 0;

             // Set up transformation matrices whilst checking to see if
             // consecutive matrices are the same and if so reuse the
             // matrices and store how many consecutive offsets there
             // are
             for(n=0; n < n_exp; ++n)
             {
                 locExp = expList->GetExp(n);
                 ShapeType eltype = locExp->DetShapeType();

                 int nbndcoeffs = locExp->NumBndryCoeffs();

                 if(m_sameBlock.size() == 0)
                 {
                     rmat = ExtractLocMat(locExp,maxRmat[eltype],
                                          maxElmt[eltype],
                                          vertMapMaxR[eltype],
                                          edgeMapMaxR[eltype]);
                     //Block R matrix
                     m_RBlk->SetBlock(n, n, rmat);

                     invrmat = MemoryManager<DNekMat>::AllocateSharedPtr(*rmat);
                     invrmat->Invert();

                     //Block inverse R matrix
                     m_InvRBlk->SetBlock(n, n, invrmat);

                     m_sameBlock.push_back(pair<int,int>(1,nbndcoeffs));
                     locExpSav = locExp;
                 }
                 else
                 {
                     bool reuse = true;

                     // check to see if same as previous matrix and
                     // reuse if we can
                     for(int i = 0; i < 3; ++i)
                     {
                         if(locExpSav->GetBasis(i) != locExp->GetBasis(i))
                         {
                             reuse = false;
                             break;
                         }
                     }

                     if(reuse)
                     {
                         m_RBlk->SetBlock(n, n, rmat);
                         m_InvRBlk->SetBlock(n, n, invrmat);

                         m_sameBlock[offset] =
                             (pair<int,int>(m_sameBlock[offset].first+1,nbndcoeffs));
                     }
                     else
                     {
                         rmat = ExtractLocMat(locExp,maxRmat[eltype],
                                              maxElmt[eltype],
                                              vertMapMaxR[eltype],
                                              edgeMapMaxR[eltype]);

                         //Block R matrix
                         m_RBlk->SetBlock(n, n, rmat);

                         invrmat = MemoryManager<DNekMat>::AllocateSharedPtr(*rmat);
                         invrmat->Invert();
                         //Block inverse R matrix
                         m_InvRBlk->SetBlock(n, n, invrmat);

                         m_sameBlock.push_back(pair<int,int>(1,nbndcoeffs));
                         offset++;
                         locExpSav = locExp;
                     }
                 }
             }
         }

         /**
          * \brief Transform the solution vector to the low energy basis
          * (in-place variant).
          *
          * As the conjugate gradient system is solved for the low energy basis,
          * the solution vector \f$\mathbf{x}\f$ must be transformed to the low
          * energy basis i.e. \f$\overline{\mathbf{x}}=\mathbf{R}\mathbf{x}\f$.
          *
          * @param pInOut  On entry the global boundary coefficients (the first
          *                nGlobBnd entries are read). On exit the transformed
          *                non-Dirichlet values are assembled into the entries
          *                starting at \a offset.
          * @param offset  Position in \a pInOut at which the non-Dirichlet
          *                result is written.
          */
         void PreconditionerLowEnergy::v_DoTransformToLowEnergy(
                                                                Array<OneD, NekDouble>& pInOut,
                                                                int offset)
         {
             auto asmMap = m_locToGloMap.lock();

             const int nGlobBnd    = asmMap->GetNumGlobalBndCoeffs();
             const int nDirBnd     = asmMap->GetNumGlobalDirBndCoeffs();
             const int nGlobHomBnd = nGlobBnd - nDirBnd;
             const int nLocBnd     = asmMap->GetNumLocalBndCoeffs();

             // View onto the non-Dirichlet part of the caller's array; the
             // assembled result is written through this wrapper.
             Array<OneD, NekDouble> homView = pInOut + offset;
             NekVector<NekDouble> globHomVec(nGlobHomBnd, homView, eWrapper);

             // Block transformation matrix
             DNekBlkMat &R = *m_RBlk;

             // Local work arrays: gathered input and transformed output
             Array<OneD, NekDouble> locIn(nLocBnd, 0.0);
             Array<OneD, NekDouble> locOut(nLocBnd, 0.0);
             NekVector<NekDouble> locOutVec(nLocBnd, locOut, eWrapper);
             m_map = asmMap->GetLocalToGlobalBndMap();

             // Not actually needed, but work on a copy holding only the
             // global boundary coefficients
             Array<OneD,NekDouble> globCopy(nGlobBnd,0.0);
             Vmath::Vcopy(nGlobBnd, pInOut.get(), 1, globCopy.get(), 1);

             // Global boundary (including Dirichlet values) to local
             // boundary, scaled by the sign/multiplicity factors
             Vmath::Gathr(m_map.num_elements(), m_locToGloSignMult.get(),
                          globCopy.get(), m_map.get(), locIn.get());

             // Multiply by the block transformation matrix; each run of
             // identical elements is handled by a single Dgemm call
             int dofStart = 0;   // first local coefficient of the run
             int blkStart = 0;   // first element (block index) of the run
             for(const auto &run : m_sameBlock)
             {
                 const int nexp       = run.first;
                 const int nbndcoeffs = run.second;

                 Blas::Dgemm('N','N', nbndcoeffs, nexp, nbndcoeffs,
                             1.0, &(R.GetBlock(blkStart,blkStart)->GetPtr()[0]),
                             nbndcoeffs, locIn.get() + dofStart, nbndcoeffs,
                             0.0, locOut.get() + dofStart, nbndcoeffs);

                 dofStart += nbndcoeffs*nexp;
                 blkStart += nexp;
             }

             // Assemble local boundary to global non-Dirichlet dofs
             asmMap->AssembleBnd(locOutVec, globHomVec, nDirBnd);
         }

         /**
          * \brief Transform the solution vector to low energy form.
          *
          * As the conjugate gradient system is solved for the low energy basis,
          * the solution vector \f$\mathbf{x}\f$ must be transformed to the low
          * energy basis i.e. \f$\overline{\mathbf{x}}=\mathbf{R}\mathbf{x}\f$.
          *
          * @param pInput   Non-Dirichlet global boundary coefficients; must
          *                 hold at least (nGlobBnd - nDirBnd) entries.
          * @param pOutput  Receives the transformed non-Dirichlet global
          *                 boundary coefficients; must hold at least
          *                 (nGlobBnd - nDirBnd) entries.
          */
         void PreconditionerLowEnergy::v_DoTransformToLowEnergy(
                                                                const Array<OneD, NekDouble>& pInput,
                                                                Array<OneD, NekDouble>& pOutput)
         {
             auto asmMap = m_locToGloMap.lock();

             int nGlobBndDofs       = asmMap->GetNumGlobalBndCoeffs();
             int nDirBndDofs        = asmMap->GetNumGlobalDirBndCoeffs();
             int nGlobHomBndDofs    = nGlobBndDofs - nDirBndDofs;
             int nLocBndDofs        = asmMap->GetNumLocalBndCoeffs();

             //Input/output vectors must hold at least nGlobHomBndDofs
             //entries; the assertions fire when an array is too small.
             ASSERTL1(pInput.num_elements() >= nGlobHomBndDofs,
                      "Input array is smaller than nGlobHomBndDofs");
             ASSERTL1(pOutput.num_elements() >= nGlobHomBndDofs,
                      "Output array is smaller than nGlobHomBndDofs");

             //vectors of length number of non-dirichlet boundary dofs
             NekVector<NekDouble> F_HomBnd(nGlobHomBndDofs,pOutput,
                                           eWrapper);
             //Block transformation matrix
             DNekBlkMat &R = *m_RBlk;

             Array<OneD, NekDouble> pLocal(nLocBndDofs, 0.0);
             NekVector<NekDouble> F_LocBnd(nLocBndDofs,pLocal,eWrapper);
             m_map = asmMap->GetLocalToGlobalBndMap();
             Array<OneD, NekDouble> pLocalIn(nLocBndDofs, 0.0);

             // Allocate an array of size number of global boundary dofs and
             // copy the input array to the tmp array offset by Dirichlet
             // boundary conditions.
             Array<OneD,NekDouble> tmp(nGlobBndDofs,0.0);
             Vmath::Vcopy(nGlobHomBndDofs, pInput.get(), 1, tmp.get()
                          + nDirBndDofs, 1);

             //Global boundary dofs (with zeroed dirichlet values) to
             //local boundary dofs - this also scales by the
             //sign/multiplicity factors in m_locToGloSignMult
             Vmath::Gathr(m_map.num_elements(), m_locToGloSignMult.get(),
                          tmp.get(), m_map.get(), pLocalIn.get());

             //Multiply by the block transformation matrix; one Dgemm per
             //run of consecutive elements sharing the same matrix
             int cnt  = 0;  // offset of the run in the local coefficient arrays
             int cnt1 = 0;  // block index of the first element of the run
             for(const auto &run : m_sameBlock)
             {
                 const int nexp       = run.first;
                 const int nbndcoeffs = run.second;
                 Blas::Dgemm('N','N', nbndcoeffs, nexp, nbndcoeffs,
                             1.0, &(R.GetBlock(cnt1,cnt1)->GetPtr()[0]),
                             nbndcoeffs, pLocalIn.get() + cnt, nbndcoeffs,
                             0.0, pLocal.get() + cnt, nbndcoeffs);
                 cnt  += nbndcoeffs*nexp;
                 cnt1 += nexp;
             }

             //Assemble local boundary to global non-dirichlet boundary
             asmMap->AssembleBnd(F_LocBnd,F_HomBnd,nDirBndDofs);
         }

         /**
          * \brief Transform the solution vector from low energy back to the
          * original basis.
          *
          * After the conjugate gradient routine the output vector is in the low
          * energy basis and must be transformed back to the original basis in
          * order to get the correct solution out, i.e.
          * \f$\mathbf{x}=\mathbf{R^{T}}\mathbf{\overline{x}}\f$.
          *
          * @param pInOut  Global boundary coefficients; must hold at least
          *                nGlobBnd entries. Only the non-Dirichlet entries
          *                (from index nDirBnd onwards) are read and
          *                overwritten.
          */
         void PreconditionerLowEnergy::v_DoTransformFromLowEnergy(
                                                                  Array<OneD, NekDouble>& pInOut)
         {
             auto asmMap = m_locToGloMap.lock();

             int nGlobBndDofs       = asmMap->GetNumGlobalBndCoeffs();
             int nDirBndDofs        = asmMap->GetNumGlobalDirBndCoeffs();
             int nGlobHomBndDofs    = nGlobBndDofs - nDirBndDofs;
             int nLocBndDofs        = asmMap->GetNumLocalBndCoeffs();

             //The assertion fires when the array is too small to hold all
             //global boundary dofs.
             ASSERTL1(pInOut.num_elements() >= nGlobBndDofs,
                      "In/out array is smaller than nGlobBndDofs");

             //Block  transformation matrix
             DNekBlkMat &R = *m_RBlk;

             Array<OneD, NekDouble> tmpOffset = pInOut + nDirBndDofs;
             NekVector<NekDouble> V_GlobHomBnd(nGlobHomBndDofs, tmpOffset, eWrapper);

             Array<OneD, NekDouble> pLocalIn(nLocBndDofs, 0.0);
             NekVector<NekDouble> V_LocBnd(nLocBndDofs,pLocalIn,eWrapper);
             m_map = asmMap->GetLocalToGlobalBndMap();
             Array<OneD,NekDouble> tmp(nGlobBndDofs,0.0);
             Array<OneD, NekDouble> pLocal(nLocBndDofs, 0.0);

             //Global boundary (less dirichlet) to local boundary
             asmMap->GlobalToLocalBnd(V_GlobHomBnd,V_LocBnd, nDirBndDofs);

             //Multiply by the transpose of block transformation matrix; one
             //Dgemm per run of consecutive elements sharing the same matrix
             int cnt  = 0;  // offset of the run in the local coefficient arrays
             int cnt1 = 0;  // block index of the first element of the run
             for(const auto &run : m_sameBlock)
             {
                 const int nexp       = run.first;
                 const int nbndcoeffs = run.second;
                 Blas::Dgemm('T','N', nbndcoeffs, nexp, nbndcoeffs,
                             1.0, &(R.GetBlock(cnt1,cnt1)->GetPtr()[0]),
                             nbndcoeffs, pLocalIn.get() + cnt, nbndcoeffs,
                             0.0, pLocal.get() + cnt, nbndcoeffs);
                 cnt  += nbndcoeffs*nexp;
                 cnt1 += nexp;
             }

             //Assemble local boundary to global boundary, scaling each local
             //contribution by its sign/multiplicity factor
             Vmath::Assmb(nLocBndDofs, m_locToGloSignMult.get(),pLocal.get(), m_map.get(), tmp.get());

             //Universal assemble across processors
             asmMap->UniversalAssembleBnd(tmp);

             //copy non-dirichlet boundary values
             Vmath::Vcopy(nGlobBndDofs-nDirBndDofs, tmp.get() + nDirBndDofs, 1, pInOut.get() + nDirBndDofs, 1);
         }

         /**
          * \brief Multiply by the block inverse transformation matrix
          *
          * @param pInput   Non-Dirichlet global boundary coefficients; must
          *                 hold at least (nGlobBnd - nDirBnd) entries.
          * @param pOutput  Receives the assembled non-Dirichlet result; must
          *                 hold at least (nGlobBnd - nDirBnd) entries.
          */
         void PreconditionerLowEnergy::v_DoMultiplybyInverseTransformationMatrix(
                                                                                 const Array<OneD, NekDouble>& pInput,
                                                                                 Array<OneD, NekDouble>& pOutput)
         {
             auto asmMap = m_locToGloMap.lock();

             int nGlobBndDofs       = asmMap->GetNumGlobalBndCoeffs();
             int nDirBndDofs        = asmMap->GetNumGlobalDirBndCoeffs();
             int nGlobHomBndDofs    = nGlobBndDofs - nDirBndDofs;
             int nLocBndDofs        = asmMap->GetNumLocalBndCoeffs();

             //The assertions fire when an array is too small.
             ASSERTL1(pInput.num_elements() >= nGlobHomBndDofs,
                      "Input array is smaller than nGlobHomBndDofs");
             ASSERTL1(pOutput.num_elements() >= nGlobHomBndDofs,
                      "Output array is smaller than nGlobHomBndDofs");

             //wrapper of length number of non-dirichlet boundary dofs
             //around the output storage
             NekVector<NekDouble> F_HomBnd(nGlobHomBndDofs,pOutput,
                                           eWrapper);
             //Block inverse transformation matrix
             DNekBlkMat &invR = *m_InvRBlk;

             Array<OneD, NekDouble> pLocal(nLocBndDofs, 0.0);
             NekVector<NekDouble> F_LocBnd(nLocBndDofs,pLocal,eWrapper);
             m_map = asmMap->GetLocalToGlobalBndMap();
             Array<OneD, NekDouble> pLocalIn(nLocBndDofs, 0.0);

             // Allocate an array of size number of global boundary dofs and
             // copy the input array to the tmp array offset by Dirichlet
             // boundary conditions.
             Array<OneD,NekDouble> tmp(nGlobBndDofs,0.0);
             Vmath::Vcopy(nGlobHomBndDofs, pInput.get(), 1, tmp.get() + nDirBndDofs, 1);

             //Global boundary dofs (with zeroed dirichlet values) to
             //local boundary dofs, scaled by the sign/multiplicity factors
             Vmath::Gathr(m_map.num_elements(), m_locToGloSignMult.get(),
                          tmp.get(), m_map.get(), pLocalIn.get());

             //Multiply by the inverse transformation matrix; one Dgemm per
             //run of consecutive elements sharing the same matrix
             int cnt  = 0;  // offset of the run in the local coefficient arrays
             int cnt1 = 0;  // block index of the first element of the run
             for(const auto &run : m_sameBlock)
             {
                 const int nexp       = run.first;
                 const int nbndcoeffs = run.second;
                 Blas::Dgemm('N','N', nbndcoeffs, nexp, nbndcoeffs,
                             1.0, &(invR.GetBlock(cnt1,cnt1)->GetPtr()[0]),
                             nbndcoeffs, pLocalIn.get() + cnt, nbndcoeffs,
                             0.0, pLocal.get() + cnt, nbndcoeffs);
                 cnt  += nbndcoeffs*nexp;
                 cnt1 += nexp;
             }

             //Assemble local boundary to global non-dirichlet boundary
             asmMap->AssembleBnd(F_LocBnd,F_HomBnd,nDirBndDofs);
         }

         /**
          * \brief Multiply by the block transposed inverse transformation matrix
          *
          * @param pInput   Non-Dirichlet global boundary coefficients; must
          *                 hold at least (nGlobBnd - nDirBnd) entries.
          * @param pOutput  Receives the assembled result scaled entry-wise by
          *                 m_multiplicity; must hold at least
          *                 (nGlobBnd - nDirBnd) entries.
          */
         void PreconditionerLowEnergy::v_DoMultiplybyInverseTransposedTransformationMatrix(
                                                                                           const Array<OneD, NekDouble>& pInput,
                                                                                           Array<OneD, NekDouble>& pOutput)
         {
             auto asmMap = m_locToGloMap.lock();

             int nGlobBndDofs       = asmMap->GetNumGlobalBndCoeffs();
             int nDirBndDofs        = asmMap->GetNumGlobalDirBndCoeffs();
             int nGlobHomBndDofs    = nGlobBndDofs - nDirBndDofs;
             int nLocBndDofs        = asmMap->GetNumLocalBndCoeffs();

             //The assertions fire when an array is too small.
             ASSERTL1(pInput.num_elements() >= nGlobHomBndDofs,
                      "Input array is smaller than nGlobHomBndDofs");
             ASSERTL1(pOutput.num_elements() >= nGlobHomBndDofs,
                      "Output array is smaller than nGlobHomBndDofs");

             //Block inverse transformation matrix
             DNekBlkMat &invR = *m_InvRBlk;

             Array<OneD, NekDouble> pLocalIn(nLocBndDofs, 0.0);
             m_map = asmMap->GetLocalToGlobalBndMap();
             Array<OneD, NekDouble> pLocal(nLocBndDofs, 0.0);

             //Global boundary (less dirichlet) to local boundary
             asmMap->GlobalToLocalBnd(pInput,pLocalIn, nDirBndDofs);

             //Multiply by the transpose of the block inverse transformation
             //matrix; one Dgemm per run of consecutive elements sharing the
             //same matrix
             int cnt  = 0;  // offset of the run in the local coefficient arrays
             int cnt1 = 0;  // block index of the first element of the run
             for(const auto &run : m_sameBlock)
             {
                 const int nexp       = run.first;
                 const int nbndcoeffs = run.second;
                 Blas::Dgemm('T','N', nbndcoeffs, nexp, nbndcoeffs,
                             1.0, &(invR.GetBlock(cnt1,cnt1)->GetPtr()[0]),
                             nbndcoeffs, pLocalIn.get() + cnt, nbndcoeffs,
                             0.0, pLocal.get() + cnt, nbndcoeffs);
                 cnt  += nbndcoeffs*nexp;
                 cnt1 += nexp;
             }

             //Assemble local boundary to global non-dirichlet boundary
             asmMap->AssembleBnd(pLocal,pOutput, nDirBndDofs);

             //Scale each assembled entry by the inverse multiplicity
             Vmath::Vmul(nGlobHomBndDofs,pOutput,1,m_multiplicity,1,pOutput,1);
         }


         /**
          * \brief Set up the transformed block  matrix system
          *
          * Builds, for element \a n, the low energy equivalent of its local
          * Schur complement block,
          * i.e. \f$\mathbf{S}_{2}=\mathbf{R}\mathbf{S}_{1}\mathbf{R}^{T}\f$
          *
          * @param n          Element index; selects the R block and the
          *                   expansion giving the number of boundary modes.
          * @param bndoffset  Offset of this element's first boundary mode in
          *                   m_locToGloSignMult.
          * @param loc_mat    Original Schur complement \f$\mathbf{S}_{1}\f$.
          * @return           Scaled-matrix wrapper (scale 1.0) around
          *                   \f$\mathbf{S}_{2}\f$.
          */
         DNekScalMatSharedPtr PreconditionerLowEnergy::
         v_TransformedSchurCompl( int n,
                                  int bndoffset,
                                  const std::shared_ptr<DNekScalMat > &loc_mat)
         {
             std::shared_ptr<MultiRegions::ExpList>
                 expList=((m_linsys.lock())->GetLocMat()).lock();

             const unsigned int nbnd = expList->GetExp(n)->NumBndryCoeffs();

             // Transformation matrix of this element and the original
             // Schur complement
             DNekMat     &R  = (*m_RBlk->GetBlock(n,n));
             DNekScalMat &S1 = (*loc_mat);

             // For variable p only the active modes are used: a mode whose
             // sign/multiplicity entry is zero is masked out. Without sign
             // changes every mode is active.
             auto modeMask = [&](unsigned int k) -> NekDouble
             {
                 if(!m_signChange)
                 {
                     return 1.0;
                 }
                 return (m_locToGloSignMult[bndoffset+k] == 0.0)? 0.0:1.0;
             };

             // Masked copy of the Schur complement
             DNekMat Sloc(nbnd,nbnd);
             for(unsigned int row = 0; row < nbnd; ++row)
             {
                 const NekDouble rowMask = modeMask(row);
                 for(unsigned int col = 0; col < nbnd; ++col)
                 {
                     const NekDouble colMask = modeMask(col);
                     Sloc.SetValue(row,col,S1(row,col)*rowMask*colMask);
                 }
             }

             //create low energy matrix
             DNekMatSharedPtr pS2 = MemoryManager<DNekMat>::
                 AllocateSharedPtr(nbnd,nbnd,0.0,eFULL);
             (*pS2) = R*Sloc*Transpose(R);

             return MemoryManager<DNekScalMat>::AllocateSharedPtr(1.0, pS2);
         }

         /**
          * Create the inverse multiplicity map.
          */
         void PreconditionerLowEnergy::CreateMultiplicityMap(void)
         {
             auto asmMap = m_locToGloMap.lock();

             unsigned int nGlobalBnd = asmMap->GetNumGlobalBndCoeffs();
             unsigned int nEntries   = asmMap->GetNumLocalBndCoeffs();
             unsigned int i;

             const Array<OneD, const int> &vMap
                 = asmMap->GetLocalToGlobalBndMap();

             const Array< OneD, const NekDouble > &sign
                 = asmMap->GetLocalToGlobalBndSign();

             m_signChange=asmMap->GetSignChange();

             // Count the multiplicity of each global DOF on this process
             Array<OneD, NekDouble> vCounts(nGlobalBnd, 0.0);
             if(m_signChange)
             {
                 for (i = 0; i < nEntries; ++i)
                 {
                     if(fabs(sign[i]) > 0.0)
                     {
                         vCounts[vMap[i]] += 1.0;
                     }
                     else // set zero modes to 1 so inverse below does not cause problems
                     {
                         vCounts[vMap[i]] = 1.0;
                     }
                 }
             }
             else
             {
                 for (i = 0; i < nEntries; ++i)
                 {
                     vCounts[vMap[i]] += 1.0;
                 }
             }

             // Get universal multiplicity by globally assembling counts
             asmMap->UniversalAssembleBnd(vCounts);

             // Construct a map of 1/multiplicity
             m_locToGloSignMult = Array<OneD, NekDouble>(nEntries);
             for (i = 0; i < nEntries; ++i)
             {
                 if(m_signChange)
                 {
                     m_locToGloSignMult[i] = sign[i]*1.0/vCounts[vMap[i]];
                 }
                 else
                 {
                     m_locToGloSignMult[i] = 1.0/vCounts[vMap[i]];
                 }
             }

             int nDirBnd     = asmMap->GetNumGlobalDirBndCoeffs();
             int nGlobHomBnd = nGlobalBnd - nDirBnd;
             int nLocBnd     = asmMap->GetNumLocalBndCoeffs();

             //Set up multiplicity array for inverse transposed transformation matrix
             Array<OneD,NekDouble> tmp(nGlobHomBnd,1.0);
             m_multiplicity = Array<OneD,NekDouble>(nGlobHomBnd,1.0);
             Array<OneD,NekDouble> loc(nLocBnd,1.0);

             asmMap->GlobalToLocalBnd(tmp,loc, nDirBnd);
             asmMap->AssembleBnd(loc,m_multiplicity, nDirBnd);
             Vmath::Sdiv(nGlobHomBnd,1.0,m_multiplicity,1,m_multiplicity,1);

         }

         /**
          *\brief Sets up the reference prismatic element needed to construct
          *a low energy basis
          *
          * The prism is assembled bottom-up: six vertices, nine edges joining
          * them, then five faces (three quadrilaterals and two triangles)
          * built from those edges.
          *
          * @return Shared pointer to the prism geometry with id 0.
          */
         SpatialDomains::PrismGeomSharedPtr PreconditionerLowEnergy::CreateRefPrismGeom()
         {
             //////////////////////////
             // Set up Prism element //
             //////////////////////////

             const int coordDim = 3;
             const int nVerts   = 6;
             const double coords[][3] = {
                 {-1,-1,0}, {1,-1,0}, {1,1,0},
                 {-1,1,0}, {0,-1,sqrt(double(3))}, {0,1,sqrt(double(3))},
             };

             // Vertices, numbered in the order of the coordinate table
             SpatialDomains::PointGeomSharedPtr verts[6];
             for(int v = 0; v < nVerts; ++v)
             {
                 verts[v] = MemoryManager<SpatialDomains::PointGeom>::AllocateSharedPtr
                     ( coordDim, v, coords[v][0], coords[v][1], coords[v][2] );
             }

             // Each edge is given by its two end vertices
             const int nEdges = 9;
             const int edgeVerts[][2] = {
                 {0,1}, {1,2}, {3,2}, {0,3}, {0,4},
                 {1,4}, {2,5}, {3,5}, {4,5}
             };

             // Populate the list of edges
             SpatialDomains::SegGeomSharedPtr edges[nEdges];
             for(int e = 0; e < nEdges; ++e)
             {
                 SpatialDomains::PointGeomSharedPtr endPoints[2];
                 endPoints[0] = verts[edgeVerts[e][0]];
                 endPoints[1] = verts[edgeVerts[e][1]];
                 edges[e] = MemoryManager<SpatialDomains::SegGeom>::AllocateSharedPtr(e, coordDim, endPoints);
             }

             ////////////////////////
             // Set up Prism faces //
             ////////////////////////

             const int nFaces = 5;

             // Edges of the quadrilateral faces: base face 0 and the
             // vertical quad faces 2 and 4
             const int quadEdges[][4] = { {0,1,2,3}, {1,6,8,5}, {3,7,8,4} };
             // Row of quadEdges used by each face, -1 for triangular faces
             const int quadRow[] = { 0,-1,1,-1,2 };

             // Edges of the triangular side faces 1 and 3
             const int triEdges[][3] = { {0,5,4}, {2,6,7} };
             // Row of triEdges used by each face, -1 for quadrilateral faces
             const int triRow[] = { -1,0,-1,1,-1 };

             // Populate the list of faces
             SpatialDomains::Geometry2DSharedPtr faces[nFaces];
             for(int f = 0; f < nFaces; ++f)
             {
                 if(triRow[f] >= 0)
                 {
                     // Faces 1 and 3 are triangles
                     const int row = triRow[f];
                     SpatialDomains::SegGeomSharedPtr faceEdges[3];
                     for(int k = 0; k < 3; ++k)
                     {
                         faceEdges[k] = edges[triEdges[row][k]];
                     }
                     faces[f] = MemoryManager<SpatialDomains::TriGeom>::AllocateSharedPtr(f, faceEdges);
                 }
                 else
                 {
                     // Faces 0, 2 and 4 are quadrilaterals
                     const int row = quadRow[f];
                     SpatialDomains::SegGeomSharedPtr faceEdges[4];
                     for(int k = 0; k < 4; ++k)
                     {
                         faceEdges[k] = edges[quadEdges[row][k]];
                     }
                     faces[f] = MemoryManager<SpatialDomains::QuadGeom>::AllocateSharedPtr(f, faceEdges);
                 }
             }

             return MemoryManager<SpatialDomains::PrismGeom>::AllocateSharedPtr(0, faces);
         }

         /**
          * \brief Builds the reference pyramid geometry used to construct the
          * low energy basis mapping arrays.
          *
          * The geometry is assembled bottom-up: five vertices, the eight
          * edges joining them, the quadrilateral base (face 0) followed by
          * the four triangular side faces (faces 1 to 4), and finally the
          * pyramid itself, which is given id 0.
          *
          * \return Shared pointer to the newly allocated pyramid geometry.
          */
         SpatialDomains::PyrGeomSharedPtr PreconditionerLowEnergy::CreateRefPyrGeom()
         {
             // Coordinate dimension handed to every vertex and edge.
             const int coordDim = 3;

             /////////////////////////////
             // Set up Pyramid vertices //
             /////////////////////////////

             const int nVerts = 5;
             const double coords[][3] = {
                 {-1,-1,0}, {1,-1,0}, {1,1,0},
                 {-1,1,0}, {0,0,sqrt(double(2))}
             };

             SpatialDomains::PointGeomSharedPtr verts[nVerts];
             for(int v = 0; v < nVerts; ++v)
             {
                 verts[v] = MemoryManager<SpatialDomains::PointGeom>::
                     AllocateSharedPtr(coordDim, v, coords[v][0],
                                       coords[v][1], coords[v][2]);
             }

             //////////////////////////
             // Set up Pyramid edges //
             //////////////////////////

             const int nEdges = 8;
             // Pair of vertex ids bounding each edge
             const int edgeVerts[][2] = {
                 {0,1}, {1,2}, {2,3}, {3,0},
                 {0,4}, {1,4}, {2,4}, {3,4}
             };

             SpatialDomains::SegGeomSharedPtr edges[nEdges];
             for(int e = 0; e < nEdges; ++e)
             {
                 SpatialDomains::PointGeomSharedPtr endPoints[2] = {
                     verts[edgeVerts[e][0]], verts[edgeVerts[e][1]]
                 };
                 edges[e] = MemoryManager<SpatialDomains::SegGeom>::
                     AllocateSharedPtr(e, coordDim, endPoints);
             }

             //////////////////////////
             // Set up Pyramid faces //
             //////////////////////////

             const int nFaces = 5;
             // Edge ids bounding the quadrilateral base (face 0)
             const int baseEdges[4]  = {0,1,2,3};
             // Edge ids bounding the triangular side faces (faces 1 to 4)
             const int triEdges[][3] = { {0,5,4}, {1,6,5}, {2,7,6}, {3,4,7} };

             SpatialDomains::Geometry2DSharedPtr faces[nFaces];

             // Face 0: quadrilateral base
             {
                 const int baseId = 0;
                 SpatialDomains::SegGeomSharedPtr faceEdges[4] = {
                     edges[baseEdges[0]], edges[baseEdges[1]],
                     edges[baseEdges[2]], edges[baseEdges[3]]
                 };
                 faces[baseId] = MemoryManager<SpatialDomains::QuadGeom>::
                     AllocateSharedPtr(baseId, faceEdges);
             }

             // Faces 1 to 4: triangular sides
             for(int f = 1; f < nFaces; ++f)
             {
                 const int *conn = triEdges[f-1];
                 SpatialDomains::SegGeomSharedPtr faceEdges[3] = {
                     edges[conn[0]], edges[conn[1]], edges[conn[2]]
                 };
                 faces[f] = MemoryManager<SpatialDomains::TriGeom>::
                     AllocateSharedPtr(f, faceEdges);
             }

             return MemoryManager<SpatialDomains::PyrGeom>::
                 AllocateSharedPtr(0, faces);
         }

         /**
          * \brief Builds the reference tetrahedral geometry used to construct
          * a low energy basis.
          *
          * The geometry is assembled bottom-up: four vertices, the six edges
          * joining them, four triangular faces and finally the tetrahedron
          * itself, which is given id 0.
          *
          * \return Shared pointer to the newly allocated tetrahedral geometry.
          */
         SpatialDomains::TetGeomSharedPtr PreconditionerLowEnergy::CreateRefTetGeom()
         {
             // Coordinate dimension handed to every vertex and edge.
             const int coordDim = 3;

             /////////////////////////////////
             // Set up Tetrahedron vertices //
             /////////////////////////////////

             const int nVerts = 4;
             const double coords[][3] = {
                 {-1,-1/sqrt(double(3)),-1/sqrt(double(6))},
                 {1,-1/sqrt(double(3)),-1/sqrt(double(6))},
                 {0,2/sqrt(double(3)),-1/sqrt(double(6))},
                 {0,0,3/sqrt(double(6))}};

             SpatialDomains::PointGeomSharedPtr verts[nVerts];
             for(int v = 0; v < nVerts; ++v)
             {
                 verts[v] = MemoryManager<SpatialDomains::PointGeom>::
                     AllocateSharedPtr(coordDim, v, coords[v][0],
                                       coords[v][1], coords[v][2]);
             }

             //////////////////////////////
             // Set up Tetrahedron Edges //
             //////////////////////////////

             const int nEdges = 6;
             // Pair of vertex ids bounding each edge
             const int edgeVerts[][2] = {
                 {0,1},{1,2},{0,2},{0,3},{1,3},{2,3}
             };

             SpatialDomains::SegGeomSharedPtr edges[nEdges];
             for(int e = 0; e < nEdges; ++e)
             {
                 SpatialDomains::PointGeomSharedPtr endPoints[2] = {
                     verts[edgeVerts[e][0]], verts[edgeVerts[e][1]]
                 };
                 edges[e] = MemoryManager<SpatialDomains::SegGeom>::
                     AllocateSharedPtr(e, coordDim, endPoints);
             }

             //////////////////////////////
             // Set up Tetrahedron faces //
             //////////////////////////////

             const int nFaces = 4;
             // Triple of edge ids bounding each triangular face
             const int faceEdgeIds[][3] = {
                 {0,1,2}, {0,4,3}, {1,5,4}, {2,5,3}
             };

             SpatialDomains::TriGeomSharedPtr faces[nFaces];
             for(int f = 0; f < nFaces; ++f)
             {
                 const int *conn = faceEdgeIds[f];
                 SpatialDomains::SegGeomSharedPtr faceEdges[3] = {
                     edges[conn[0]], edges[conn[1]], edges[conn[2]]
                 };
                 faces[f] = MemoryManager<SpatialDomains::TriGeom>::
                     AllocateSharedPtr(f, faceEdges);
             }

             return MemoryManager<SpatialDomains::TetGeom>::
                 AllocateSharedPtr(0, faces);
         }

         /**
          * \brief Builds the reference hexahedral geometry used to construct
          * a low energy basis.
          *
          * The geometry is assembled bottom-up: the eight corners of the unit
          * cube, the twelve edges joining them, six quadrilateral faces and
          * finally the hexahedron itself, which is given id 0.
          *
          * \return Shared pointer to the newly allocated hexahedral geometry.
          */
         SpatialDomains::HexGeomSharedPtr PreconditionerLowEnergy::CreateRefHexGeom()
         {
             // Coordinate dimension handed to every vertex and edge.
             const int coordDim = 3;

             ////////////////////////////////
             // Set up Hexahedron vertices //
             ////////////////////////////////

             const int nVerts = 8;
             const double coords[][3] = {
                 {0,0,0}, {1,0,0}, {1,1,0}, {0,1,0},
                 {0,0,1}, {1,0,1}, {1,1,1}, {0,1,1}
             };

             SpatialDomains::PointGeomSharedPtr verts[nVerts];
             for(int v = 0; v < nVerts; ++v)
             {
                 verts[v] = MemoryManager<SpatialDomains::PointGeom>::
                     AllocateSharedPtr(coordDim, v, coords[v][0],
                                       coords[v][1], coords[v][2]);
             }

             /////////////////////////////
             // Set up Hexahedron Edges //
             /////////////////////////////

             const int nEdges = 12;
             // Pair of vertex ids bounding each edge
             const int edgeVerts[][2] = {
                 {0,1}, {1,2}, {2,3}, {0,3}, {0,4}, {1,5},
                 {2,6}, {3,7}, {4,5}, {5,6}, {6,7}, {4,7}
             };

             SpatialDomains::SegGeomSharedPtr edges[nEdges];
             for(int e = 0; e < nEdges; ++e)
             {
                 SpatialDomains::PointGeomSharedPtr endPoints[2] = {
                     verts[edgeVerts[e][0]], verts[edgeVerts[e][1]]
                 };
                 edges[e] = MemoryManager<SpatialDomains::SegGeom>::
                     AllocateSharedPtr(e, coordDim, endPoints);
             }

             /////////////////////////////
             // Set up Hexahedron faces //
             /////////////////////////////

             const int nFaces = 6;
             // Quadruple of edge ids bounding each quadrilateral face
             const int faceEdgeIds[][4] = {
                 {0,1,2,3}, {0,5,8,4}, {1,6,9,5},
                 {2,7,10,6}, {3,7,11,4}, {8,9,10,11}
             };

             SpatialDomains::QuadGeomSharedPtr faces[nFaces];
             for(int f = 0; f < nFaces; ++f)
             {
                 const int *conn = faceEdgeIds[f];
                 SpatialDomains::SegGeomSharedPtr faceEdges[4] = {
                     edges[conn[0]], edges[conn[1]],
                     edges[conn[2]], edges[conn[3]]
                 };
                 faces[f] = MemoryManager<SpatialDomains::QuadGeom>::
                     AllocateSharedPtr(f, faceEdges);
             }

             return MemoryManager<SpatialDomains::HexGeom>::
                 AllocateSharedPtr(0, faces);
         }


         /**
      * \brief Loop expansion and determine different variants of the
      * transformation matrix
      *
          * Sets up multiple reference elements based on the element expansion.
      */
         void PreconditionerLowEnergy::SetUpReferenceElements(
                  std::map<ShapeType, DNekScalMatSharedPtr> &maxRmat,
                  map<ShapeType, LocalRegions::ExpansionSharedPtr > &maxElmt,
                  map<ShapeType, Array<OneD, unsigned int> >        &vertMapMaxR,
                  map<ShapeType, Array<OneD, Array<OneD, unsigned int> > > &edgeMapMaxR)
         {

             std::shared_ptr<MultiRegions::ExpList>
                 expList=((m_linsys.lock())->GetLocMat()).lock();
             GlobalLinSysKey linSysKey=(m_linsys.lock())->GetKey();

             LocalRegions::ExpansionSharedPtr locExp;

             // face maps for pyramid and hybrid meshes - not need to return.
             map<ShapeType, Array<OneD, Array<OneD, unsigned int> > > faceMapMaxR;

             /* Determine the maximum expansion order for all elements */
             int nummodesmax = 0;
             Array<OneD, int> Shapes(LibUtilities::SIZE_ShapeType,0);

             for(int n = 0; n < expList->GetNumElmts(); ++n)
             {
                 locExp = expList->GetExp(n);

                 nummodesmax = max(nummodesmax, locExp->GetBasisNumModes(0));
                 nummodesmax = max(nummodesmax, locExp->GetBasisNumModes(1));
                 nummodesmax = max(nummodesmax, locExp->GetBasisNumModes(2));

                 Shapes[locExp->DetShapeType()] = 1;
             }


             m_comm->AllReduce(nummodesmax, ReduceMax);
             m_comm->AllReduce(Shapes, ReduceMax);

             if(Shapes[ePyramid]) // if Pyramids used then need Tet and Hex expansion
         {
                 Shapes[eTetrahedron] = 1;
                 Shapes[eHexahedron]  = 1;
             }

             StdRegions::MatrixType PreconR;
             if(linSysKey.GetMatrixType() == StdRegions::eMass)
             {
                 PreconR  = StdRegions::ePreconRMass;
             }
             else
             {
                 PreconR  = StdRegions::ePreconR;
             }

             Array<OneD, unsigned int>  vmap;
             Array<OneD, Array<OneD, unsigned int> > emap;
             Array<OneD, Array<OneD, unsigned int> > fmap;

             /*
              * Set up a transformation matrices for equal max order
              * polynomial meshes
              */

             if(Shapes[eHexahedron])
             {
                 SpatialDomains::HexGeomSharedPtr   hexgeom   = CreateRefHexGeom();
                 //Bases for Hex element
                 const BasisKey HexBa(eModified_A, nummodesmax,
                                  PointsKey(nummodesmax+1, eGaussLobattoLegendre));
                 const BasisKey HexBb(eModified_A, nummodesmax,
                                  PointsKey(nummodesmax+1,  eGaussLobattoLegendre));
                 const BasisKey HexBc(eModified_A, nummodesmax,
                                PointsKey(nummodesmax+1,  eGaussLobattoLegendre));

                 //Create reference Hexahdedral expansion
                 LocalRegions::HexExpSharedPtr HexExp;

                 HexExp = MemoryManager<LocalRegions::HexExp>
                     ::AllocateSharedPtr(HexBa,HexBb,HexBc,
                                         hexgeom);

                 maxElmt[eHexahedron] = HexExp;

                 // Hex:
                 HexExp->GetInverseBoundaryMaps(vmap,emap,fmap);
                 vertMapMaxR[eHexahedron] = vmap;
                 edgeMapMaxR[eHexahedron] = emap;
                 faceMapMaxR[eHexahedron] = fmap;

                 //Get hexahedral transformation matrix
                 LocalRegions::MatrixKey HexR
                     (PreconR, eHexahedron,
                      *HexExp, linSysKey.GetConstFactors());
                 maxRmat[eHexahedron] = HexExp->GetLocMatrix(HexR);
             }

             if(Shapes[eTetrahedron])
             {
                 SpatialDomains::TetGeomSharedPtr   tetgeom   = CreateRefTetGeom();
                 //Bases for Tetrahedral element
                 const BasisKey TetBa(eModified_A, nummodesmax,
                                      PointsKey(nummodesmax+1, eGaussLobattoLegendre));
                 const BasisKey TetBb(eModified_B, nummodesmax,
                                      PointsKey(nummodesmax,  eGaussRadauMAlpha1Beta0));
                 const BasisKey TetBc(eModified_C, nummodesmax,
                                      PointsKey(nummodesmax,  eGaussRadauMAlpha2Beta0));

                 //Create reference tetrahedral expansion
                 LocalRegions::TetExpSharedPtr TetExp;

                 TetExp = MemoryManager<LocalRegions::TetExp>
                     ::AllocateSharedPtr(TetBa,TetBb,TetBc,tetgeom);

                 maxElmt[eTetrahedron] = TetExp;

                 TetExp->GetInverseBoundaryMaps(vmap,emap,fmap);
                 vertMapMaxR[eTetrahedron] = vmap;
                 edgeMapMaxR[eTetrahedron] = emap;
                 faceMapMaxR[eTetrahedron] = fmap;

                 //Get tetrahedral transformation matrix
                 LocalRegions::MatrixKey TetR
                     (PreconR, eTetrahedron,
                      *TetExp, linSysKey.GetConstFactors());
                 maxRmat[eTetrahedron] = TetExp->GetLocMatrix(TetR);

                 if((Shapes[ePyramid])||(Shapes[eHexahedron]))
                 {
                     ReSetTetMaxRMat(nummodesmax, TetExp, maxRmat,
                                     vertMapMaxR, edgeMapMaxR, faceMapMaxR);
                 }
             }

             if(Shapes[ePyramid])
             {
                 SpatialDomains::PyrGeomSharedPtr   pyrgeom   = CreateRefPyrGeom();

                 //Bases for Pyramid element
                 const BasisKey PyrBa(eModified_A, nummodesmax,
                                      PointsKey(nummodesmax+1, eGaussLobattoLegendre));
                 const BasisKey PyrBb(eModified_A, nummodesmax,
                                      PointsKey(nummodesmax+1, eGaussLobattoLegendre));
                 const BasisKey PyrBc(eModifiedPyr_C, nummodesmax,
                                      PointsKey(nummodesmax,  eGaussRadauMAlpha2Beta0));

                 //Create reference pyramid expansion
                 LocalRegions::PyrExpSharedPtr PyrExp;

                 PyrExp = MemoryManager<LocalRegions::PyrExp>
                     ::AllocateSharedPtr(PyrBa,PyrBb,PyrBc,pyrgeom);

                 maxElmt[ePyramid] = PyrExp;

                 // Pyramid:
                 PyrExp->GetInverseBoundaryMaps(vmap,emap,fmap);
                 vertMapMaxR[ePyramid] = vmap;
                 edgeMapMaxR[ePyramid] = emap;
                 faceMapMaxR[ePyramid] = fmap;

                 // Set up Pyramid Transformation Matrix based on Tet
                 // and Hex expansion
                 SetUpPyrMaxRMat(nummodesmax,PyrExp,maxRmat,vertMapMaxR,
                                 edgeMapMaxR,faceMapMaxR);
             }

             if(Shapes[ePrism])
             {
                 SpatialDomains::PrismGeomSharedPtr prismgeom = CreateRefPrismGeom();
                 //Bases for Prism element
                 const BasisKey PrismBa(eModified_A, nummodesmax,
                                   PointsKey(nummodesmax+1, eGaussLobattoLegendre));
                 const BasisKey PrismBb(eModified_A, nummodesmax,
                                   PointsKey(nummodesmax+1, eGaussLobattoLegendre));
                 const BasisKey PrismBc(eModified_B, nummodesmax,
                                   PointsKey(nummodesmax,   eGaussRadauMAlpha1Beta0));

                 //Create reference prismatic expansion
                 LocalRegions::PrismExpSharedPtr PrismExp;

                 PrismExp = MemoryManager<LocalRegions::PrismExp>
                     ::AllocateSharedPtr(PrismBa,PrismBb,PrismBc,prismgeom);
                 maxElmt[ePrism] = PrismExp;

                 // Prism:
                 PrismExp->GetInverseBoundaryMaps(vmap,emap,fmap);
                 vertMapMaxR[ePrism] = vmap;
                 edgeMapMaxR[ePrism] = emap;

                 faceMapMaxR[ePrism] = fmap;

                 if((Shapes[ePyramid])||(Shapes[eHexahedron]))
                 {
             ReSetPrismMaxRMat(nummodesmax, PrismExp, maxRmat,
                                       vertMapMaxR, edgeMapMaxR,
                                       faceMapMaxR, false);
                 }
                 else
                 {

                     //Get prismatic transformation matrix
                     LocalRegions::MatrixKey PrismR
                         (PreconR, ePrism,
                          *PrismExp, linSysKey.GetConstFactors());
                     maxRmat[ePrism] =
                         PrismExp->GetLocMatrix(PrismR);

                     if(Shapes[eTetrahedron]) // reset triangular faces from Tet
                     {
                         ReSetPrismMaxRMat(nummodesmax, PrismExp, maxRmat,
                                           vertMapMaxR, edgeMapMaxR,
                                           faceMapMaxR, true);
                     }
                 }
             }
         }

         void PreconditionerLowEnergy::SetUpPyrMaxRMat(int nummodesmax,
                              LocalRegions::PyrExpSharedPtr &PyrExp,
                              std::map<ShapeType, DNekScalMatSharedPtr> &maxRmat,
                              std::map<ShapeType, Array<OneD, unsigned int> >        &vertMapMaxR,
                              std::map<ShapeType, Array<OneD, Array<OneD, unsigned int> > > &edgeMapMaxR,
                              std::map<ShapeType, Array<OneD, Array<OneD, unsigned int> > > &faceMapMaxR)
         {
             int nRows = PyrExp->NumBndryCoeffs();
             NekDouble val;
             NekDouble zero = 0.0;
             DNekMatSharedPtr newmat = MemoryManager<DNekMat>::
                 AllocateSharedPtr(nRows,nRows,zero,eFULL);

             // set diagonal to 1
             for(int i = 0; i < nRows; ++i)
             {
                 newmat->SetValue(i,i,1.0);
             }

             // The following lists specify the number of adjacent
             // edges to each vertex (nadj) then the Hex vert to
             // use for each pyramid ver in the vert-edge map (VEVert)
             // followed by the hex edge to use for each pyramid edge
             // in the vert-edge map (VEEdge)
             const int nadjedge[]     = {3,3,3,3,4};
             const int VEHexVert[][4] = {{0,0,0,-1},{1,1,1,-1},{2,2,2,-1},{3,3,3,-1},{4,5,6,7}};
             const int VEHexEdge[][4] = {{0,3,4,-1},{0,1,5,-1},{1,2,6,-1},{2,3,7,-1},{4,5,6,7}};
             const int VEPyrEdge[][4] = {{0,3,4,-1},{0,1,5,-1},{1,2,6,-1},{2,3,7,-1},{4,5,6,7}};

             // fill vertex to edge coupling
             for(int v = 0; v < 5; ++v)
             {
                 for(int e = 0; e < nadjedge[v]; ++e)
                 {
                     for(int i = 0; i < nummodesmax-2; ++i)
                     {
                         // Note this is using wrong shape but gives
                         // answer that seems to have correct error!
                         val = (*maxRmat[eHexahedron])(
                                     vertMapMaxR[eHexahedron][VEHexVert[v][e]],
                                     edgeMapMaxR[eHexahedron][VEHexEdge[v][e]][i]);
                         newmat->SetValue(vertMapMaxR[ePyramid][v],
                                          edgeMapMaxR[ePyramid][VEPyrEdge[v][e]][i],val);
                     }
                 }
             }

             int nfacemodes;
             nfacemodes = (nummodesmax-2)*(nummodesmax-2);
             // First four verties are all adjacent to base face
             for(int v = 0; v < 4; ++v)
             {
                 for(int i = 0; i < nfacemodes; ++i)
                 {
                     val = (*maxRmat[eHexahedron])(vertMapMaxR[eHexahedron][v],
                                                   faceMapMaxR[eHexahedron][0][i]);
                     newmat->SetValue(vertMapMaxR[ePyramid][v],
                                      faceMapMaxR[ePyramid][0][i],val);
                 }
             }


             const int nadjface[]     = {2,2,2,2,4};
             const int VFTetVert[][4] = {{0,0,-1,-1},{1,1,-1,-1},{2,2,-1,-1},{0,2,-1,-1},{3,3,3,3}};
             const int VFTetFace[][4] = {{1,3,-1,-1},{1,2,-1,-1},{2,3,-1,-1},{1,3,-1,-1},{1,2,1,2}};
             const int VFPyrFace[][4] = {{1,4,-1,-1},{1,2,-1,-1},{2,3,-1,-1},{3,4,-1,-1},{1,2,3,4}};

             // next handle all triangular faces from tetrahedron
             nfacemodes = (nummodesmax-3)*(nummodesmax-2)/2;
             for(int v = 0; v < 5; ++v)
             {
                 for(int f = 0; f < nadjface[v]; ++f)
                 {
                     for(int i = 0; i < nfacemodes; ++i)
                     {
                         val = (*maxRmat[eTetrahedron])(vertMapMaxR[eTetrahedron][VFTetVert[v][f]],
                                                        faceMapMaxR[eTetrahedron][VFTetFace[v][f]][i]);
                         newmat->SetValue(vertMapMaxR[ePyramid][v],
                                          faceMapMaxR[ePyramid][VFPyrFace[v][f]][i],val);
                     }

                 }
             }

             // Edge to face coupling
             // all base edges are coupled to face 0
             nfacemodes = (nummodesmax-2)*(nummodesmax-2);
             for(int e = 0; e < 4; ++e)
             {
                 for(int i = 0; i < nummodesmax-2; ++i)
                 {
                     for(int j = 0; j < nfacemodes; ++j)
                     {
                         int edgemapid = edgeMapMaxR[eHexahedron][e][i];
                         int facemapid = faceMapMaxR[eHexahedron][0][j];

                         val = (*maxRmat[eHexahedron])(edgemapid,facemapid);
                         newmat->SetValue(edgeMapMaxR[ePyramid][e][i],
                                          faceMapMaxR[ePyramid][0][j],val);
                     }

                 }
             }

             const int nadjface1[]    = {1,1,1,1,2,2,2,2};
             const int EFTetEdge[][2] = {{0,-1},{1,-1},{0,-1},{2,-1},{3,3},{4,4},{5,5},{3,5}};
             const int EFTetFace[][2] = {{1,-1},{2,-1},{1,-1},{3,-1},{1,3},{1,2},{2,3},{1,3}};
             const int EFPyrFace[][2] = {{1,-1},{2,-1},{3,-1},{4,-1},{1,4},{1,2},{2,3},{3,4}};

             // next handle all triangular faces from tetrahedron
             nfacemodes = (nummodesmax-3)*(nummodesmax-2)/2;
             for(int e = 0; e < 8; ++e)
             {
                 for(int f = 0; f < nadjface1[e]; ++f)
                 {
                     for(int i = 0; i < nummodesmax-2; ++i)
                     {
                         for(int j = 0; j < nfacemodes; ++j)
                         {
                             int edgemapid = edgeMapMaxR[eTetrahedron][EFTetEdge[e][f]][i];
                             int facemapid = faceMapMaxR[eTetrahedron][EFTetFace[e][f]][j];

                             val = (*maxRmat[eTetrahedron])(edgemapid,facemapid);
                             newmat->SetValue(edgeMapMaxR[ePyramid][e][i],
                                              faceMapMaxR[ePyramid][EFPyrFace[e][f]][j],val);
                         }
                     }
                 }
             }

             DNekScalMatSharedPtr PyrR;
             PyrR = MemoryManager<DNekScalMat>::AllocateSharedPtr(1.0, newmat);
             maxRmat[ePyramid] =PyrR;
         }


         void PreconditionerLowEnergy::ReSetTetMaxRMat(int nummodesmax,
                              LocalRegions::TetExpSharedPtr &TetExp,
                              std::map<ShapeType, DNekScalMatSharedPtr> &maxRmat,
                              std::map<ShapeType, Array<OneD, unsigned int> >        &vertMapMaxR,
                              std::map<ShapeType, Array<OneD, Array<OneD, unsigned int> > > &edgeMapMaxR,
                              std::map<ShapeType, Array<OneD, Array<OneD, unsigned int> > > &faceMapMaxR)
         {
             boost::ignore_unused(faceMapMaxR);

             int nRows = TetExp->NumBndryCoeffs();
             NekDouble val;
             NekDouble zero = 0.0;
             DNekMatSharedPtr newmat = MemoryManager<DNekMat>::
                 AllocateSharedPtr(nRows,nRows,zero,eFULL);

             // copy existing system
             for(int i = 0; i < nRows; ++i)
             {
                 for(int j = 0; j < nRows; ++j)
                 {
                     val = (*maxRmat[eTetrahedron])(i,j);
                     newmat->SetValue(i,j,val);
                 }
             }

             // The following lists specify the number of adjacent
             // edges to each vertex (nadj) then the Hex vert to
             // use for each pyramid ver in the vert-edge map (VEVert)
             // followed by the hex edge to use for each Tet edge
             // in the vert-edge map (VEEdge)
             const int VEHexVert[][4] = {{0,0,0},{1,1,1},{2,2,2},{4,5,6}};
             const int VEHexEdge[][4] = {{0,3,4},{0,1,5},{1,2,6},{4,5,6}};
             const int VETetEdge[][4] = {{0,2,3},{0,1,4},{1,2,5},{3,4,5}};

             // fill vertex to edge coupling
             for(int v = 0; v < 4; ++v)
             {
                 for(int e = 0; e < 3; ++e)
                 {
                     for(int i = 0; i < nummodesmax-2; ++i)
                     {
                         // Note this is using wrong shape but gives
                         // answer that seems to have correct error!
                         val = (*maxRmat[eHexahedron])(
                                     vertMapMaxR[eHexahedron][VEHexVert[v][e]],
                                     edgeMapMaxR[eHexahedron][VEHexEdge[v][e]][i]);
                         newmat->SetValue(vertMapMaxR[eTetrahedron][v],
                                     edgeMapMaxR[eTetrahedron][VETetEdge[v][e]][i],
                                                         val);
                     }
                 }
             }

             DNekScalMatSharedPtr TetR =
                 MemoryManager<DNekScalMat>::AllocateSharedPtr(1.0, newmat);

             maxRmat[eTetrahedron] = TetR;
         }

         void PreconditionerLowEnergy::ReSetPrismMaxRMat(int nummodesmax,
                              LocalRegions::PrismExpSharedPtr &PrismExp,
                              std::map<ShapeType, DNekScalMatSharedPtr> &maxRmat,
                              std::map<ShapeType, Array<OneD, unsigned int> >        &vertMapMaxR,
                              std::map<ShapeType, Array<OneD, Array<OneD, unsigned int> > > &edgeMapMaxR,
                              std::map<ShapeType, Array<OneD, Array<OneD, unsigned int> > > &faceMapMaxR,
                              bool UseTetOnly)
         {
             int nRows = PrismExp->NumBndryCoeffs();
             NekDouble val;
             NekDouble zero = 0.0;
             DNekMatSharedPtr newmat = MemoryManager<DNekMat>::
                 AllocateSharedPtr(nRows,nRows,zero,eFULL);


             int nfacemodes;

             if(UseTetOnly)
             {
                 // copy existing system
                 for(int i = 0; i < nRows; ++i)
                 {
                     for(int j = 0; j < nRows; ++j)
                     {
                         val = (*maxRmat[ePrism])(i,j);
                         newmat->SetValue(i,j,val);
                     }
                 }

                 // Reset vertex to edge mapping from tet.
                 const int VETetVert[][2]   = {{0,0},{1,1},{1,1},{0,0},{3,3},{3,3}};
                 const int VETetEdge[][2]   = {{0,3},{0,4},{0,4},{0,3},{3,4},{4,3}};
                 const int VEPrismEdge[][2] = {{0,4},{0,5},{2,6},{2,7},{4,5},{6,7}};

                 // fill vertex to edge coupling
                 for(int v = 0; v < 6; ++v)
                 {
                     for(int e = 0; e < 2; ++e)
                     {
                         for(int i = 0; i < nummodesmax-2; ++i)
                         {
                             // Note this is using wrong shape but gives
                             // answer that seems to have correct error!
                             val = (*maxRmat[eTetrahedron])(
                                    vertMapMaxR[eTetrahedron][VETetVert[v][e]],
                                    edgeMapMaxR[eTetrahedron][VETetEdge[v][e]][i]);
                             newmat->
                                 SetValue(vertMapMaxR[ePrism][v],
                                          edgeMapMaxR[ePrism][VEPrismEdge[v][e]][i],
                                          val);
                         }
                     }
                 }
             }
             else
             {

                 // set diagonal to 1
                 for(int i = 0; i < nRows; ++i)
                 {
                     newmat->SetValue(i,i,1.0);
                 }


                 // Set vertex to edge mapping from Hex.

                 // The following lists specify the number of adjacent
                 // edges to each vertex (nadj) then the Hex vert to
                 // use for each prism ver in the vert-edge map (VEVert)
                 // followed by the hex edge to use for each prism edge
                 // in the vert-edge map (VEEdge)
                 const int VEHexVert[][3]   = {{0,0,0},{1,1,1},{2,2,2},{3,3,3},
                                               {4,5,5},{6,7,7}};
                 const int VEHexEdge[][3]   = {{0,3,4},{0,1,5},{1,2,6},{2,3,7},
                                               {4,5,9},{6,7,11}};
                 const int VEPrismEdge[][3] = {{0,3,4},{0,1,5},{1,2,6},{2,3,7},
                                               {4,5,8},{6,7,8}};

                 // fill vertex to edge coupling
                 for(int v = 0; v < 6; ++v)
                 {
                     for(int e = 0; e < 3; ++e)
                     {
                         for(int i = 0; i < nummodesmax-2; ++i)
                         {
                             // Note this is using wrong shape but gives
                             // answer that seems to have correct error!
                             val = (*maxRmat[eHexahedron])(
                                     vertMapMaxR[eHexahedron][VEHexVert[v][e]],
                                     edgeMapMaxR[eHexahedron][VEHexEdge[v][e]][i]);
                             newmat->SetValue(vertMapMaxR[ePrism][v],
                                              edgeMapMaxR[ePrism][VEPrismEdge[v][e]][i],
                                              val);
                         }
                     }
                 }


                 // Setup vertex to face mapping from Hex
                 const int VFHexVert[][2]   = {{0,0},{1,1},{4,5},{2,2},{3,3},{6,7}};
                 const int VFHexFace[][2]   = {{0,4},{0,2},{4,2},{0,2},{0,4},{2,4}};

                 const int VQFPrismVert[][2] = {{0,0},{1,1},{4,4},{2,2},{3,3},{5,5}};
                 const int VQFPrismFace[][2] = {{0,4},{0,2},{4,2},{0,2},{0,4},{2,4}};

                 nfacemodes = (nummodesmax-2)*(nummodesmax-2);
                 // Replace two Quad faces  on every vertex
                 for(int v = 0; v < 6; ++v)
                 {
                     for(int f = 0; f < 2; ++f)
                     {
                         for(int i = 0; i < nfacemodes; ++i)
                         {
                             val = (*maxRmat[eHexahedron])(
                                              vertMapMaxR[eHexahedron][VFHexVert[v][f]],
                                              faceMapMaxR[eHexahedron][VFHexFace[v][f]][i]);
                             newmat->SetValue(vertMapMaxR[ePrism][VQFPrismVert[v][f]],
                                              faceMapMaxR[ePrism][VQFPrismFace[v][f]][i],val);
                         }
                     }
                 }

                 // Mapping of Hex Edge-Face mappings to Prism Edge-Face Mappings
                 const int nadjface[] = {1,2,1,2,1,1,1,1,2};
                 const int EFHexEdge[][2]    = {{0,-1},{1,1},{2,-1},{3,3},{4,-1},{5,-1},{6,-1},{7,-1},{9,11}};
                 const int EFHexFace[][2]    = {{0,-1},{0,2},{0,-1},{0,4},{4,-1},{2,-1},{2,-1},{4,-1},{2,4}};
                 const int EQFPrismEdge[][2] = {{0,-1},{1,1},{2,-1},{3,3},{4,-1},{5,-1},{6,-1},{7,-1},{8,8}};
                 const int EQFPrismFace[][2] = {{0,-1},{0,2},{0,-1},{0,4},{4,-1},{2,-1},{2,-1},{4,-1},{2,4}};

                 // all base edges are coupled to face 0
                 nfacemodes = (nummodesmax-2)*(nummodesmax-2);
                 for(int e = 0; e < 9; ++e)
                 {
                     for(int f = 0; f < nadjface[e]; ++f)
                     {
                         for(int i = 0; i < nummodesmax-2; ++i)
                         {
                             for(int j = 0; j < nfacemodes; ++j)
                             {
                                 int edgemapid = edgeMapMaxR[eHexahedron][EFHexEdge[e][f]][i];
                                 int facemapid = faceMapMaxR[eHexahedron][EFHexFace[e][f]][j];

                                 val = (*maxRmat[eHexahedron])(edgemapid,facemapid);

                                 int edgemapid1 = edgeMapMaxR[ePrism][EQFPrismEdge[e][f]][i];
                                 int facemapid1 = faceMapMaxR[ePrism][EQFPrismFace[e][f]][j];
                                 newmat->SetValue(edgemapid1, facemapid1, val);
                             }
                         }
                     }
                 }
             }

             const int VFTetVert[]    = {0,1,3,1,0,3};
             const int VFTetFace[]    = {1,1,1,1,1,1};
             const int VTFPrismVert[] = {0,1,4,2,3,5};
             const int VTFPrismFace[] = {1,1,1,3,3,3};

             //  Handle all triangular faces from tetrahedron
             nfacemodes = (nummodesmax-3)*(nummodesmax-2)/2;
             for(int v = 0; v < 6; ++v)
             {
                 for(int i = 0; i < nfacemodes; ++i)
                 {
                     val = (*maxRmat[eTetrahedron])
                         (vertMapMaxR[eTetrahedron][VFTetVert[v]],
                          faceMapMaxR[eTetrahedron][VFTetFace[v]][i]);

                     newmat->SetValue(vertMapMaxR[ePrism][VTFPrismVert[v]],
                                      faceMapMaxR[ePrism][VTFPrismFace[v]][i],val);
                 }
             }

             // Mapping of Tet Edge-Face mappings to Prism Edge-Face Mappings
             const int EFTetEdge[]    = {0,3,4,0,4,3};
             const int EFTetFace[]    = {1,1,1,1,1,1};
             const int ETFPrismEdge[] = {0,4,5,2,6,7};
             const int ETFPrismFace[] = {1,1,1,3,3,3};

             // handle all edge to triangular faces from tetrahedron
             // (only 6 this time)
             nfacemodes = (nummodesmax-3)*(nummodesmax-2)/2;
             for(int e = 0; e < 6; ++e)
             {
                 for(int i = 0; i < nummodesmax-2; ++i)
                 {
                     for(int j = 0; j < nfacemodes; ++j)
                     {
                         int edgemapid = edgeMapMaxR[eTetrahedron][EFTetEdge[e]][i];
                         int facemapid = faceMapMaxR[eTetrahedron][EFTetFace[e]][j];
                         val = (*maxRmat[eTetrahedron])(edgemapid,facemapid);

                         newmat->SetValue(edgeMapMaxR[ePrism][ETFPrismEdge[e]][i],
                                          faceMapMaxR[ePrism][ETFPrismFace[e]][j],val);
                     }
                 }
             }


             DNekScalMatSharedPtr PrismR
                 = MemoryManager<DNekScalMat>::AllocateSharedPtr(1.0, newmat);
             maxRmat[ePrism] = PrismR;
         }

         /**
          * \brief Assemble the boundary transformation matrix of a local
          * expansion from entries of a reference matrix.
          *
          * A square full-storage matrix of size locExp->NumBndryCoeffs() is
          * created with zero entries and a unit diagonal. Vertex-edge,
          * vertex-face and edge-face couplings are then copied entry by entry
          * out of \a maxRmat. Source positions come from \a vmap, \a emap and
          * the face inverse boundary map queried from \a maxExp; destination
          * positions come from the inverse boundary maps of \a locExp.
          * Entries that are not addressed by those maps keep their initial
          * value.
          *
          * \param locExp   Expansion the returned matrix is sized for.
          * \param maxRmat  Reference matrix the couplings are read from.
          * \param maxExp   Expansion used to obtain the face map into
          *                 \a maxRmat.
          * \param vmap     Vertex indices into \a maxRmat.
          * \param emap     Per-edge interior indices into \a maxRmat.
          *
          * \return Newly allocated matrix holding the extracted couplings.
          */
         DNekMatSharedPtr PreconditionerLowEnergy::
         ExtractLocMat(StdRegions::StdExpansionSharedPtr &locExp,
                       DNekScalMatSharedPtr              &maxRmat,
                       LocalRegions::ExpansionSharedPtr  &maxExp,
                       Array<OneD, unsigned int>         &vmap,
                       Array<OneD, Array<OneD, unsigned int> > &emap)
         {
             const int nBnd = locExp->NumBndryCoeffs();

             NekDouble initVal = 0.0;
             DNekMatSharedPtr locR = MemoryManager<DNekMat>::
                 AllocateSharedPtr(nBnd,nBnd,initVal,eFULL);

             // Destination index maps belonging to the local expansion
             Array<OneD, unsigned int>  vertDst;
             Array<OneD, Array<OneD, unsigned int> > edgeDst;
             Array<OneD, Array<OneD, unsigned int> > faceDst;
             locExp->GetInverseBoundaryMaps(vertDst,edgeDst,faceDst);

             // unit diagonal
             for(int d = 0; d < nBnd; ++d)
             {
                 locR->SetValue(d,d,1.0);
             }

             const int numVerts = locExp->GetNverts();
             const int numEdges = locExp->GetNedges();
             const int numFaces = locExp->GetNfaces();

             // Copies a single entry of the reference matrix into the
             // local matrix.
             auto copyEntry = [&](unsigned int srcRow, unsigned int srcCol,
                                  unsigned int dstRow, unsigned int dstCol)
             {
                 const NekDouble entry = (*maxRmat)(srcRow,srcCol);
                 locR->SetValue(dstRow,dstCol,entry);
             };

             // vertex -> edge coupling
             for(int edge = 0; edge < numEdges; ++edge)
             {
                 // edge modes excluding the two end vertices
                 const int nEdgeInt = locExp->GetEdgeNcoeffs(edge) - 2;

                 for(int vert = 0; vert < numVerts; ++vert)
                 {
                     for(int k = 0; k < nEdgeInt; ++k)
                     {
                         copyEntry(vmap[vert],    emap[edge][k],
                                   vertDst[vert], edgeDst[edge][k]);
                     }
                 }
             }

             for(int face = 0; face < numFaces; ++face)
             {
                 // Information required to locate this face inside the
                 // reference matrix
                 StdRegions::Orientation fwdDir =
                     StdRegions::eDir1FwdDir1_Dir2FwdDir2;
                 int order0 = 0, order1 = 0; // local face expansion orders

                 const int nFaceInt = locExp->GetFaceIntNcoeffs(face);

                 locExp->GetFaceNumModes(face,fwdDir,order0,order1);

                 Array<OneD, unsigned int> faceSrc = maxExp->
                     GetFaceInverseBoundaryMap(face,fwdDir,order0,order1);

                 // vertex -> face coupling
                 for(int vert = 0; vert < numVerts; ++vert)
                 {
                     for(int k = 0; k < nFaceInt; ++k)
                     {
                         copyEntry(vmap[vert],    faceSrc[k],
                                   vertDst[vert], faceDst[face][k]);
                     }
                 }

                 // edge -> face coupling
                 for(int edge = 0; edge < numEdges; ++edge)
                 {
                     const int nEdgeInt = locExp->GetEdgeNcoeffs(edge) - 2;

                     for(int p = 0; p < nEdgeInt; ++p)
                     {
                         for(int q = 0; q < nFaceInt; ++q)
                         {
                             copyEntry(emap[edge][p],    faceSrc[q],
                                       edgeDst[edge][p], faceDst[face][q]);
                         }
                     }
                 }
             }

             return locR;
         }
     }
 }

Nektar::LibUtilities::ShapeType
ShapeType
Definition: ShapeType.hpp:53

Nektar::MultiRegions::Preconditioner::m_comm
LibUtilities::CommSharedPtr m_comm
Definition: Preconditioner.h:137

Nektar::MultiRegions::PreconditionerLowEnergy::v_DoPreconditioner
virtual void v_DoPreconditioner(const Array< OneD, NekDouble > &pInput, Array< OneD, NekDouble > &pOutput)
Definition: PreconditionerLowEnergy.cpp:936

Nektar::MultiRegions::PreconditionerLowEnergy::m_sameBlock
std::vector< std::pair< int, int > > m_sameBlock
Definition: PreconditionerLowEnergy.h:91

Nektar::Array< OneD, NekDouble >

VDmathArray.hpp

ASSERTL0
#define ASSERTL0(condition, msg)
Definition: ErrorUtil.hpp:216

Nektar::MultiRegions::PreconditionerLowEnergy::v_TransformedSchurCompl
virtual DNekScalMatSharedPtr v_TransformedSchurCompl(int n, int offset, const std::shared_ptr< DNekScalMat > &loc_mat)
Set up the transformed block matrix system.
Definition: PreconditionerLowEnergy.cpp:1382

Nektar
Definition: CoupledSolver.h:1

Nektar::LibUtilities::eModified_C
Principal Modified Functions.
Definition: BasisType.h:50

Nektar::SpatialDomains::Geometry2DSharedPtr
std::shared_ptr< Geometry2D > Geometry2DSharedPtr
Definition: Geometry.h:65

Gs::Gather
static void Gather(Nektar::Array< OneD, NekDouble > pU, gs_op pOp, gs_data *pGsh, Nektar::Array< OneD, NekDouble > pBuffer=NullNekDouble1DArray)
Performs a gather-scatter operation of the provided values.
Definition: GsLib.hpp:245

Nektar::MultiRegions::PreconditionerLowEnergy::v_DoMultiplybyInverseTransposedTransformationMatrix
virtual void v_DoMultiplybyInverseTransposedTransformationMatrix(const Array< OneD, NekDouble > &pInput, Array< OneD, NekDouble > &pOutput)
Multiply by the block transposed inverse transformation matrix.
Definition: PreconditionerLowEnergy.cpp:1321

Vmath::Gathr
void Gathr(int n, const T *x, const int *y, T *z)
Gather vector z[i] = x[y[i]].
Definition: Vmath.cpp:647

sign
#define sign(a, b)
return the sign(b)*a
Definition: Polylib.cpp:16

Nektar::LibUtilities::eModifiedPyr_C
Principal Modified Functions.
Definition: BasisType.h:52

Nektar::DNekScalMatSharedPtr
std::shared_ptr< DNekScalMat > DNekScalMatSharedPtr
Definition: NekMatrixFwd.hpp:69

CG_Iterations.loc
loc
Definition: CG_Iterations.py:323

Nektar::SpatialDomains::TetGeomSharedPtr
std::shared_ptr< TetGeom > TetGeomSharedPtr
Definition: TetGeom.h:88

Nektar::MultiRegions::PreconditionerLowEnergy::m_multiplicity
Array< OneD, NekDouble > m_multiplicity
Definition: PreconditionerLowEnergy.h:84

Nektar::MultiRegions::PreconditionerLowEnergy::m_locToGloSignMult
Array< OneD, NekDouble > m_locToGloSignMult
Definition: PreconditionerLowEnergy.h:83

Nektar::MultiRegions::ePETScStaticCond
Definition: MultiRegions.hpp:89

Nektar::DNekScalBlkMatSharedPtr
std::shared_ptr< DNekScalBlkMat > DNekScalBlkMatSharedPtr
Definition: NekTypeDefs.hpp:73

Nektar::MultiRegions::Preconditioner::m_linsys
const std::weak_ptr< GlobalLinSys > m_linsys
Definition: Preconditioner.h:133

Nektar::StdRegions::ePreconR
Definition: StdRegions.hpp:138

GlobalLinSys.h

Nektar::MultiRegions::PreconditionerLowEnergy::ExtractLocMat
DNekMatSharedPtr ExtractLocMat(StdRegions::StdExpansionSharedPtr &locExp, DNekScalMatSharedPtr &maxRmat, LocalRegions::ExpansionSharedPtr &expMax, Array< OneD, unsigned int > &vertMapMaxR, Array< OneD, Array< OneD, unsigned int > > &edgeMapMaxR)
Definition: PreconditionerLowEnergy.cpp:2458

Nektar::SpatialDomains::QuadGeomSharedPtr
std::shared_ptr< QuadGeom > QuadGeomSharedPtr
Definition: HexGeom.h:46

Nektar::MultiRegions::PreconditionerLowEnergy::v_InitObject
virtual void v_InitObject()
Definition: PreconditionerLowEnergy.cpp:74

Nektar::LocalRegions::HexExpSharedPtr
std::shared_ptr< HexExp > HexExpSharedPtr
Definition: HexExp.h:56

Nektar::MultiRegions::PreconditionerLowEnergy::ReSetTetMaxRMat
void ReSetTetMaxRMat(int nummodesmax, LocalRegions::TetExpSharedPtr &TetExp, ShapeToDNekMap &maxRmat, ShapeToIntArrayMap &vertMapMaxR, ShapeToIntArrayArrayMap &edgeMapMaxR, ShapeToIntArrayArrayMap &faceMapMaxR)
Definition: PreconditionerLowEnergy.cpp:2194

Nektar::MultiRegions::GlobalMatrixKey::GetConstFactors
const StdRegions::ConstFactorMap & GetConstFactors() const
Returns all the constants.
Definition: GlobalMatrixKey.h:149

Nektar::SpatialDomains::eDirichlet
Definition: Conditions.h:53

Nektar::LibUtilities::eModified_A
Principal Modified Functions.
Definition: BasisType.h:48

Nektar::NekMatrix
Definition: NekMatrixFwd.hpp:56

Nektar::eWrapper
Definition: PointerWrapper.h:44

Nektar::MultiRegions::GetPreconFactory
PreconFactory & GetPreconFactory()
Definition: Preconditioner.cpp:89

std
STL namespace.

Nektar::LibUtilities::eHexahedron
Definition: ShapeType.hpp:63

Nektar::LocalRegions::TetExpSharedPtr
std::shared_ptr< TetExp > TetExpSharedPtr
Definition: TetExp.h:226

Vmath::Sdiv
void Sdiv(int n, const T alpha, const T *x, const int incx, T *y, const int incy)
Scalar multiply y = alpha/y.
Definition: Vmath.cpp:274

GlobalMatrixKey.h

Nektar::MultiRegions::PreconditionerLowEnergy::m_BlkMat
DNekBlkMatSharedPtr m_BlkMat
Definition: PreconditionerLowEnergy.h:78

Nektar::DNekMatSharedPtr
std::shared_ptr< DNekMat > DNekMatSharedPtr
Definition: NekTypeDefs.hpp:69

PreconditionerLowEnergy.h

Blas::Dgemm
static void Dgemm(const char &transa, const char &transb, const int &m, const int &n, const int &k, const double &alpha, const double *a, const int &lda, const double *b, const int &ldb, const double &beta, double *c, const int &ldc)
BLAS level 3: Matrix-matrix multiply C = A x B where A[m x k], B[k x n], C[m x n].
Definition: Blas.hpp:213

Nektar::NekVector< NekDouble >

Nektar::LibUtilities::SIZE_ShapeType
Definition: ShapeType.hpp:64

Nektar::LibUtilities::eGaussRadauMAlpha1Beta0
Gauss Radau pinned at x=-1, $\alpha = 1, \beta = 0$.
Definition: PointsType.h:58

Nektar::MultiRegions::PreconditionerLowEnergy::CreateRefHexGeom
SpatialDomains::HexGeomSharedPtr CreateRefHexGeom(void)
Sets up the reference hexahedral element needed to construct a low energy basis.
Definition: PreconditionerLowEnergy.cpp:1767

Nektar::MultiRegions::AssemblyMapSharedPtr
std::shared_ptr< AssemblyMap > AssemblyMapSharedPtr
Definition: AssemblyMap.h:52

Gs::Init
static gs_data * Init(const Nektar::Array< OneD, long > pId, const LibUtilities::CommSharedPtr &pComm, bool verbose=true)
Initialise Gather-Scatter map.
Definition: GsLib.hpp:167

Nektar::LocalRegions::MatrixKey
Definition: MatrixKey.h:47

Nektar::MultiRegions::Preconditioner
Definition: Preconditioner.h:64

Nektar::StdRegions::StdExpansionSharedPtr
std::shared_ptr< StdExpansion > StdExpansionSharedPtr
Definition: StdExpansion.h:1926

Nektar::MatrixStorage
MatrixStorage
Definition: MatrixStorageType.h:41

Nektar::SpatialDomains::TriGeomSharedPtr
std::shared_ptr< TriGeom > TriGeomSharedPtr
Definition: TriGeom.h:58

Nektar::MultiRegions::PreconditionerLowEnergy::v_BuildPreconditioner
virtual void v_BuildPreconditioner()
Construct the low energy preconditioner from .
Definition: PreconditionerLowEnergy.cpp:121

Nektar::MultiRegions::GlobalMatrixKey::GetMatrixType
StdRegions::MatrixType GetMatrixType() const
Return the matrix type.
Definition: GlobalMatrixKey.h:115

Nektar::MultiRegions::PreconditionerLowEnergy::m_signChange
bool m_signChange
Definition: PreconditionerLowEnergy.h:87

Nektar::MultiRegions::PreconditionerLowEnergy::m_map
Array< OneD, int > m_map
Definition: PreconditionerLowEnergy.h:85

Nektar::LibUtilities::eModified_B
Principal Modified Functions.
Definition: BasisType.h:49

Nektar::MultiRegions::DeterminePeriodicFaceOrient
StdRegions::Orientation DeterminePeriodicFaceOrient(StdRegions::Orientation faceOrient, StdRegions::Orientation perFaceOrient)
Determine relative orientation between two faces.
Definition: AssemblyMapCG.cpp:2137

Nektar::MultiRegions::PreconditionerLowEnergy::m_RBlk
DNekBlkMatSharedPtr m_RBlk
Definition: PreconditionerLowEnergy.h:79

Nektar::MultiRegions::PreconditionerLowEnergy::m_InvRBlk
DNekBlkMatSharedPtr m_InvRBlk
Definition: PreconditionerLowEnergy.h:80

Gs::gs_min
Definition: GsLib.hpp:53

Nektar::MultiRegions::PreconditionerLowEnergy::SetUpPyrMaxRMat
void SetUpPyrMaxRMat(int nummodesmax, LocalRegions::PyrExpSharedPtr &PyrExp, ShapeToDNekMap &maxRmat, ShapeToIntArrayMap &vertMapMaxR, ShapeToIntArrayArrayMap &edgeMapMaxR, ShapeToIntArrayArrayMap &faceMapMaxR)
Definition: PreconditionerLowEnergy.cpp:2058

Nektar::MemoryManager::AllocateSharedPtr
static std::shared_ptr< DataType > AllocateSharedPtr(const Args &...args)
Allocate a shared pointer from the memory pool.
Definition: NekMemoryManager.hpp:161

Nektar::MultiRegions::PreconditionerLowEnergy::v_DoTransformToLowEnergy
virtual void v_DoTransformToLowEnergy(Array< OneD, NekDouble > &pInOut, int offset)
Transform the solution vector to low energy.
Definition: PreconditionerLowEnergy.cpp:1076

Nektar::MultiRegions::PreconditionerLowEnergy::CreateRefPyrGeom
SpatialDomains::PyrGeomSharedPtr CreateRefPyrGeom(void)
Sets up the reference pyramidal element needed to construct a low energy basis mapping arrays...
Definition: PreconditionerLowEnergy.cpp:1599

Nektar::Transpose
NekMatrix< InnerMatrixType, BlockMatrixTag > Transpose(NekMatrix< InnerMatrixType, BlockMatrixTag > &rhs)
Definition: BlockMatrix.hpp:217

Nektar::LibUtilities::PointsKey
Defines a specification for a set of points.
Definition: Points.h:59

Nektar::MultiRegions::PreconditionerLowEnergy::SetUpReferenceElements
void SetUpReferenceElements(ShapeToDNekMap &maxRmat, ShapeToExpMap &maxElmt, ShapeToIntArrayMap &vertMapMaxR, ShapeToIntArrayArrayMap &edgeMapMaxR)
Loop expansion and determine different variants of the transformation matrix.
Definition: PreconditionerLowEnergy.cpp:1845

Nektar::NekDouble
double NekDouble
Definition: NektarUnivTypeDefs.hpp:43

Vmath::Assmb
void Assmb(int n, const T *x, const int *y, T *z)
Assemble z[y[i]] += x[i]; z should be zero'd first.
Definition: Vmath.cpp:712

Nektar::SpatialDomains::PointGeomSharedPtr
std::shared_ptr< PointGeom > PointGeomSharedPtr
Definition: Geometry.h:59

Nektar::MultiRegions::PeriodicMap
std::map< int, std::vector< PeriodicEntity > > PeriodicMap
Definition: MultiRegions.hpp:200

Nektar::eDIAGONAL
Definition: MatrixStorageType.h:44

Nektar::MultiRegions::PreconditionerLowEnergy::v_DoMultiplybyInverseTransformationMatrix
virtual void v_DoMultiplybyInverseTransformationMatrix(const Array< OneD, NekDouble > &pInput, Array< OneD, NekDouble > &pOutput)
Multiply by the block inverse transformation matrix.
Definition: PreconditionerLowEnergy.cpp:1258

Nektar::MultiRegions::GlobalLinSysKey
Describe a linear system.
Definition: GlobalLinSysKey.h:50

Nektar::MultiRegions::PreconditionerLowEnergy::v_DoTransformFromLowEnergy
virtual void v_DoTransformFromLowEnergy(Array< OneD, NekDouble > &pInOut)
Transform the solution vector from low energy back to the original basis.
Definition: PreconditionerLowEnergy.cpp:1202

Nektar::LibUtilities::ReduceMax
Definition: Comm.h:68

Nektar::LocalRegions::PyrExpSharedPtr
std::shared_ptr< PyrExp > PyrExpSharedPtr
Definition: PyrExp.h:191

MatrixKey.h

point
bg::model::point< double, 3, bg::cs::cartesian > point
Definition: BLMesh.cpp:53

Nektar::MultiRegions::PreconditionerLowEnergy::CreateRefTetGeom
SpatialDomains::TetGeomSharedPtr CreateRefTetGeom(void)
Sets up the reference tetrahedral element needed to construct a low energy basis.
Definition: PreconditionerLowEnergy.cpp:1683

Nektar::LocalRegions::ExpansionSharedPtr
std::shared_ptr< Expansion > ExpansionSharedPtr
Definition: Expansion.h:65

Nektar::SpatialDomains::PyrGeomSharedPtr
std::shared_ptr< PyrGeom > PyrGeomSharedPtr
Definition: PyrGeom.h:80

Nektar::StdRegions::eMass
Definition: StdRegions.hpp:102

Nektar::LocalRegions::PrismExpSharedPtr
std::shared_ptr< PrismExp > PrismExpSharedPtr
Definition: PrismExp.h:220

Gs::gs_add
Definition: GsLib.hpp:53

Nektar::LocalRegions::Expansion2DSharedPtr
std::shared_ptr< Expansion2D > Expansion2DSharedPtr
Definition: Expansion1D.h:47

Nektar::StdRegions::StdExpansion::as
std::shared_ptr< T > as()
Definition: StdExpansion.h:1416

Nektar::SpatialDomains::HexGeomSharedPtr
std::shared_ptr< HexGeom > HexGeomSharedPtr
Definition: HexGeom.h:90

Gs::gs_data
Definition: GsLib.hpp:128

Nektar::LibUtilities::eGaussRadauMAlpha2Beta0
Gauss Radau pinned at x=-1, $\alpha = 2, \beta = 0$.
Definition: PointsType.h:59

Nektar::eFULL
Definition: MatrixStorageType.h:43

Nektar::MultiRegions::PreconditionerLowEnergy::SetupBlockTransformationMatrix
void SetupBlockTransformationMatrix(void)
Definition: PreconditionerLowEnergy.cpp:957

Nektar::OneD
Definition: NektarUnivTypeDefs.hpp:52

Nektar::LibUtilities::ePrism
Definition: ShapeType.hpp:62

Nektar::MultiRegions::PreconditionerLowEnergy::CreateRefPrismGeom
SpatialDomains::PrismGeomSharedPtr CreateRefPrismGeom(void)
Sets up the reference prismatic element needed to construct a low energy basis.
Definition: PreconditionerLowEnergy.cpp:1517

Nektar::MultiRegions::eIterativeStaticCond
Definition: MultiRegions.hpp:83

Nektar::MultiRegions::GlobalSysSolnType
GlobalSysSolnType
Definition: MultiRegions.hpp:76

Nektar::LibUtilities::NekFactory::RegisterCreatorFunction
tKey RegisterCreatorFunction(tKey idKey, CreatorFunction classCreator, std::string pDesc="")
Register a class with the factory.
Definition: NekFactory.hpp:199

Nektar::LibUtilities::eTetrahedron
Definition: ShapeType.hpp:60

Nektar::StdRegions::Orientation
Orientation
Definition: StdRegions.hpp:317

Nektar::SpatialDomains::PrismGeomSharedPtr
std::shared_ptr< PrismGeom > PrismGeomSharedPtr
Definition: PrismGeom.h:88

Nektar::StdRegions::eDir1FwdDir1_Dir2FwdDir2
Definition: StdRegions.hpp:324

Nektar::MultiRegions::PreconditionerLowEnergy::CreateMultiplicityMap
void CreateMultiplicityMap(void)
Definition: PreconditionerLowEnergy.cpp:1441

ASSERTL1
#define ASSERTL1(condition, msg)
Assert Level 1 – Debugging which is used whether in FULLDEBUG or DEBUG compilation mode...
Definition: ErrorUtil.hpp:250

Nektar::SpatialDomains::SegGeomSharedPtr
std::shared_ptr< SegGeom > SegGeomSharedPtr
Definition: Geometry2D.h:62

Vmath::Vcopy
void Vcopy(int n, const T *x, const int incx, T *y, const int incy)
Definition: Vmath.cpp:1064

Nektar::MultiRegions::Preconditioner::m_locToGloMap
std::weak_ptr< AssemblyMap > m_locToGloMap
Definition: Preconditioner.h:136

Nektar::MultiRegions::PreconditionerLowEnergy::ReSetPrismMaxRMat
void ReSetPrismMaxRMat(int nummodesmax, LocalRegions::PrismExpSharedPtr &PirsmExp, ShapeToDNekMap &maxRmat, ShapeToIntArrayMap &vertMapMaxR, ShapeToIntArrayArrayMap &edgeMapMaxR, ShapeToIntArrayArrayMap &faceMapMaxR, bool UseTetOnly)
Definition: PreconditionerLowEnergy.cpp:2253

Nektar::LocalRegions::Expansion2D
Definition: Expansion2D.h:58

Nektar::LibUtilities::BasisKey
Describes the specification for a Basis.
Definition: Basis.h:49

GlobalLinSysIterativeStaticCond.h

Nektar::StdRegions::MatrixType
MatrixType
Definition: StdRegions.hpp:100

Nektar::LibUtilities::eGaussLobattoLegendre
1D Gauss-Lobatto-Legendre quadrature points
Definition: PointsType.h:51

Nektar::LocalRegions::Expansion3D
Definition: Expansion3D.h:57

Vmath::Vmul
void Vmul(int n, const T *x, const int incx, const T *y, const int incy, T *z, const int incz)
Multiply vector z = x*y.
Definition: Vmath.cpp:186

Nektar::LibUtilities::ePyramid
Definition: ShapeType.hpp:61

Nektar::StdRegions::ePreconRMass
Definition: StdRegions.hpp:139