Classes
class	BwdTrans_StdMat
	Backward transform operator using standard matrix approach. More...

class	BwdTrans_MatrixFree
	Backward transform operator using matrix free operators. More...

class	BwdTrans_IterPerExp
	Backward transform operator using default StdRegions operator. More...

class	BwdTrans_NoCollection
	Backward transform operator using LocalRegions implementation. More...

class	BwdTrans_SumFac_Seg
	Backward transform operator using sum-factorisation (Segment) More...

class	BwdTrans_SumFac_Quad
	Backward transform operator using sum-factorisation (Quad) More...

class	BwdTrans_SumFac_Tri
	Backward transform operator using sum-factorisation (Tri) More...

class	BwdTrans_SumFac_Hex
	Backward transform operator using sum-factorisation (Hex) More...

class	BwdTrans_SumFac_Tet
	Backward transform operator using sum-factorisation (Tet) More...

class	BwdTrans_SumFac_Prism
	Backward transform operator using sum-factorisation (Prism) More...

class	BwdTrans_SumFac_Pyr
	Backward transform operator using sum-factorisation (Pyr) More...

class	CoalescedGeomData

class	Collection
	Collection. More...

class	OpImpTimingKey

class	CollectionOptimisation

class	Helmholtz_NoCollection
	Helmholtz operator using LocalRegions implementation. More...

class	Helmholtz_IterPerExp
	Helmholtz operator using element-wise operation. More...

class	Helmholtz_MatrixFree
	Helmholtz operator using matrix free operators. More...

class	IProductWRTBase_StdMat
	Inner product operator using standard matrix approach. More...

class	IProductWRTBase_MatrixFree
	Inner product operator using matrix free operators. More...

class	IProductWRTBase_IterPerExp
	Inner product operator using element-wise operation. More...

class	IProductWRTBase_NoCollection
	Inner product operator using original MultiRegions implementation. More...

class	IProductWRTBase_SumFac_Seg
	Inner product operator using sum-factorisation (Segment) More...

class	IProductWRTBase_SumFac_Quad
	Inner product operator using sum-factorisation (Quad) More...

class	IProductWRTBase_SumFac_Tri
	Inner product operator using sum-factorisation (Tri) More...

class	IProductWRTBase_SumFac_Hex
	Inner product operator using sum-factorisation (Hex) More...

class	IProductWRTBase_SumFac_Tet
	Inner product operator using sum-factorisation (Tet) More...

class	IProductWRTBase_SumFac_Prism
	Inner product operator using sum-factorisation (Prism) More...

class	IProductWRTBase_SumFac_Pyr
	Inner product operator using sum-factorisation (Pyr) More...

class	IProductWRTDerivBase_StdMat
	Inner product WRT deriv base operator using standard matrix approach. More...

class	IProductWRTDerivBase_MatrixFree
	Inner product WRT deriv base operator using matrix free operators. More...

class	IProductWRTDerivBase_IterPerExp
	Inner product WRT deriv base operator using element-wise operation. More...

class	IProductWRTDerivBase_NoCollection
	Inner product WRT deriv base operator using LocalRegions implementation. More...

class	IProductWRTDerivBase_SumFac_Seg
	Inner product WRT deriv base operator using sum-factorisation (Segment) More...

class	IProductWRTDerivBase_SumFac_Quad
	Inner product WRT deriv base operator using sum-factorisation (Quad) More...

class	IProductWRTDerivBase_SumFac_Tri
	Inner product WRT deriv base operator using sum-factorisation (Tri) More...

class	IProductWRTDerivBase_SumFac_Hex
	Inner product WRT deriv base operator using sum-factorisation (Hex) More...

class	IProductWRTDerivBase_SumFac_Tet
	Inner product WRT deriv base operator using sum-factorisation (Tet) More...

class	IProductWRTDerivBase_SumFac_Prism
	Inner product WRT deriv base operator using sum-factorisation (Prism) More...

class	IProductWRTDerivBase_SumFac_Pyr
	Inner product WRT deriv base operator using sum-factorisation (Pyr) More...

class	MatrixFreeBase

class	MatrixFreeOneInOneOut

class	MatrixFreeMultiInOneOut

class	MatrixFreeOneInMultiOut

class	Operator
	Base class for operators on a collection of elements. More...

class	PhysDeriv_StdMat
	Phys deriv operator using standard matrix approach. More...

class	PhysDeriv_MatrixFree
	Phys deriv operator using matrix free operators. More...

class	PhysDeriv_IterPerExp
	Phys deriv operator using element-wise operation. More...

class	PhysDeriv_NoCollection
	Phys deriv operator using original LocalRegions implementation. More...

class	PhysDeriv_SumFac_Seg
	Phys deriv operator using sum-factorisation (Segment) More...

class	PhysDeriv_SumFac_Quad
	Phys deriv operator using sum-factorisation (Quad) More...

class	PhysDeriv_SumFac_Tri
	Phys deriv operator using sum-factorisation (Tri) More...

class	PhysDeriv_SumFac_Hex
	Phys deriv operator using sum-factorisation (Hex) More...

class	PhysDeriv_SumFac_Tet
	Phys deriv operator using sum-factorisation (Tet) More...

class	PhysDeriv_SumFac_Prism
	Phys deriv operator using sum-factorisation (Prism) More...

class	PhysDeriv_SumFac_Pyr
	Phys deriv operator using sum-factorisation (Pyramid) More...

Typedefs
using	vec_t = simd< NekDouble >

typedef std::vector< vec_t, tinysimd::allocator< vec_t > >	VecVec_t

typedef std::shared_ptr< CoalescedGeomData >	CoalescedGeomDataSharedPtr

typedef std::vector< Collection >	CollectionVector

typedef std::shared_ptr< CollectionVector >	CollectionVectorSharedPtr

typedef bool	ExpansionIsNodal

typedef std::map< OperatorType, ImplementationType >	OperatorImpMap

typedef std::shared_ptr< Operator >	OperatorSharedPtr
	Shared pointer to an Operator object. More...

typedef std::tuple< LibUtilities::ShapeType, OperatorType, ImplementationType, ExpansionIsNodal >	OperatorKey
	Key for describing an Operator. More...

typedef Nektar::LibUtilities::NekFactory< OperatorKey, Operator, std::vector< StdRegions::StdExpansionSharedPtr >, CoalescedGeomDataSharedPtr, StdRegions::FactorMap >	OperatorFactory
	Operator factory definition. More...

Enumerations
enum	GeomData { eJac , eJacWithStdWeights , eDerivFactors }

enum	OperatorType { eBwdTrans , eHelmholtz , eIProductWRTBase , eIProductWRTDerivBase , ePhysDeriv , SIZE_OperatorType }

enum	ImplementationType { eNoImpType , eNoCollection , eIterPerExp , eStdMat , eSumFac , eMatrixFree , SIZE_ImplementationType }

Functions
void	QuadIProduct (bool colldir0, bool colldir1, int numElmt, int nquad0, int nquad1, int nmodes0, int nmodes1, const Array< OneD, const NekDouble > &base0, const Array< OneD, const NekDouble > &base1, const Array< OneD, const NekDouble > &jac, const Array< OneD, const NekDouble > &input, Array< OneD, NekDouble > &output, Array< OneD, NekDouble > &wsp)

void	TriIProduct (bool sortTopVertex, int numElmt, int nquad0, int nquad1, int nmodes0, int nmodes1, const Array< OneD, const NekDouble > &base0, const Array< OneD, const NekDouble > &base1, const Array< OneD, const NekDouble > &jac, const Array< OneD, const NekDouble > &input, Array< OneD, NekDouble > &output, Array< OneD, NekDouble > &wsp)

void	HexIProduct (bool colldir0, bool colldir1, bool colldir2, int numElmt, int nquad0, int nquad1, int nquad2, int nmodes0, int nmodes1, int nmodes2, const Array< OneD, const NekDouble > &base0, const Array< OneD, const NekDouble > &base1, const Array< OneD, const NekDouble > &base2, const Array< OneD, const NekDouble > &jac, const Array< OneD, const NekDouble > &input, Array< OneD, NekDouble > &output, Array< OneD, NekDouble > &wsp)

void	PrismIProduct (bool sortTopVert, int numElmt, int nquad0, int nquad1, int nquad2, int nmodes0, int nmodes1, int nmodes2, const Array< OneD, const NekDouble > &base0, const Array< OneD, const NekDouble > &base1, const Array< OneD, const NekDouble > &base2, const Array< OneD, const NekDouble > &jac, const Array< OneD, const NekDouble > &input, Array< OneD, NekDouble > &output, Array< OneD, NekDouble > &wsp)

void	PyrIProduct (bool sortTopVert, int numElmt, int nquad0, int nquad1, int nquad2, int nmodes0, int nmodes1, int nmodes2, const Array< OneD, const NekDouble > &base0, const Array< OneD, const NekDouble > &base1, const Array< OneD, const NekDouble > &base2, const Array< OneD, const NekDouble > &jac, const Array< OneD, const NekDouble > &input, Array< OneD, NekDouble > &output, Array< OneD, NekDouble > &wsp)

void	TetIProduct (bool sortTopEdge, int numElmt, int nquad0, int nquad1, int nquad2, int nmodes0, int nmodes1, int nmodes2, const Array< OneD, const NekDouble > &base0, const Array< OneD, const NekDouble > &base1, const Array< OneD, const NekDouble > &base2, const Array< OneD, const NekDouble > &jac, const Array< OneD, const NekDouble > &input, Array< OneD, NekDouble > &output, Array< OneD, NekDouble > &wsp)

bool	operator< (OperatorKey const &p1, OperatorKey const &p2)
	Less-than comparison operator for OperatorKey objects. More...

std::ostream &	operator<< (std::ostream &os, OperatorKey const &p)
	Stream output operator for OperatorKey objects. More...

OperatorFactory &	GetOperatorFactory ()
	Returns the singleton Operator factory object. More...

OperatorImpMap	SetFixedImpType (ImplementationType defaultType)
	simple Operator Implementation Map generator More...

Variables
static CoalescedGeomDataSharedPtr	GeomDataNull

const char *const	OperatorTypeMap []

const char *const	OperatorTypeMap1 []

const char *const	ImplementationTypeMap []

const char *const	ImplementationTypeMap1 []

Typedef Documentation

◆ CoalescedGeomDataSharedPtr

typedef std::shared_ptr< CoalescedGeomData > Nektar::Collections::CoalescedGeomDataSharedPtr

Definition at line 92 of file CoalescedGeomData.h.

◆ CollectionVector

typedef std::vector<Collection> Nektar::Collections::CollectionVector

Definition at line 110 of file Collection.h.

◆ CollectionVectorSharedPtr

typedef std::shared_ptr<CollectionVector> Nektar::Collections::CollectionVectorSharedPtr

Definition at line 111 of file Collection.h.

◆ ExpansionIsNodal

typedef bool Nektar::Collections::ExpansionIsNodal

Definition at line 110 of file Operator.h.

◆ OperatorFactory

typedef Nektar::LibUtilities::NekFactory< OperatorKey, Operator, std::vector<StdRegions::StdExpansionSharedPtr>, CoalescedGeomDataSharedPtr, StdRegions::FactorMap> Nektar::Collections::OperatorFactory

Operator factory definition.

Definition at line 189 of file Operator.h.

◆ OperatorImpMap

typedef std::map<OperatorType, ImplementationType> Nektar::Collections::OperatorImpMap

Definition at line 112 of file Operator.h.

◆ OperatorKey

typedef std::tuple<LibUtilities::ShapeType, OperatorType, ImplementationType, ExpansionIsNodal> Nektar::Collections::OperatorKey

Key for describing an Operator.

Definition at line 177 of file Operator.h.

◆ OperatorSharedPtr

typedef std::shared_ptr<Operator> Nektar::Collections::OperatorSharedPtr

Shared pointer to an Operator object.

Definition at line 172 of file Operator.h.

◆ vec_t

using Nektar::Collections::vec_t = simd<NekDouble>

Definition at line 49 of file CoalescedGeomData.h.

◆ VecVec_t

typedef std::vector<vec_t, tinysimd::allocator<vec_t> > Nektar::Collections::VecVec_t

Definition at line 50 of file CoalescedGeomData.h.

Enumeration Type Documentation

◆ GeomData

enum Nektar::Collections::GeomData

Enumerator
eJac
eJacWithStdWeights
eDerivFactors

Definition at line 52 of file CoalescedGeomData.h.

 {
     // No explicit values are given, so the enumerators number consecutively
     // from zero in declaration order.
     eJac,
     eJacWithStdWeights,
     eDerivFactors
 };

◆ ImplementationType

enum Nektar::Collections::ImplementationType

Enumerator
eNoImpType
eNoCollection
eIterPerExp
eStdMat
eSumFac
eMatrixFree
SIZE_ImplementationType

Definition at line 83 of file Operator.h.

 {
     // No explicit values are given, so the enumerators number consecutively
     // from zero; operator<< for OperatorKey uses the value as an index into
     // ImplementationTypeMap.
     eNoImpType,
     eNoCollection,
     eIterPerExp,
     eStdMat,
     eSumFac,
     eMatrixFree,
     // Declared last, so its value equals the number of enumerators above.
     SIZE_ImplementationType
 };

◆ OperatorType

enum Nektar::Collections::OperatorType

Enumerator
eBwdTrans
eHelmholtz
eIProductWRTBase
eIProductWRTDerivBase
ePhysDeriv
SIZE_OperatorType

Definition at line 66 of file Operator.h.

 {
     // No explicit values are given, so the enumerators number consecutively
     // from zero; operator<< for OperatorKey uses the value as an index into
     // OperatorTypeMap.
     eBwdTrans,
     eHelmholtz,
     eIProductWRTBase,
     eIProductWRTDerivBase,
     ePhysDeriv,
     // Declared last, so its value equals the number of operator types above;
     // SetFixedImpType() uses it as the exclusive upper bound of its loop.
     SIZE_OperatorType
 };

Function Documentation

◆ GetOperatorFactory()

OperatorFactory & Nektar::Collections::GetOperatorFactory ( )

Returns the singleton Operator factory object.

Definition at line 117 of file Operator.cpp.

 {
     static OperatorFactory instance;
     return instance;
 }

Referenced by Nektar::Collections::BwdTrans_MatrixFree::BwdTrans_MatrixFree(), Nektar::Collections::Helmholtz_MatrixFree::Helmholtz_MatrixFree(), Nektar::Collections::Collection::Initialise(), Nektar::Collections::IProductWRTBase_MatrixFree::IProductWRTBase_MatrixFree(), Nektar::Collections::IProductWRTDerivBase_MatrixFree::IProductWRTDerivBase_MatrixFree(), Nektar::Collections::PhysDeriv_MatrixFree::PhysDeriv_MatrixFree(), and Nektar::Collections::CollectionOptimisation::SetWithTimings().

◆ HexIProduct()

void Nektar::Collections::HexIProduct	(	bool	colldir0,
		bool	colldir1,
		bool	colldir2,
		int	numElmt,
		int	nquad0,
		int	nquad1,
		int	nquad2,
		int	nmodes0,
		int	nmodes1,
		int	nmodes2,
		const Array< OneD, const NekDouble > &	base0,
		const Array< OneD, const NekDouble > &	base1,
		const Array< OneD, const NekDouble > &	base2,
		const Array< OneD, const NekDouble > &	jac,
		const Array< OneD, const NekDouble > &	input,
		Array< OneD, NekDouble > &	output,
		Array< OneD, NekDouble > &	wsp
	)

Definition at line 173 of file IProduct.cpp.

 {
     // Inner product for numElmt hexahedral elements, applied one direction at
     // a time.
     //
     // The input is first multiplied entry-by-entry with jac. If all three
     // colldir flags are set that product is written straight to output and
     // nothing else is done. Otherwise the product goes to wsp and each
     // direction d = 0, 1, 2 is processed in turn: a strided Vcopy when
     // colldir<d> is set, or a Dgemm against base<d> when it is not.
     //
     // wsp is used as scratch and is carved into three consecutive regions
     // (wsp, wsp1, wsp2) by the offsets computed below.
     int totmodes  = nmodes0 * nmodes1 * nmodes2;
     int totpoints = nquad0 * nquad1 * nquad2;
  
     if (colldir0 && colldir1 && colldir2)
     {
  
         // All directions flagged: the weighted input is the final result.
         Vmath::Vmul(numElmt * totpoints, jac, 1, input, 1, output, 1);
     }
     else
     {
         // Weighted input for all elements, stored at the start of wsp.
         Vmath::Vmul(numElmt * totpoints, jac, 1, input, 1, wsp, 1);
  
         // Assign second half of workspace for 2nd DGEMM operation.
         Array<OneD, NekDouble> wsp1 = wsp + totpoints * numElmt;
  
         // not sure what criterion we should use to swap around these
         // strategies
         // The `|| 1` makes this condition always true, so the per-element
         // strategy below is the only one that ever runs; the else branch is
         // currently unreachable.
         if (numElmt < nmodes0 || 1)
         {
             // Third scratch region, placed after the direction-0 result of a
             // single element (nmodes0 * nquad1 * nquad2 entries).
             Array<OneD, NekDouble> wsp2 = wsp1 + nmodes0 * nquad1 * nquad2;
  
             // loop over elements
             for (int n = 0; n < numElmt; ++n)
             {
                 // Direction 0: element n's slice of wsp -> wsp1.
                 if (colldir0)
                 {
  
                     for (int i = 0; i < nmodes0; ++i)
                     {
                         Vmath::Vcopy(nquad1 * nquad2, &wsp[n * totpoints] + i,
                                      nquad0, wsp1.get() + nquad1 * nquad2 * i,
                                      1);
                     }
                 }
                 else
                 {
                     Blas::Dgemm('T', 'N', nquad1 * nquad2, nmodes0, nquad0, 1.0,
                                 &wsp[n * totpoints], nquad0, base0.get(),
                                 nquad0, 0.0, wsp1.get(), nquad1 * nquad2);
                 }
  
                 // Direction 1: wsp1 -> wsp2.
                 if (colldir1)
                 {
                     // reshuffle data for next operation.
                     for (int i = 0; i < nmodes1; ++i)
                     {
                         Vmath::Vcopy(nquad2 * nmodes0, wsp1.get() + i, nquad1,
                                      wsp2.get() + nquad2 * nmodes0 * i, 1);
                     }
                 }
                 else
                 {
                     Blas::Dgemm('T', 'N', nquad2 * nmodes0, nmodes1, nquad1,
                                 1.0, wsp1.get(), nquad1, base1.get(), nquad1,
                                 0.0, wsp2.get(), nquad2 * nmodes0);
                 }
  
                 // Direction 2: wsp2 -> element n's totmodes-long slice of
                 // output.
                 if (colldir2)
                 {
                     // reshuffle data for next operation.
                     for (int i = 0; i < nmodes2; ++i)
                     {
                         Vmath::Vcopy(
                             nmodes0 * nmodes1, wsp2.get() + i, nquad2,
                             &output[n * totmodes] + nmodes0 * nmodes1 * i, 1);
                     }
                 }
                 else
                 {
                     Blas::Dgemm('T', 'N', nmodes0 * nmodes1, nmodes2, nquad2,
                                 1.0, wsp2.get(), nquad2, base2.get(), nquad2,
                                 0.0, &output[n * totmodes], nmodes0 * nmodes1);
                 }
             }
         }
         else
         {
             // Unreachable while the condition above contains `|| 1`.
             // Alternative strategy: process all elements in one call per
             // direction, then reorder the result at the end.
             Array<OneD, NekDouble> wsp2 =
                 wsp1 + numElmt * (max(totpoints, totmodes));
  
             if (colldir0)
             {
                 for (int i = 0; i < nquad0; ++i)
                 {
                     Vmath::Vcopy(nquad1 * nquad2 * numElmt, &wsp[i], nquad0,
                                  &wsp1[i * nquad1 * nquad2 * numElmt], 1);
                 }
             }
             else
             {
                 // large dgemm but copy at end.
                 Blas::Dgemm('T', 'N', nquad1 * nquad2 * numElmt, nmodes0,
                             nquad0, 1.0, &wsp[0], nquad0, base0.get(), nquad0,
                             0.0, &wsp1[0], nquad1 * nquad2 * numElmt);
             }
  
             if (colldir1)
             {
                 for (int i = 0; i < nquad1; ++i)
                 {
                     Vmath::Vcopy(nquad2 * numElmt * nmodes0, &wsp1[i], nquad1,
                                  &wsp2[i * nquad2 * numElmt * nmodes0], 1);
                 }
             }
             else
             {
                 Blas::Dgemm('T', 'N', nquad2 * numElmt * nmodes0, nmodes1,
                             nquad1, 1.0, &wsp1[0], nquad1, base1.get(), nquad1,
                             0.0, &wsp2[0], nquad2 * numElmt * nmodes0);
             }
  
             if (numElmt > 1)
             {
                 // NOTE(review): with colldir2 set this branch writes to
                 // output, yet the reordering loop below still reads wsp1,
                 // which is not written in this stage - confirm the intent
                 // before re-enabling this path.
                 if (colldir2)
                 {
                     for (int i = 0; i < nquad2; ++i)
                     {
                         Vmath::Vcopy(nmodes0 * nmodes1, &wsp2[i], nquad2,
                                      &output[i * nmodes0 * nmodes1], 1);
                     }
                 }
                 else
                 {
                     Blas::Dgemm('T', 'N', numElmt * nmodes0 * nmodes1, nmodes2,
                                 nquad2, 1.0, &wsp2[0], nquad2, base2.get(),
                                 nquad2, 0.0, &wsp1[0],
                                 numElmt * nmodes0 * nmodes1);
                 }
  
                 // Scatter the numElmt consecutive values of each mode i to
                 // output[i], output[i + totmodes], ...
                 for (int i = 0; i < totmodes; ++i)
                 {
                     Vmath::Vcopy(numElmt, &wsp1[i * numElmt], 1, &output[i],
                                  totmodes);
                 }
             }
             else
             {
                 // Single element: the last stage writes directly to output.
                 if (colldir2)
                 {
                     for (int i = 0; i < nquad2; ++i)
                     {
                         Vmath::Vcopy(nmodes0 * nmodes1, &wsp2[i], nquad2,
                                      &output[i * nmodes0 * nmodes1], 1);
                     }
                 }
                 else
                 {
                     Blas::Dgemm('T', 'N', numElmt * nmodes0 * nmodes1, nmodes2,
                                 nquad2, 1.0, &wsp2[0], nquad2, base2.get(),
                                 nquad2, 0.0, &output[0],
                                 numElmt * nmodes0 * nmodes1);
                 }
             }
         }
     }
 }

References Blas::Dgemm(), Vmath::Vcopy(), and Vmath::Vmul().

Referenced by Nektar::Collections::IProductWRTDerivBase_SumFac_Hex::operator()(), and Nektar::Collections::IProductWRTBase_SumFac_Hex::operator()().

◆ operator<()

bool Nektar::Collections::operator<	(	OperatorKey const &	p1,
		OperatorKey const &	p2
	)

Less-than comparison operator for OperatorKey objects.

Definition at line 56 of file Operator.cpp.

 {
     if (std::get<0>(p1) < std::get<0>(p2))
     {
         return true;
     }
     if (std::get<0>(p1) > std::get<0>(p2))
     {
         return false;
     }
     if (std::get<1>(p1) < std::get<1>(p2))
     {
         return true;
     }
     if (std::get<1>(p1) > std::get<1>(p2))
     {
         return false;
     }
     if (std::get<2>(p1) < std::get<2>(p2))
     {
         return true;
     }
     if (std::get<2>(p1) > std::get<2>(p2))
     {
         return false;
     }
  
     if (std::get<3>(p1) < std::get<3>(p2))
     {
         return true;
     }
     if (std::get<3>(p1) > std::get<3>(p2))
     {
         return false;
     }
  
     return false;
 }

◆ operator<<()

std::ostream & Nektar::Collections::operator<<	(	std::ostream &	os,
		OperatorKey const &	p
	)

Stream output operator for OperatorKey objects.

Definition at line 98 of file Operator.cpp.

 {
     os << LibUtilities::ShapeTypeMap[std::get<0>(p)] << ", "
        << OperatorTypeMap[std::get<1>(p)] << ", "
        << ImplementationTypeMap[std::get<2>(p)] << ", "
        << (std::get<3>(p) ? "Nodal" : "Modal");
     return os;
 }

References ImplementationTypeMap, OperatorTypeMap, and Nektar::LibUtilities::ShapeTypeMap.

◆ PrismIProduct()

void Nektar::Collections::PrismIProduct	(	bool	sortTopVert,
		int	numElmt,
		int	nquad0,
		int	nquad1,
		int	nquad2,
		int	nmodes0,
		int	nmodes1,
		int	nmodes2,
		const Array< OneD, const NekDouble > &	base0,
		const Array< OneD, const NekDouble > &	base1,
		const Array< OneD, const NekDouble > &	base2,
		const Array< OneD, const NekDouble > &	jac,
		const Array< OneD, const NekDouble > &	input,
		Array< OneD, NekDouble > &	output,
		Array< OneD, NekDouble > &	wsp
	)

Definition at line 342 of file IProduct.cpp.

 {
     // Inner product for numElmt prismatic elements, applied one direction at
     // a time across all elements at once.
     //
     // Steps: weight input by jac into wsp; Dgemm against base0 (wsp -> wsp1);
     // Dgemm against base1 (wsp1 -> wsp); then one Dgemm per (i, j) mode pair
     // against the matching slice of base2, written into output. wsp is
     // scratch and is overwritten.
     int totmodes = LibUtilities::StdPrismData::getNumberOfCoefficients(
         nmodes0, nmodes1, nmodes2);
     int totpoints = nquad0 * nquad1 * nquad2;
     int cnt;
     int mode, mode1;
  
     Vmath::Vmul(numElmt * totpoints, jac, 1, input, 1, wsp, 1);
  
     // Second scratch region, offset past the larger of the two uses of the
     // first region.
     Array<OneD, NekDouble> wsp1 =
         wsp + numElmt * nquad2 * (max(nquad0 * nquad1, nmodes0 * nmodes1));
  
     // Perform iproduct  with respect to the  '0' direction
     Blas::Dgemm('T', 'N', nquad1 * nquad2 * numElmt, nmodes0, nquad0, 1.0,
                 wsp.get(), nquad0, base0.get(), nquad0, 0.0, wsp1.get(),
                 nquad1 * nquad2 * numElmt);
  
     // Perform iproduct  with respect to the  '1' direction
     Blas::Dgemm('T', 'N', nquad2 * numElmt * nmodes0, nmodes1, nquad1, 1.0,
                 wsp1.get(), nquad1, base1.get(), nquad1, 0.0, wsp.get(),
                 nquad2 * numElmt * nmodes0);
  
     // Inner product with respect to the '2' direction (not sure if it would
     // be better to swap loops?)
     // mode  : column offset into base2, advanced by (nmodes2 - i) once per i.
     // mode1 : offset into output, advanced by (nmodes2 - i) per (i, j) pair.
     // cnt   : offset into wsp for the current i.
     mode = mode1 = cnt = 0;
     for (int i = 0; i < nmodes0; ++i)
     {
         cnt = i * nquad2 * numElmt;
         for (int j = 0; j < nmodes1; ++j)
         {
             // Leading dimension totmodes: column n of the result lands in
             // element n's totmodes-long slice of output.
             Blas::Dgemm('T', 'N', nmodes2 - i, numElmt, nquad2, 1.0,
                         base2.get() + mode * nquad2, nquad2,
                         wsp.get() + j * nquad2 * numElmt * nmodes0 + cnt,
                         nquad2, 0.0, output.get() + mode1, totmodes);
             mode1 += nmodes2 - i;
         }
         mode += nmodes2 - i;
     }
  
     // fix for modified basis by splitting top vertex mode
     // NOTE(review): the signature rendered for this function names the flag
     // `sortTopVert`, while this body reads `sortTopVertex` - presumably the
     // declaration and definition use different parameter names; confirm.
     if (sortTopVertex)
     {
         // top singular vertex
         // ((1+a)/2 components entry into (1+c)/2)
         // Could be made into an mxv if we have specialised base1[1]
         for (int j = 0; j < nmodes1; ++j)
         {
             // beta = 1.0: the result is added to what output already holds.
             Blas::Dgemv('T', nquad2, numElmt, 1.0,
                         wsp.get() + j * nquad2 * numElmt * nmodes0 +
                             nquad2 * numElmt,
                         nquad2, base2.get() + nquad2, 1, 1.0,
                         &output[j * nmodes2 + 1], totmodes);
         }
     }
 }

References Blas::Dgemm(), Blas::Dgemv(), Nektar::LibUtilities::StdPrismData::getNumberOfCoefficients(), and Vmath::Vmul().

Referenced by Nektar::Collections::IProductWRTDerivBase_SumFac_Prism::operator()(), and Nektar::Collections::IProductWRTBase_SumFac_Prism::operator()().

◆ PyrIProduct()

void Nektar::Collections::PyrIProduct	(	bool	sortTopVert,
		int	numElmt,
		int	nquad0,
		int	nquad1,
		int	nquad2,
		int	nmodes0,
		int	nmodes1,
		int	nmodes2,
		const Array< OneD, const NekDouble > &	base0,
		const Array< OneD, const NekDouble > &	base1,
		const Array< OneD, const NekDouble > &	base2,
		const Array< OneD, const NekDouble > &	jac,
		const Array< OneD, const NekDouble > &	input,
		Array< OneD, NekDouble > &	output,
		Array< OneD, NekDouble > &	wsp
	)

Definition at line 409 of file IProduct.cpp.

 {
     // Inner product for numElmt pyramidal elements, applied one direction at
     // a time across all elements at once.
     //
     // Steps: weight input by jac into wsp; Dgemm against base0 (wsp -> wsp1);
     // one Dgemm per i against base1 (wsp1 -> wsp); then one Dgemm per (i, j)
     // mode pair against the matching slice of base2, written into output.
     // wsp is scratch and is overwritten.
     int totmodes = LibUtilities::StdPyrData::getNumberOfCoefficients(
         nmodes0, nmodes1, nmodes2);
     int totpoints = nquad0 * nquad1 * nquad2;
     int cnt;
     int mode, mode1;
  
     // Checks that wsp can hold both scratch regions used below.
     ASSERTL1(wsp.size() >=
                  numElmt * (nquad1 * nquad2 * nmodes0 +
                             nquad2 * max(nquad0 * nquad1, nmodes0 * nmodes1)),
              "Insufficient workspace size");
  
     Vmath::Vmul(numElmt * totpoints, jac, 1, input, 1, wsp, 1);
  
     // Second scratch region, offset past the larger of the two uses of the
     // first region.
     Array<OneD, NekDouble> wsp1 =
         wsp + numElmt * nquad2 * (max(nquad0 * nquad1, nmodes0 * nmodes1));
  
     // Perform iproduct  with respect to the  '0' direction
     Blas::Dgemm('T', 'N', nquad1 * nquad2 * numElmt, nmodes0, nquad0, 1.0,
                 wsp.get(), nquad0, base0.get(), nquad0, 0.0, wsp1.get(),
                 nquad1 * nquad2 * numElmt);
  
     // Inner product with respect to the '1' direction
     // mode counts the (i, j) blocks written so far; each block is
     // nquad2 * numElmt entries long.
     mode = 0;
     for (int i = 0; i < nmodes0; ++i)
     {
         Blas::Dgemm('T', 'N', nquad2 * numElmt, nmodes1, nquad1, 1.0,
                     wsp1.get() + i * nquad1 * nquad2 * numElmt, nquad1,
                     base1.get(), nquad1, 0.0,
                     wsp.get() + mode * nquad2 * numElmt, nquad2 * numElmt);
         mode += nmodes1;
     }
  
     // Inner product with respect to the '2' direction
     // mode  : column offset into base2.
     // mode1 : offset into output.
     // cnt   : running (i, j) block index into wsp.
     mode = mode1 = cnt = 0;
     for (int i = 0; i < nmodes0; ++i)
     {
         for (int j = 0; j < nmodes1; ++j, ++cnt)
         {
             // Each (i, j) pair contributes nmodes2 - max(i, j) modes.
             int ijmax = max(i, j);
             // Leading dimension totmodes: column n of the result lands in
             // element n's totmodes-long slice of output.
             Blas::Dgemm('T', 'N', nmodes2 - ijmax, numElmt, nquad2, 1.0,
                         base2.get() + mode * nquad2, nquad2,
                         wsp.get() + cnt * nquad2 * numElmt, nquad2, 0.0,
                         output.get() + mode1, totmodes);
             mode += nmodes2 - ijmax;
             mode1 += nmodes2 - ijmax;
         }
  
         // increment mode in case order1!=order2
         // (advances only the base2 offset; nothing is written to output)
         for (int j = nmodes1; j < nmodes2; ++j)
         {
             int ijmax = max(i, j);
             mode += nmodes2 - ijmax;
         }
     }
  
     // fix for modified basis for top singular vertex component
     // Already have evaluated (1+c)/2 (1-b)/2 (1-a)/2
     // NOTE(review): the signature rendered for this function names the flag
     // `sortTopVert`, while this body reads `sortTopVertex` - presumably the
     // declaration and definition use different parameter names; confirm.
     if (sortTopVertex)
     {
         for (int n = 0; n < numElmt; ++n)
         {
             // All three contributions accumulate into coefficient 1 of
             // element n.
             // add in (1+c)/2 (1+b)/2 component
             output[1 + n * totmodes] +=
                 Blas::Ddot(nquad2, base2.get() + nquad2, 1,
                            &wsp[nquad2 * numElmt + n * nquad2], 1);
  
             // add in (1+c)/2 (1-b)/2 (1+a)/2 component
             output[1 + n * totmodes] +=
                 Blas::Ddot(nquad2, base2.get() + nquad2, 1,
                            &wsp[nquad2 * nmodes1 * numElmt + n * nquad2], 1);
  
             // add in (1+c)/2 (1+b)/2 (1+a)/2 component
             output[1 + n * totmodes] += Blas::Ddot(
                 nquad2, base2.get() + nquad2, 1,
                 &wsp[nquad2 * (nmodes1 + 1) * numElmt + n * nquad2], 1);
         }
     }
 }

References ASSERTL1, Blas::Ddot(), Blas::Dgemm(), Nektar::LibUtilities::StdPyrData::getNumberOfCoefficients(), and Vmath::Vmul().

Referenced by Nektar::Collections::IProductWRTDerivBase_SumFac_Pyr::operator()(), and Nektar::Collections::IProductWRTBase_SumFac_Pyr::operator()().

◆ QuadIProduct()

void Nektar::Collections::QuadIProduct	(	bool	colldir0,
		bool	colldir1,
		int	numElmt,
		int	nquad0,
		int	nquad1,
		int	nmodes0,
		int	nmodes1,
		const Array< OneD, const NekDouble > &	base0,
		const Array< OneD, const NekDouble > &	base1,
		const Array< OneD, const NekDouble > &	jac,
		const Array< OneD, const NekDouble > &	input,
		Array< OneD, NekDouble > &	output,
		Array< OneD, NekDouble > &	wsp
	)

Definition at line 48 of file IProduct.cpp.

 {
     // Inner product for numElmt quadrilateral elements, applied one direction
     // at a time.
     //
     // The input is multiplied entry-by-entry with jac into wsp. If both
     // colldir flags are set, the first numElmt * totmodes entries of that
     // product are copied to output. Otherwise direction 0 and then direction
     // 1 are processed, each by a strided Vcopy (colldir<d> set) or a Dgemm
     // against base<d>. wsp is scratch and is overwritten.
     int totpoints = nquad0 * nquad1;
     int totmodes  = nmodes0 * nmodes1;
  
     Vmath::Vmul(numElmt * totpoints, jac, 1, input, 1, wsp, 1);
  
     if (colldir0 && colldir1)
     {
         Vmath::Vcopy(numElmt * totmodes, wsp.get(), 1, output.get(), 1);
     }
     else
     {
         // Second scratch region, offset past the larger of the two uses of
         // the first region.
         Array<OneD, NekDouble> wsp1 = wsp + max(totpoints, totmodes) * numElmt;
         // Direction 0 for all elements at once: wsp -> wsp1.
         if (colldir0)
         {
             for (int i = 0; i < nquad0; ++i)
             {
                 Vmath::Vcopy(nquad1 * numElmt, &wsp[i], nquad0,
                              &wsp1[i * nquad1 * numElmt], 1);
             }
         }
         else
         {
             Blas::Dgemm('T', 'N', nquad1 * numElmt, nmodes0, nquad0, 1.0,
                         &wsp[0], nquad0, base0.get(), nquad0, 0.0, &wsp1[0],
                         nquad1 * numElmt);
         }
  
         if (numElmt > 1)
         {
  
             // Direction 1 for all elements at once: wsp1 -> wsp, followed
             // by a reordering copy into output.
             if (colldir1)
             {
                 for (int i = 0; i < nquad1; ++i)
                 {
                     Vmath::Vcopy(numElmt * nmodes0, &wsp1[i], nquad1,
                                  &wsp[i * numElmt * nmodes0], 1);
                 }
             }
             else
             {
  
                 Blas::Dgemm('T', 'N', numElmt * nmodes0, nmodes1, nquad1, 1.0,
                             &wsp1[0], nquad1, base1.get(), nquad1, 0.0, &wsp[0],
                             numElmt * nmodes0);
             }
  
             // Scatter the numElmt consecutive values of each mode i to
             // output[i], output[i + totmodes], ...
             for (int i = 0; i < totmodes; ++i)
             {
                 Vmath::Vcopy(numElmt, &wsp[i * numElmt], 1, &output[i],
                              totmodes);
             }
         }
         else
         {
             // Single element: direction 1 writes directly to output, so no
             // reordering copy is needed.
             if (colldir1)
             {
                 for (int i = 0; i < nquad1; ++i)
                 {
                     Vmath::Vcopy(numElmt * nmodes0, &wsp1[i], nquad1,
                                  &output[i * numElmt * nmodes0], 1);
                 }
             }
             else
             {
                 Blas::Dgemm('T', 'N', nmodes0, nmodes1, nquad1, 1.0, &wsp1[0],
                             nquad1, base1.get(), nquad1, 0.0, &output[0],
                             nmodes0);
             }
         }
     }
 }

References Blas::Dgemm(), Vmath::Vcopy(), and Vmath::Vmul().

Referenced by Nektar::Collections::IProductWRTDerivBase_SumFac_Quad::operator()(), and Nektar::Collections::IProductWRTBase_SumFac_Quad::operator()().

◆ SetFixedImpType()

OperatorImpMap Nektar::Collections::SetFixedImpType ( ImplementationType defaultType )

simple Operator Implementation Map generator

Definition at line 124 of file Operator.cpp.

 {
     OperatorImpMap opMap;
  
     for (int i = 0; i < SIZE_OperatorType; ++i)
     {
         opMap[(OperatorType)i] = defaultType;
     }
  
     return opMap;
 }

References SIZE_OperatorType.

◆ TetIProduct()

void Nektar::Collections::TetIProduct	(	bool	sortTopEdge,
		int	numElmt,
		int	nquad0,
		int	nquad1,
		int	nquad2,
		int	nmodes0,
		int	nmodes1,
		int	nmodes2,
		const Array< OneD, const NekDouble > &	base0,
		const Array< OneD, const NekDouble > &	base1,
		const Array< OneD, const NekDouble > &	base2,
		const Array< OneD, const NekDouble > &	jac,
		const Array< OneD, const NekDouble > &	input,
		Array< OneD, NekDouble > &	output,
		Array< OneD, NekDouble > &	wsp
	)

Definition at line 500 of file IProduct.cpp.

 {
     // Sum-factorised inner product over a batch of numElmt tetrahedra.
     // The input is scaled pointwise by jac and then contracted in turn with
     // base0, base1 and base2; each element receives totmodes coefficients in
     // output. wsp is scratch storage that is overwritten.
     // NOTE(review): jac presumably already includes the quadrature weights --
     // confirm against the callers.
     int totmodes = LibUtilities::StdTetData::getNumberOfCoefficients(
         nmodes0, nmodes1, nmodes2);
     int totpoints = nquad0 * nquad1 * nquad2;
     int cnt;
     int mode, mode1;
  
     // wsp[0 .. numElmt * totpoints) = jac * input
     Vmath::Vmul(numElmt * totpoints, jac, 1, input, 1, wsp, 1);
  
     // Second scratch region. The offset skips whichever is larger: the scaled
     // input written above, or the direction-1 result written below, which
     // holds nmodes0 * (2 * nmodes1 - nmodes0 + 1) / 2 blocks (the number of
     // (i, j) pairs with j < nmodes1 - i) of nquad2 * numElmt values each.
     Array<OneD, NekDouble> wsp1 =
         wsp +
         nquad2 * numElmt *
             (max(nquad0 * nquad1, nmodes0 * (2 * nmodes1 - nmodes0 + 1) / 2));
  
     // Perform iproduct  with respect to the  '0' direction
     // wsp is read as an nquad0 x (nquad1 * nquad2 * numElmt) matrix and
     // transposed, so wsp1 has one column of length nquad1 * nquad2 * numElmt
     // per direction-0 mode.
     Blas::Dgemm('T', 'N', nquad1 * nquad2 * numElmt, nmodes0, nquad0, 1.0,
                 wsp.get(), nquad0, base0.get(), nquad0, 0.0, wsp1.get(),
                 nquad1 * nquad2 * numElmt);
  
     // Inner product with respect to the '1' direction
     // For direction-0 mode i only nmodes1 - i columns of base1 are used,
     // starting at column 'mode'; results are packed contiguously into wsp.
     mode = 0;
     for (int i = 0; i < nmodes0; ++i)
     {
         Blas::Dgemm('T', 'N', nquad2 * numElmt, nmodes1 - i, nquad1, 1.0,
                     wsp1.get() + i * nquad1 * nquad2 * numElmt, nquad1,
                     base1.get() + mode * nquad1, nquad1, 0.0,
                     wsp.get() + mode * nquad2 * numElmt, nquad2 * numElmt);
         mode += nmodes1 - i;
     }
  
     // fix for modified basis by splitting top vertex mode
     if (sortTopEdge)
     {
         // base singular vertex and singular edge (1+b)/2
         // ((1+a)/2 components entry into (1+b)/2)
         // Could be made into an mxm if we have specialised base1[1]
         // Per element: the i = 1 block of wsp1 is contracted with the second
         // column of base1 and accumulated (beta = 1.0) into the second packed
         // block of wsp.
         for (int n = 0; n < numElmt; ++n)
         {
             Blas::Dgemv('T', nquad1, nquad2, 1.0,
                         wsp1.get() + numElmt * nquad1 * nquad2 +
                             n * nquad1 * nquad2,
                         nquad1, base1.get() + nquad1, 1, 1.0,
                         wsp.get() + nquad2 * numElmt + n * nquad2, 1);
         }
     }
  
     // Inner product with respect to the '2' direction
     // cnt indexes the packed (i, j) blocks in wsp, mode is the column offset
     // into base2 and mode1 is the coefficient offset within one element.
     // Each product writes nmodes2 - i - j coefficients for every element,
     // with consecutive elements totmodes apart in output.
     mode = mode1 = cnt = 0;
     for (int i = 0; i < nmodes0; ++i)
     {
         for (int j = 0; j < nmodes1 - i; ++j, ++cnt)
         {
             Blas::Dgemm('T', 'N', nmodes2 - i - j, numElmt, nquad2, 1.0,
                         base2.get() + mode * nquad2, nquad2,
                         wsp.get() + cnt * nquad2 * numElmt, nquad2, 0.0,
                         output.get() + mode1, totmodes);
             mode += nmodes2 - i - j;
             mode1 += nmodes2 - i - j;
         }
  
         // increment mode in case order1!=order2
         mode += (nmodes2 - nmodes1) * (nmodes2 - nmodes1 + 1) / 2;
     }
  
     // fix for modified basis for top singular vertex component
     // Already have evaluated (1+c)/2 (1-b)/2 (1-a)/2
     if (sortTopEdge)
     {
         // Both contributions below are added to coefficient 1 of element n;
         // they use the second column of base2 against two different packed
         // blocks of wsp.
         for (int n = 0; n < numElmt; ++n)
         {
             // add in (1+c)/2 (1+b)/2 component
             output[1 + n * totmodes] +=
                 Blas::Ddot(nquad2, base2.get() + nquad2, 1,
                            &wsp[nquad2 * numElmt + n * nquad2], 1);
  
             // add in (1+c)/2 (1-b)/2 (1+a)/2 component
             output[1 + n * totmodes] +=
                 Blas::Ddot(nquad2, base2.get() + nquad2, 1,
                            &wsp[nquad2 * nmodes1 * numElmt + n * nquad2], 1);
         }
     }
 }

References Blas::Ddot(), Blas::Dgemm(), Blas::Dgemv(), Nektar::LibUtilities::StdTetData::getNumberOfCoefficients(), and Vmath::Vmul().

Referenced by Nektar::Collections::IProductWRTDerivBase_SumFac_Tet::operator()(), and Nektar::Collections::IProductWRTBase_SumFac_Tet::operator()().

◆ TriIProduct()

void Nektar::Collections::TriIProduct	(	bool	sortTopVertex,
		int	numElmt,
		int	nquad0,
		int	nquad1,
		int	nmodes0,
		int	nmodes1,
		const Array< OneD, const NekDouble > &	base0,
		const Array< OneD, const NekDouble > &	base1,
		const Array< OneD, const NekDouble > &	jac,
		const Array< OneD, const NekDouble > &	input,
		Array< OneD, NekDouble > &	output,
		Array< OneD, NekDouble > &	wsp
	)

Definition at line 131 of file IProduct.cpp.

 {
     // Sum-factorised inner product over a batch of numElmt triangles.
     // The input is scaled pointwise by jac and then contracted with base0 and
     // base1; each element receives totmodes coefficients in output. wsp is
     // scratch storage that is overwritten.
     // NOTE(review): jac presumably already includes the quadrature weights --
     // confirm against the callers.
     int totmodes =
         LibUtilities::StdTriData::getNumberOfCoefficients(nmodes0, nmodes1);
     int totpoints = nquad0 * nquad1;
  
     // wsp[0 .. numElmt * totpoints) = jac * input
     Vmath::Vmul(numElmt * totpoints, jac, 1, input, 1, wsp, 1);
  
     // Second scratch region, placed after the first
     // max(totpoints, totmodes) * numElmt entries of wsp.
     Array<OneD, NekDouble> wsp1 = wsp + max(totpoints, totmodes) * numElmt;
  
     // Direction-0 contraction: wsp is read as an nquad0 x (nquad1 * numElmt)
     // matrix and transposed, so wsp1 has one column of length
     // nquad1 * numElmt per direction-0 mode.
     Blas::Dgemm('T', 'N', nquad1 * numElmt, nmodes0, nquad0, 1.0, &wsp[0],
                 nquad0, base0.get(), nquad0, 0.0, &wsp1[0], nquad1 * numElmt);
  
     int i, mode;
     // Inner product with respect to 'b' direction
     // For direction-0 mode i only nmodes1 - i columns of base1 are used,
     // starting at column 'mode'. The result is written straight into output
     // at coefficient offset 'mode', consecutive elements totmodes apart.
     for (mode = i = 0; i < nmodes0; ++i)
     {
         Blas::Dgemm('T', 'N', nmodes1 - i, numElmt, nquad1, 1.0,
                     base1.get() + mode * nquad1, nquad1,
                     wsp1.get() + i * nquad1 * numElmt, nquad1, 0.0,
                     &output[mode], totmodes);
  
         mode += nmodes1 - i;
     }
  
     // fix for modified basis by splitting top vertex mode
     if (sortTopVertex)
     {
         // The i = 1 block of wsp1 is contracted with the second column of
         // base1 and accumulated (beta = 1.0) into coefficient 1 of every
         // element.
         Blas::Dgemv('T', nquad1, numElmt, 1.0, wsp1.get() + nquad1 * numElmt,
                     nquad1, base1.get() + nquad1, 1, 1.0, &output[1], totmodes);
     }
 }

References Blas::Dgemm(), Blas::Dgemv(), Nektar::LibUtilities::StdTriData::getNumberOfCoefficients(), and Vmath::Vmul().

Referenced by Nektar::Collections::IProductWRTDerivBase_SumFac_Tri::operator()(), and Nektar::Collections::IProductWRTBase_SumFac_Tri::operator()().

Variable Documentation

◆ GeomDataNull

CoalescedGeomDataSharedPtr Nektar::Collections::GeomDataNull

static

Definition at line 94 of file CoalescedGeomData.h.

◆ ImplementationTypeMap

const char* const Nektar::Collections::ImplementationTypeMap[]

Initial value:

= {"NoImplementationType",
                                             "NoCollection",
                                             "IterPerExp",
                                             "StdMat",
                                             "SumFac",
                                             "MatrixFree"}

Definition at line 94 of file Operator.h.

Referenced by Nektar::Collections::CollectionOptimisation::CollectionOptimisation(), operator<<(), Nektar::Collections::CollectionOptimisation::ReadCollOps(), and Nektar::Collections::CollectionOptimisation::UpdateOptFile().

◆ ImplementationTypeMap1

const char* const Nektar::Collections::ImplementationTypeMap1[]

Initial value:

= {
    "NoImplementationType",
    "IterLocExp", 
    "IterStdExp", 
    "StdMat    ",
    "SumFac    ",
    "MatFree   " 
}

Definition at line 101 of file Operator.h.

Referenced by Nektar::Collections::CollectionOptimisation::SetWithTimings().

◆ OperatorTypeMap

const char* const Nektar::Collections::OperatorTypeMap[]

Initial value:

= {"BwdTrans", "Helmholtz",
                                       "IProductWRTBase",
                                       "IProductWRTDerivBase", "PhysDeriv"}

Definition at line 76 of file Operator.h.

Referenced by Nektar::Collections::CollectionOptimisation::CollectionOptimisation(), Nektar::Collections::Collection::Initialise(), operator<<(), Nektar::Collections::CollectionOptimisation::ReadCollOps(), and Nektar::Collections::CollectionOptimisation::UpdateOptFile().

◆ OperatorTypeMap1

const char* const Nektar::Collections::OperatorTypeMap1[]

Initial value:

= {"BwdTrans", "Helmholtz", "IPWrtBase",

"IPWrtDBase", "PhysDeriv "}

Definition at line 80 of file Operator.h.

Referenced by Nektar::Collections::CollectionOptimisation::SetWithTimings().

Classes

Typedefs

Enumerations

Functions

Variables

Typedef Documentation

◆ CoalescedGeomDataSharedPtr

◆ CollectionVector

◆ CollectionVectorSharedPtr

◆ ExpansionIsNodal

◆ OperatorFactory

◆ OperatorImpMap

◆ OperatorKey

◆ OperatorSharedPtr

◆ vec_t

◆ VecVec_t

Enumeration Type Documentation

◆ GeomData

◆ ImplementationType

◆ OperatorType

Function Documentation

◆ GetOperatorFactory()

◆ HexIProduct()

◆ operator<()

◆ operator<<()

◆ PrismIProduct()

◆ PyrIProduct()

◆ QuadIProduct()

◆ SetFixedImpType()

◆ TetIProduct()

◆ TriIProduct()

Variable Documentation

◆ GeomDataNull

◆ ImplementationTypeMap

◆ ImplementationTypeMap1

◆ OperatorTypeMap

◆ OperatorTypeMap1