Classes
class	BwdTrans_IterPerExp
	Backward transform operator using default StdRegions operator. More...

class	BwdTrans_MatrixFree
	Backward transform operator using matrix free operators. More...

class	BwdTrans_NoCollection
	Backward transform operator using LocalRegions implementation. More...

class	BwdTrans_StdMat
	Backward transform operator using standard matrix approach. More...

class	BwdTrans_SumFac_Hex
	Backward transform operator using sum-factorisation (Hex) More...

class	BwdTrans_SumFac_Prism
	Backward transform operator using sum-factorisation (Prism) More...

class	BwdTrans_SumFac_Pyr
	Backward transform operator using sum-factorisation (Pyr) More...

class	BwdTrans_SumFac_Quad
	Backward transform operator using sum-factorisation (Quad) More...

class	BwdTrans_SumFac_Seg
	Backward transform operator using sum-factorisation (Segment) More...

class	BwdTrans_SumFac_Tet
	Backward transform operator using sum-factorisation (Tet) More...

class	BwdTrans_SumFac_Tri
	Backward transform operator using sum-factorisation (Tri) More...

class	CoalescedGeomData

class	Collection
	Collection. More...

class	CollectionOptimisation

class	Helmholtz_IterPerExp
	Helmholtz operator using LocalRegions implementation. More...

class	Helmholtz_MatrixFree
	Helmholtz operator using matrix free operators. More...

class	Helmholtz_NoCollection
	Helmholtz operator using LocalRegions implementation. More...

class	IProductWRTBase_IterPerExp
	Inner product operator using element-wise operation. More...

class	IProductWRTBase_MatrixFree
	Inner product operator using matrix free operators. More...

class	IProductWRTBase_NoCollection
	Inner product operator using original MultiRegions implementation. More...

class	IProductWRTBase_StdMat
	Inner product operator using standard matrix approach. More...

class	IProductWRTBase_SumFac_Hex
	Inner product operator using sum-factorisation (Hex) More...

class	IProductWRTBase_SumFac_Prism
	Inner product operator using sum-factorisation (Prism) More...

class	IProductWRTBase_SumFac_Pyr
	Inner product operator using sum-factorisation (Pyr) More...

class	IProductWRTBase_SumFac_Quad
	Inner product operator using sum-factorisation (Quad) More...

class	IProductWRTBase_SumFac_Seg
	Inner product operator using sum-factorisation (Segment) More...

class	IProductWRTBase_SumFac_Tet
	Inner product operator using sum-factorisation (Tet) More...

class	IProductWRTBase_SumFac_Tri
	Inner product operator using sum-factorisation (Tri) More...

class	IProductWRTDerivBase_IterPerExp
	Inner product WRT deriv base operator using element-wise operation. More...

class	IProductWRTDerivBase_MatrixFree
	Inner product WRT deriv base operator using matrix free operators. More...

class	IProductWRTDerivBase_NoCollection
	Inner product WRT deriv base operator using LocalRegions implementation. More...

class	IProductWRTDerivBase_StdMat
	Inner product WRT deriv base operator using standard matrix approach. More...

class	IProductWRTDerivBase_SumFac_Hex
	Inner product WRT deriv base operator using sum-factorisation (Hex) More...

class	IProductWRTDerivBase_SumFac_Prism
	Inner product WRT deriv base operator using sum-factorisation (Prism) More...

class	IProductWRTDerivBase_SumFac_Pyr
	Inner product WRT deriv base operator using sum-factorisation (Pyr) More...

class	IProductWRTDerivBase_SumFac_Quad
	Inner product WRT deriv base operator using sum-factorisation (Quad) More...

class	IProductWRTDerivBase_SumFac_Seg
	Inner product WRT deriv base operator using sum-factorisation (Segment) More...

class	IProductWRTDerivBase_SumFac_Tet
	Inner product WRT deriv base operator using sum-factorisation (Tet) More...

class	IProductWRTDerivBase_SumFac_Tri
	Inner product WRT deriv base operator using sum-factorisation (Tri) More...

class	MatrixFreeBase

class	MatrixFreeMultiInOneOut

class	MatrixFreeOneInMultiOut

class	MatrixFreeOneInOneOut

class	Operator
	Base class for operators on a collection of elements. More...

class	OpImpTimingKey

class	PhysDeriv_IterPerExp
	Phys deriv operator using element-wise operation. More...

class	PhysDeriv_MatrixFree
	Phys deriv operator using matrix free operators. More...

class	PhysDeriv_NoCollection
	Phys deriv operator using original LocalRegions implementation. More...

class	PhysDeriv_StdMat
	Phys deriv operator using standard matrix approach. More...

class	PhysDeriv_SumFac_Hex
	Phys deriv operator using sum-factorisation (Hex) More...

class	PhysDeriv_SumFac_Prism
	Phys deriv operator using sum-factorisation (Prism) More...

class	PhysDeriv_SumFac_Pyr
	Phys deriv operator using sum-factorisation (Pyramid) More...

class	PhysDeriv_SumFac_Quad
	Phys deriv operator using sum-factorisation (Quad) More...

class	PhysDeriv_SumFac_Seg
	Phys deriv operator using sum-factorisation (Segment) More...

class	PhysDeriv_SumFac_Tet
	Phys deriv operator using sum-factorisation (Tet) More...

class	PhysDeriv_SumFac_Tri
	Phys deriv operator using sum-factorisation (Tri) More...

Typedefs
using	vec_t = simd< NekDouble >

typedef std::vector< vec_t, tinysimd::allocator< vec_t > >	VecVec_t

typedef std::shared_ptr< CoalescedGeomData >	CoalescedGeomDataSharedPtr

typedef std::vector< Collection >	CollectionVector

typedef std::shared_ptr< CollectionVector >	CollectionVectorSharedPtr

typedef bool	ExpansionIsNodal

typedef std::map< OperatorType, ImplementationType >	OperatorImpMap

typedef std::shared_ptr< Operator >	OperatorSharedPtr
	Shared pointer to an Operator object. More...

typedef std::tuple< LibUtilities::ShapeType, OperatorType, ImplementationType, ExpansionIsNodal >	OperatorKey
	Key for describing an Operator. More...

typedef Nektar::LibUtilities::NekFactory< OperatorKey, Operator, std::vector< StdRegions::StdExpansionSharedPtr >, CoalescedGeomDataSharedPtr, StdRegions::FactorMap >	OperatorFactory
	Operator factory definition. More...

Enumerations
enum	GeomData { eJac , eJacWithStdWeights , eDerivFactors }

enum	OperatorType { eBwdTrans , eHelmholtz , eIProductWRTBase , eIProductWRTDerivBase , ePhysDeriv , SIZE_OperatorType }

enum	ImplementationType { eNoImpType , eNoCollection , eIterPerExp , eStdMat , eSumFac , eMatrixFree , SIZE_ImplementationType }

Functions
void	QuadIProduct (bool colldir0, bool colldir1, int numElmt, int nquad0, int nquad1, int nmodes0, int nmodes1, const Array< OneD, const NekDouble > &base0, const Array< OneD, const NekDouble > &base1, const Array< OneD, const NekDouble > &jac, const Array< OneD, const NekDouble > &input, Array< OneD, NekDouble > &output, Array< OneD, NekDouble > &wsp)

void	TriIProduct (bool sortTopVertex, int numElmt, int nquad0, int nquad1, int nmodes0, int nmodes1, const Array< OneD, const NekDouble > &base0, const Array< OneD, const NekDouble > &base1, const Array< OneD, const NekDouble > &jac, const Array< OneD, const NekDouble > &input, Array< OneD, NekDouble > &output, Array< OneD, NekDouble > &wsp)

void	HexIProduct (bool colldir0, bool colldir1, bool colldir2, int numElmt, int nquad0, int nquad1, int nquad2, int nmodes0, int nmodes1, int nmodes2, const Array< OneD, const NekDouble > &base0, const Array< OneD, const NekDouble > &base1, const Array< OneD, const NekDouble > &base2, const Array< OneD, const NekDouble > &jac, const Array< OneD, const NekDouble > &input, Array< OneD, NekDouble > &output, Array< OneD, NekDouble > &wsp)

void	PrismIProduct (bool sortTopVert, int numElmt, int nquad0, int nquad1, int nquad2, int nmodes0, int nmodes1, int nmodes2, const Array< OneD, const NekDouble > &base0, const Array< OneD, const NekDouble > &base1, const Array< OneD, const NekDouble > &base2, const Array< OneD, const NekDouble > &jac, const Array< OneD, const NekDouble > &input, Array< OneD, NekDouble > &output, Array< OneD, NekDouble > &wsp)

void	PyrIProduct (bool sortTopVert, int numElmt, int nquad0, int nquad1, int nquad2, int nmodes0, int nmodes1, int nmodes2, const Array< OneD, const NekDouble > &base0, const Array< OneD, const NekDouble > &base1, const Array< OneD, const NekDouble > &base2, const Array< OneD, const NekDouble > &jac, const Array< OneD, const NekDouble > &input, Array< OneD, NekDouble > &output, Array< OneD, NekDouble > &wsp)

void	TetIProduct (bool sortTopEdge, int numElmt, int nquad0, int nquad1, int nquad2, int nmodes0, int nmodes1, int nmodes2, const Array< OneD, const NekDouble > &base0, const Array< OneD, const NekDouble > &base1, const Array< OneD, const NekDouble > &base2, const Array< OneD, const NekDouble > &jac, const Array< OneD, const NekDouble > &input, Array< OneD, NekDouble > &output, Array< OneD, NekDouble > &wsp)

bool	operator< (OperatorKey const &p1, OperatorKey const &p2)
	Less-than comparison operator for OperatorKey objects. More...

std::ostream &	operator<< (std::ostream &os, OperatorKey const &p)
	Stream output operator for OperatorKey objects. More...

OperatorFactory &	GetOperatorFactory ()
	Returns the singleton Operator factory object. More...

OperatorImpMap	SetFixedImpType (ImplementationType defaultType)
	Simple operator implementation map generator. More...

Variables
static CoalescedGeomDataSharedPtr	GeomDataNull

const char *const	OperatorTypeMap []

const char *const	OperatorTypeMap1 []

const char *const	ImplementationTypeMap []

const char *const	ImplementationTypeMap1 []

Typedef Documentation

◆ CoalescedGeomDataSharedPtr

typedef std::shared_ptr< CoalescedGeomData > Nektar::Collections::CoalescedGeomDataSharedPtr

Definition at line 92 of file CoalescedGeomData.h.

◆ CollectionVector

typedef std::vector<Collection> Nektar::Collections::CollectionVector

Definition at line 110 of file Collection.h.

◆ CollectionVectorSharedPtr

typedef std::shared_ptr<CollectionVector> Nektar::Collections::CollectionVectorSharedPtr

Definition at line 111 of file Collection.h.

◆ ExpansionIsNodal

typedef bool Nektar::Collections::ExpansionIsNodal

Definition at line 110 of file Operator.h.

◆ OperatorFactory

typedef Nektar::LibUtilities::NekFactory< OperatorKey, Operator, std::vector<StdRegions::StdExpansionSharedPtr>, CoalescedGeomDataSharedPtr, StdRegions::FactorMap> Nektar::Collections::OperatorFactory

Operator factory definition.

Definition at line 189 of file Operator.h.

◆ OperatorImpMap

typedef std::map<OperatorType, ImplementationType> Nektar::Collections::OperatorImpMap

Definition at line 112 of file Operator.h.

◆ OperatorKey

typedef std::tuple<LibUtilities::ShapeType, OperatorType, ImplementationType, ExpansionIsNodal> Nektar::Collections::OperatorKey

Key for describing an Operator.

Definition at line 177 of file Operator.h.

◆ OperatorSharedPtr

typedef std::shared_ptr<Operator> Nektar::Collections::OperatorSharedPtr

Shared pointer to an Operator object.

Definition at line 172 of file Operator.h.

◆ vec_t

using Nektar::Collections::vec_t = typedef simd<NekDouble>

Definition at line 49 of file CoalescedGeomData.h.

◆ VecVec_t

typedef std::vector<vec_t, tinysimd::allocator<vec_t> > Nektar::Collections::VecVec_t

Definition at line 50 of file CoalescedGeomData.h.

Enumeration Type Documentation

◆ GeomData

enum Nektar::Collections::GeomData

Enumerator
eJac
eJacWithStdWeights
eDerivFactors

Definition at line 52 of file CoalescedGeomData.h.

{
    // Enumerators of Nektar::Collections::GeomData (CoalescedGeomData.h).
    // NOTE(review): presumably these select which geometric quantity is
    // being referred to (Jacobian, Jacobian with quadrature weights,
    // derivative factors) -- confirm against CoalescedGeomData.
    eJac,
    eJacWithStdWeights,
    eDerivFactors
};

◆ ImplementationType

enum Nektar::Collections::ImplementationType

Enumerator
eNoImpType
eNoCollection
eIterPerExp
eStdMat
eSumFac
eMatrixFree
SIZE_ImplementationType

Definition at line 83 of file Operator.h.

{
    // Enumerators of Nektar::Collections::ImplementationType (Operator.h).
    // The names eNoCollection, eIterPerExp, eStdMat, eSumFac and eMatrixFree
    // mirror the suffixes of the operator classes in this namespace
    // (e.g. BwdTrans_StdMat, BwdTrans_SumFac_Hex).
    eNoImpType,
    eNoCollection,
    eIterPerExp,
    eStdMat,
    eSumFac,
    eMatrixFree,
    // NOTE(review): listed last; presumably the number of implementation
    // types, by analogy with SIZE_OperatorType -- confirm.
    SIZE_ImplementationType
};

◆ OperatorType

enum Nektar::Collections::OperatorType

Enumerator
eBwdTrans
eHelmholtz
eIProductWRTBase
eIProductWRTDerivBase
ePhysDeriv
SIZE_OperatorType

Definition at line 66 of file Operator.h.

{
    // Enumerators of Nektar::Collections::OperatorType (Operator.h). The
    // names mirror the prefixes of the operator classes in this namespace
    // (BwdTrans_*, Helmholtz_*, IProductWRTBase_*, IProductWRTDerivBase_*,
    // PhysDeriv_*).
    eBwdTrans,
    eHelmholtz,
    eIProductWRTBase,
    eIProductWRTDerivBase,
    ePhysDeriv,
    // Must remain the final enumerator: SetFixedImpType() uses it as the
    // exclusive upper bound when iterating over every operator type.
    SIZE_OperatorType
};

Function Documentation

◆ GetOperatorFactory()

OperatorFactory & Nektar::Collections::GetOperatorFactory ( )

Returns the singleton Operator factory object.

Definition at line 117 of file Operator.cpp.

{
    // Function-local static: the factory is constructed on the first call
    // and the same object is handed back to every caller afterwards.
    static OperatorFactory factory;
    return factory;
}

Referenced by Nektar::Collections::BwdTrans_MatrixFree::BwdTrans_MatrixFree(), Nektar::Collections::Helmholtz_MatrixFree::Helmholtz_MatrixFree(), Nektar::Collections::Collection::Initialise(), Nektar::Collections::IProductWRTBase_MatrixFree::IProductWRTBase_MatrixFree(), Nektar::Collections::IProductWRTDerivBase_MatrixFree::IProductWRTDerivBase_MatrixFree(), Nektar::Collections::PhysDeriv_MatrixFree::PhysDeriv_MatrixFree(), and Nektar::Collections::CollectionOptimisation::SetWithTimings().

◆ HexIProduct()

void Nektar::Collections::HexIProduct	(	bool	colldir0,
		bool	colldir1,
		bool	colldir2,
		int	numElmt,
		int	nquad0,
		int	nquad1,
		int	nquad2,
		int	nmodes0,
		int	nmodes1,
		int	nmodes2,
		const Array< OneD, const NekDouble > &	base0,
		const Array< OneD, const NekDouble > &	base1,
		const Array< OneD, const NekDouble > &	base2,
		const Array< OneD, const NekDouble > &	jac,
		const Array< OneD, const NekDouble > &	input,
		Array< OneD, NekDouble > &	output,
		Array< OneD, NekDouble > &	wsp
	)

Definition at line 173 of file IProduct.cpp.

{
    // Inner product for a collection of numElmt hexahedral elements:
    // input is scaled point-wise by jac and then contracted direction by
    // direction against base0, base1 and base2. A colldirN flag set to true
    // replaces the contraction in direction N by a strided copy.
    // wsp is scratch storage supplied by the caller.
    int totmodes  = nmodes0 * nmodes1 * nmodes2;
    int totpoints = nquad0 * nquad1 * nquad2;

    if (colldir0 && colldir1 && colldir2)
    {
        // All three directions are flagged: only the scaling by jac is
        // applied, written straight into output.

        Vmath::Vmul(numElmt * totpoints, jac, 1, input, 1, output, 1);
    }
    else
    {
        // Scale the input by jac into the first part of the workspace.
        Vmath::Vmul(numElmt * totpoints, jac, 1, input, 1, wsp, 1);

        // Assign second half of workspace for 2nd DGEMM operation.
        Array<OneD, NekDouble> wsp1 = wsp + totpoints * numElmt;

        // not sure what criterion we should use to swap around these
        // strategies
        // NOTE(review): the "|| 1" makes this condition always true, so the
        // element-by-element strategy below is always taken and the else
        // branch (batched over all elements) is currently unreachable.
        if (numElmt < nmodes0 || 1)
        {
            // Third scratch region, placed after one element's worth of
            // direction-0 results.
            Array<OneD, NekDouble> wsp2 = wsp1 + nmodes0 * nquad1 * nquad2;

            // loop over elements
            for (int n = 0; n < numElmt; ++n)
            {
                // Direction 0: element n of wsp -> wsp1.
                if (colldir0)
                {

                    for (int i = 0; i < nmodes0; ++i)
                    {
                        Vmath::Vcopy(nquad1 * nquad2, &wsp[n * totpoints] + i,
                                     nquad0, wsp1.get() + nquad1 * nquad2 * i,
                                     1);
                    }
                }
                else
                {
                    Blas::Dgemm('T', 'N', nquad1 * nquad2, nmodes0, nquad0, 1.0,
                                &wsp[n * totpoints], nquad0, base0.get(),
                                nquad0, 0.0, wsp1.get(), nquad1 * nquad2);
                }

                // Direction 1: wsp1 -> wsp2.
                if (colldir1)
                {
                    // reshuffle data for next operation.
                    for (int i = 0; i < nmodes1; ++i)
                    {
                        Vmath::Vcopy(nquad2 * nmodes0, wsp1.get() + i, nquad1,
                                     wsp2.get() + nquad2 * nmodes0 * i, 1);
                    }
                }
                else
                {
                    Blas::Dgemm('T', 'N', nquad2 * nmodes0, nmodes1, nquad1,
                                1.0, wsp1.get(), nquad1, base1.get(), nquad1,
                                0.0, wsp2.get(), nquad2 * nmodes0);
                }

                // Direction 2: wsp2 -> the totmodes coefficients of element n
                // in output.
                if (colldir2)
                {
                    // reshuffle data for next operation.
                    for (int i = 0; i < nmodes2; ++i)
                    {
                        Vmath::Vcopy(
                            nmodes0 * nmodes1, wsp2.get() + i, nquad2,
                            &output[n * totmodes] + nmodes0 * nmodes1 * i, 1);
                    }
                }
                else
                {
                    Blas::Dgemm('T', 'N', nmodes0 * nmodes1, nmodes2, nquad2,
                                1.0, wsp2.get(), nquad2, base2.get(), nquad2,
                                0.0, &output[n * totmodes], nmodes0 * nmodes1);
                }
            }
        }
        else
        {
            // Batched strategy: each direction is processed for all elements
            // in one call (unreachable while the condition above ends in
            // "|| 1").
            Array<OneD, NekDouble> wsp2 =
                wsp1 + numElmt * (max(totpoints, totmodes));

            if (colldir0)
            {
                for (int i = 0; i < nquad0; ++i)
                {
                    Vmath::Vcopy(nquad1 * nquad2 * numElmt, &wsp[i], nquad0,
                                 &wsp1[i * nquad1 * nquad2 * numElmt], 1);
                }
            }
            else
            {
                // large dgemm but copy at end.
                Blas::Dgemm('T', 'N', nquad1 * nquad2 * numElmt, nmodes0,
                            nquad0, 1.0, &wsp[0], nquad0, base0.get(), nquad0,
                            0.0, &wsp1[0], nquad1 * nquad2 * numElmt);
            }

            if (colldir1)
            {
                for (int i = 0; i < nquad1; ++i)
                {
                    Vmath::Vcopy(nquad2 * numElmt * nmodes0, &wsp1[i], nquad1,
                                 &wsp2[i * nquad2 * numElmt * nmodes0], 1);
                }
            }
            else
            {
                Blas::Dgemm('T', 'N', nquad2 * numElmt * nmodes0, nmodes1,
                            nquad1, 1.0, &wsp1[0], nquad1, base1.get(), nquad1,
                            0.0, &wsp2[0], nquad2 * numElmt * nmodes0);
            }

            if (numElmt > 1)
            {
                if (colldir2)
                {
                    // NOTE(review): this writes to output, but the loop after
                    // this if/else then overwrites output from wsp1, which
                    // this branch does not fill -- confirm intent before
                    // re-enabling the batched strategy.
                    for (int i = 0; i < nquad2; ++i)
                    {
                        Vmath::Vcopy(nmodes0 * nmodes1, &wsp2[i], nquad2,
                                     &output[i * nmodes0 * nmodes1], 1);
                    }
                }
                else
                {
                    Blas::Dgemm('T', 'N', numElmt * nmodes0 * nmodes1, nmodes2,
                                nquad2, 1.0, &wsp2[0], nquad2, base2.get(),
                                nquad2, 0.0, &wsp1[0],
                                numElmt * nmodes0 * nmodes1);
                }

                // Scatter wsp1 into output: for each mode i, numElmt
                // consecutive values go to output[i], output[i + totmodes],
                // ...
                for (int i = 0; i < totmodes; ++i)
                {
                    Vmath::Vcopy(numElmt, &wsp1[i * numElmt], 1, &output[i],
                                 totmodes);
                }
            }
            else
            {
                // Single element: the last direction writes directly into
                // output, no scatter step.
                if (colldir2)
                {
                    for (int i = 0; i < nquad2; ++i)
                    {
                        Vmath::Vcopy(nmodes0 * nmodes1, &wsp2[i], nquad2,
                                     &output[i * nmodes0 * nmodes1], 1);
                    }
                }
                else
                {
                    Blas::Dgemm('T', 'N', numElmt * nmodes0 * nmodes1, nmodes2,
                                nquad2, 1.0, &wsp2[0], nquad2, base2.get(),
                                nquad2, 0.0, &output[0],
                                numElmt * nmodes0 * nmodes1);
                }
            }
        }
    }
}

References Blas::Dgemm(), Vmath::Vcopy(), and Vmath::Vmul().

Referenced by Nektar::Collections::IProductWRTDerivBase_SumFac_Hex::operator()(), and Nektar::Collections::IProductWRTBase_SumFac_Hex::operator()().

◆ operator<()

bool Nektar::Collections::operator<	(	OperatorKey const &	p1,
		OperatorKey const &	p2
	)

Less-than comparison operator for OperatorKey objects.

Definition at line 56 of file Operator.cpp.

{
    // Lexicographic ordering over the four key components: the first
    // component on which the two keys differ decides the result.
    if (std::get<0>(p1) != std::get<0>(p2))
    {
        return std::get<0>(p1) < std::get<0>(p2);
    }

    if (std::get<1>(p1) != std::get<1>(p2))
    {
        return std::get<1>(p1) < std::get<1>(p2);
    }

    if (std::get<2>(p1) != std::get<2>(p2))
    {
        return std::get<2>(p1) < std::get<2>(p2);
    }

    // Last component; keys that are equal throughout compare as not-less.
    return std::get<3>(p1) < std::get<3>(p2);
}

◆ operator<<()

std::ostream & Nektar::Collections::operator<<	(	std::ostream &	os,
		OperatorKey const &	p
	)

Stream output operator for OperatorKey objects.

Definition at line 98 of file Operator.cpp.

{
    // The last key component is the ExpansionIsNodal flag; it is printed as
    // a word rather than as a boolean.
    const char *expansionLabel = std::get<3>(p) ? "Nodal" : "Modal";

    // Comma-separated: shape, operator type, implementation type, expansion.
    os << LibUtilities::ShapeTypeMap[std::get<0>(p)] << ", ";
    os << OperatorTypeMap[std::get<1>(p)] << ", ";
    os << ImplementationTypeMap[std::get<2>(p)] << ", ";
    os << expansionLabel;

    return os;
}

References ImplementationTypeMap and OperatorTypeMap.

◆ PrismIProduct()

void Nektar::Collections::PrismIProduct	(	bool	sortTopVert,
		int	numElmt,
		int	nquad0,
		int	nquad1,
		int	nquad2,
		int	nmodes0,
		int	nmodes1,
		int	nmodes2,
		const Array< OneD, const NekDouble > &	base0,
		const Array< OneD, const NekDouble > &	base1,
		const Array< OneD, const NekDouble > &	base2,
		const Array< OneD, const NekDouble > &	jac,
		const Array< OneD, const NekDouble > &	input,
		Array< OneD, NekDouble > &	output,
		Array< OneD, NekDouble > &	wsp
	)

Definition at line 342 of file IProduct.cpp.

{
    // Inner product for a collection of numElmt prismatic elements: input is
    // scaled point-wise by jac, then contracted against base0 and base1 for
    // all elements at once, and finally against base2 one (i, j) mode pair
    // at a time. wsp is scratch storage supplied by the caller.
    int totmodes = LibUtilities::StdPrismData::getNumberOfCoefficients(
        nmodes0, nmodes1, nmodes2);
    int totpoints = nquad0 * nquad1 * nquad2;
    int cnt;
    int mode, mode1;

    // Scale the input by jac into the start of the workspace.
    Vmath::Vmul(numElmt * totpoints, jac, 1, input, 1, wsp, 1);

    // Second scratch region, placed past the larger of the point-space and
    // mode-space footprints used in the first region.
    Array<OneD, NekDouble> wsp1 =
        wsp + numElmt * nquad2 * (max(nquad0 * nquad1, nmodes0 * nmodes1));

    // Perform iproduct  with respect to the  '0' direction
    Blas::Dgemm('T', 'N', nquad1 * nquad2 * numElmt, nmodes0, nquad0, 1.0,
                wsp.get(), nquad0, base0.get(), nquad0, 0.0, wsp1.get(),
                nquad1 * nquad2 * numElmt);

    // Perform iproduct  with respect to the  '1' direction
    Blas::Dgemm('T', 'N', nquad2 * numElmt * nmodes0, nmodes1, nquad1, 1.0,
                wsp1.get(), nquad1, base1.get(), nquad1, 0.0, wsp.get(),
                nquad2 * numElmt * nmodes0);

    // Inner product with respect to the '2' direction (not sure if it would
    // be better to swap loops?)
    // mode  : offset (in modes) into base2, advanced once per i.
    // mode1 : offset into output, advanced once per (i, j) pair.
    // Each (i, j) pair contributes nmodes2 - i coefficients per element.
    mode = mode1 = cnt = 0;
    for (int i = 0; i < nmodes0; ++i)
    {
        cnt = i * nquad2 * numElmt;
        for (int j = 0; j < nmodes1; ++j)
        {
            Blas::Dgemm('T', 'N', nmodes2 - i, numElmt, nquad2, 1.0,
                        base2.get() + mode * nquad2, nquad2,
                        wsp.get() + j * nquad2 * numElmt * nmodes0 + cnt,
                        nquad2, 0.0, output.get() + mode1, totmodes);
            mode1 += nmodes2 - i;
        }
        mode += nmodes2 - i;
    }

    // fix for modified basis by splitting top vertex mode
    // NOTE(review): the parameter list shown for this function names the
    // flag sortTopVert while this body tests sortTopVertex -- presumably the
    // declaration and the definition use different parameter names; confirm.
    if (sortTopVertex)
    {
        // top singular vertex
        // ((1+a)/2 components entry into (1+c)/2)
        // Could be made into an mxv if we have specialised base1[1]
        // beta = 1.0 here, so each Dgemv accumulates into output rather than
        // overwriting it.
        for (int j = 0; j < nmodes1; ++j)
        {
            Blas::Dgemv('T', nquad2, numElmt, 1.0,
                        wsp.get() + j * nquad2 * numElmt * nmodes0 +
                            nquad2 * numElmt,
                        nquad2, base2.get() + nquad2, 1, 1.0,
                        &output[j * nmodes2 + 1], totmodes);
        }
    }
}

References Blas::Dgemm(), Blas::Dgemv(), Nektar::LibUtilities::StdPrismData::getNumberOfCoefficients(), and Vmath::Vmul().

Referenced by Nektar::Collections::IProductWRTDerivBase_SumFac_Prism::operator()(), and Nektar::Collections::IProductWRTBase_SumFac_Prism::operator()().

◆ PyrIProduct()

void Nektar::Collections::PyrIProduct	(	bool	sortTopVert,
		int	numElmt,
		int	nquad0,
		int	nquad1,
		int	nquad2,
		int	nmodes0,
		int	nmodes1,
		int	nmodes2,
		const Array< OneD, const NekDouble > &	base0,
		const Array< OneD, const NekDouble > &	base1,
		const Array< OneD, const NekDouble > &	base2,
		const Array< OneD, const NekDouble > &	jac,
		const Array< OneD, const NekDouble > &	input,
		Array< OneD, NekDouble > &	output,
		Array< OneD, NekDouble > &	wsp
	)

Definition at line 409 of file IProduct.cpp.

{
    // Inner product for a collection of numElmt pyramidic elements: input is
    // scaled point-wise by jac, contracted against base0 for all elements at
    // once, against base1 once per direction-0 mode, and against base2 once
    // per (i, j) mode pair. wsp is scratch storage supplied by the caller.
    int totmodes = LibUtilities::StdPyrData::getNumberOfCoefficients(
        nmodes0, nmodes1, nmodes2);
    int totpoints = nquad0 * nquad1 * nquad2;
    int cnt;
    int mode, mode1;

    // The workspace must hold the first region (up to the wsp1 offset below)
    // plus the direction-0 result stored in wsp1.
    ASSERTL1(wsp.size() >=
                 numElmt * (nquad1 * nquad2 * nmodes0 +
                            nquad2 * max(nquad0 * nquad1, nmodes0 * nmodes1)),
             "Insufficient workspace size");

    // Scale the input by jac into the start of the workspace.
    Vmath::Vmul(numElmt * totpoints, jac, 1, input, 1, wsp, 1);

    Array<OneD, NekDouble> wsp1 =
        wsp + numElmt * nquad2 * (max(nquad0 * nquad1, nmodes0 * nmodes1));

    // Perform iproduct  with respect to the  '0' direction
    Blas::Dgemm('T', 'N', nquad1 * nquad2 * numElmt, nmodes0, nquad0, 1.0,
                wsp.get(), nquad0, base0.get(), nquad0, 0.0, wsp1.get(),
                nquad1 * nquad2 * numElmt);

    // Inner product with respect to the '1' direction
    // One Dgemm per direction-0 mode i; results are packed back into wsp in
    // blocks of nmodes1 (mode tracks the block offset).
    mode = 0;
    for (int i = 0; i < nmodes0; ++i)
    {
        Blas::Dgemm('T', 'N', nquad2 * numElmt, nmodes1, nquad1, 1.0,
                    wsp1.get() + i * nquad1 * nquad2 * numElmt, nquad1,
                    base1.get(), nquad1, 0.0,
                    wsp.get() + mode * nquad2 * numElmt, nquad2 * numElmt);
        mode += nmodes1;
    }

    // Inner product with respect to the '2' direction
    // mode  : offset (in modes) into base2.
    // mode1 : offset into output.
    // cnt   : running (i, j) pair index into wsp.
    // Each (i, j) pair contributes nmodes2 - max(i, j) coefficients.
    mode = mode1 = cnt = 0;
    for (int i = 0; i < nmodes0; ++i)
    {
        for (int j = 0; j < nmodes1; ++j, ++cnt)
        {
            int ijmax = max(i, j);
            Blas::Dgemm('T', 'N', nmodes2 - ijmax, numElmt, nquad2, 1.0,
                        base2.get() + mode * nquad2, nquad2,
                        wsp.get() + cnt * nquad2 * numElmt, nquad2, 0.0,
                        output.get() + mode1, totmodes);
            mode += nmodes2 - ijmax;
            mode1 += nmodes2 - ijmax;
        }

        // increment mode in case order1!=order2
        // (only the base2 offset advances here; nothing is written to
        // output for these j values)
        for (int j = nmodes1; j < nmodes2; ++j)
        {
            int ijmax = max(i, j);
            mode += nmodes2 - ijmax;
        }
    }

    // fix for modified basis for top singular vertex component
    // Already have evaluated (1+c)/2 (1-b)/2 (1-a)/2
    // NOTE(review): the parameter list shown for this function names the
    // flag sortTopVert while this body tests sortTopVertex -- presumably the
    // declaration and the definition use different parameter names; confirm.
    if (sortTopVertex)
    {
        // All three contributions below accumulate into coefficient 1 of
        // element n.
        for (int n = 0; n < numElmt; ++n)
        {
            // add in (1+c)/2 (1+b)/2 component
            output[1 + n * totmodes] +=
                Blas::Ddot(nquad2, base2.get() + nquad2, 1,
                           &wsp[nquad2 * numElmt + n * nquad2], 1);

            // add in (1+c)/2 (1-b)/2 (1+a)/2 component
            output[1 + n * totmodes] +=
                Blas::Ddot(nquad2, base2.get() + nquad2, 1,
                           &wsp[nquad2 * nmodes1 * numElmt + n * nquad2], 1);

            // add in (1+c)/2 (1+b)/2 (1+a)/2 component
            output[1 + n * totmodes] += Blas::Ddot(
                nquad2, base2.get() + nquad2, 1,
                &wsp[nquad2 * (nmodes1 + 1) * numElmt + n * nquad2], 1);
        }
    }
}

References ASSERTL1, Blas::Ddot(), Blas::Dgemm(), Nektar::LibUtilities::StdPyrData::getNumberOfCoefficients(), and Vmath::Vmul().

Referenced by Nektar::Collections::IProductWRTDerivBase_SumFac_Pyr::operator()(), and Nektar::Collections::IProductWRTBase_SumFac_Pyr::operator()().

◆ QuadIProduct()

void Nektar::Collections::QuadIProduct	(	bool	colldir0,
		bool	colldir1,
		int	numElmt,
		int	nquad0,
		int	nquad1,
		int	nmodes0,
		int	nmodes1,
		const Array< OneD, const NekDouble > &	base0,
		const Array< OneD, const NekDouble > &	base1,
		const Array< OneD, const NekDouble > &	jac,
		const Array< OneD, const NekDouble > &	input,
		Array< OneD, NekDouble > &	output,
		Array< OneD, NekDouble > &	wsp
	)

Definition at line 48 of file IProduct.cpp.

{
    // Inner product for a collection of numElmt quadrilateral elements:
    // input is scaled point-wise by jac and then contracted against base0
    // and base1. A colldirN flag set to true replaces the contraction in
    // direction N by a strided copy. wsp is scratch storage supplied by the
    // caller.
    int totpoints = nquad0 * nquad1;
    int totmodes  = nmodes0 * nmodes1;

    // Scale the input by jac into the start of the workspace.
    Vmath::Vmul(numElmt * totpoints, jac, 1, input, 1, wsp, 1);

    if (colldir0 && colldir1)
    {
        // Both directions flagged: the scaled data is the result; copy
        // numElmt * totmodes values to output.
        Vmath::Vcopy(numElmt * totmodes, wsp.get(), 1, output.get(), 1);
    }
    else
    {
        // Second scratch region, placed past the larger of the point-space
        // and mode-space footprints.
        Array<OneD, NekDouble> wsp1 = wsp + max(totpoints, totmodes) * numElmt;

        // Direction 0, all elements at once: wsp -> wsp1.
        if (colldir0)
        {
            for (int i = 0; i < nquad0; ++i)
            {
                Vmath::Vcopy(nquad1 * numElmt, &wsp[i], nquad0,
                             &wsp1[i * nquad1 * numElmt], 1);
            }
        }
        else
        {
            Blas::Dgemm('T', 'N', nquad1 * numElmt, nmodes0, nquad0, 1.0,
                        &wsp[0], nquad0, base0.get(), nquad0, 0.0, &wsp1[0],
                        nquad1 * numElmt);
        }

        if (numElmt > 1)
        {
            // Direction 1 for all elements: wsp1 -> wsp, followed by a
            // scatter into output.

            if (colldir1)
            {
                for (int i = 0; i < nquad1; ++i)
                {
                    Vmath::Vcopy(numElmt * nmodes0, &wsp1[i], nquad1,
                                 &wsp[i * numElmt * nmodes0], 1);
                }
            }
            else
            {

                Blas::Dgemm('T', 'N', numElmt * nmodes0, nmodes1, nquad1, 1.0,
                            &wsp1[0], nquad1, base1.get(), nquad1, 0.0, &wsp[0],
                            numElmt * nmodes0);
            }

            // For each mode i, the numElmt consecutive values in wsp go to
            // output[i], output[i + totmodes], ...
            for (int i = 0; i < totmodes; ++i)
            {
                Vmath::Vcopy(numElmt, &wsp[i * numElmt], 1, &output[i],
                             totmodes);
            }
        }
        else
        {
            // Single element: direction 1 writes directly into output, no
            // scatter step.
            if (colldir1)
            {
                for (int i = 0; i < nquad1; ++i)
                {
                    Vmath::Vcopy(numElmt * nmodes0, &wsp1[i], nquad1,
                                 &output[i * numElmt * nmodes0], 1);
                }
            }
            else
            {
                Blas::Dgemm('T', 'N', nmodes0, nmodes1, nquad1, 1.0, &wsp1[0],
                            nquad1, base1.get(), nquad1, 0.0, &output[0],
                            nmodes0);
            }
        }
    }
}

References Blas::Dgemm(), Vmath::Vcopy(), and Vmath::Vmul().

Referenced by Nektar::Collections::IProductWRTDerivBase_SumFac_Quad::operator()(), and Nektar::Collections::IProductWRTBase_SumFac_Quad::operator()().

◆ SetFixedImpType()

OperatorImpMap Nektar::Collections::SetFixedImpType ( ImplementationType defaultType )

Simple operator implementation map generator.

Definition at line 124 of file Operator.cpp.

{
    // Build a map that assigns defaultType to every operator type, visiting
    // each enumerator value below the SIZE_OperatorType sentinel.
    OperatorImpMap fixedMap;

    int opIndex = 0;
    while (opIndex < SIZE_OperatorType)
    {
        fixedMap[static_cast<OperatorType>(opIndex)] = defaultType;
        ++opIndex;
    }

    return fixedMap;
}

References SIZE_OperatorType.

◆ TetIProduct()

void Nektar::Collections::TetIProduct	(	bool	sortTopEdge,
		int	numElmt,
		int	nquad0,
		int	nquad1,
		int	nquad2,
		int	nmodes0,
		int	nmodes1,
		int	nmodes2,
		const Array< OneD, const NekDouble > &	base0,
		const Array< OneD, const NekDouble > &	base1,
		const Array< OneD, const NekDouble > &	base2,
		const Array< OneD, const NekDouble > &	jac,
		const Array< OneD, const NekDouble > &	input,
		Array< OneD, NekDouble > &	output,
		Array< OneD, NekDouble > &	wsp
	)

Definition at line 500 of file IProduct.cpp.

{
    // Sum-factorised inner product for a collection of numElmt tetrahedral
    // elements. The contraction is carried out one direction at a time
    // (0, then 1, then 2), alternating between the two scratch regions
    // wsp and wsp1, with the final stage writing into output.

    // Number of expansion coefficients per element; also used as the leading
    // dimension (per-element stride) of output in the last stage.
    int totmodes = LibUtilities::StdTetData::getNumberOfCoefficients(
        nmodes0, nmodes1, nmodes2);
    // Number of quadrature points per element.
    int totpoints = nquad0 * nquad1 * nquad2;
    // cnt   : column index into the stage-1 result held in wsp
    // mode  : running column offset into base1 (stage 1) / base2 (stage 2)
    // mode1 : running offset into each element's block of output
    int cnt;
    int mode, mode1;
 
    // Multiply input by jac point-by-point for all elements; result in wsp.
    Vmath::Vmul(numElmt * totpoints, jac, 1, input, 1, wsp, 1);
 
    // Second scratch region: a view into wsp offset past the larger of the
    // storage used by the weighted input and by the stage-1 result.
    Array<OneD, NekDouble> wsp1 =
        wsp +
        nquad2 * numElmt *
            (max(nquad0 * nquad1, nmodes0 * (2 * nmodes1 - nmodes0 + 1) / 2));
 
    // Perform iproduct  with respect to the  '0' direction
    // (reads wsp, writes wsp1: nmodes0 columns of nquad1*nquad2*numElmt)
    Blas::Dgemm('T', 'N', nquad1 * nquad2 * numElmt, nmodes0, nquad0, 1.0,
                wsp.get(), nquad0, base0.get(), nquad0, 0.0, wsp1.get(),
                nquad1 * nquad2 * numElmt);
 
    // Inner product with respect to the '1' direction
    // For each i only nmodes1 - i columns of base1 are used, starting at
    // column 'mode'; the result columns (length nquad2*numElmt) are packed
    // consecutively into wsp at the same column offset.
    mode = 0;
    for (int i = 0; i < nmodes0; ++i)
    {
        Blas::Dgemm('T', 'N', nquad2 * numElmt, nmodes1 - i, nquad1, 1.0,
                    wsp1.get() + i * nquad1 * nquad2 * numElmt, nquad1,
                    base1.get() + mode * nquad1, nquad1, 0.0,
                    wsp.get() + mode * nquad2 * numElmt, nquad2 * numElmt);
        mode += nmodes1 - i;
    }
 
    // fix for modified basis by splitting top vertex mode
    if (sortTopEdge)
    {
        // base singular vertex and singular edge (1+b)/2
        // ((1+a)/2 components entry into (1+b)/2)
        // Could be made into an mxm if we have specialised base1[1]
        // Per element: contract the i = 1 slab of wsp1 with the second
        // column of base1 and accumulate (beta = 1.0) into column 1 of the
        // stage-1 result in wsp.
        for (int n = 0; n < numElmt; ++n)
        {
            Blas::Dgemv('T', nquad1, nquad2, 1.0,
                        wsp1.get() + numElmt * nquad1 * nquad2 +
                            n * nquad1 * nquad2,
                        nquad1, base1.get() + nquad1, 1, 1.0,
                        wsp.get() + nquad2 * numElmt + n * nquad2, 1);
        }
    }
 
    // Inner product with respect to the '2' direction
    // Each (i, j) pair consumes one column block of wsp (index cnt) and
    // produces nmodes2 - i - j coefficients per element, written at offset
    // mode1 within every element's totmodes-long block of output.
    mode = mode1 = cnt = 0;
    for (int i = 0; i < nmodes0; ++i)
    {
        for (int j = 0; j < nmodes1 - i; ++j, ++cnt)
        {
            Blas::Dgemm('T', 'N', nmodes2 - i - j, numElmt, nquad2, 1.0,
                        base2.get() + mode * nquad2, nquad2,
                        wsp.get() + cnt * nquad2 * numElmt, nquad2, 0.0,
                        output.get() + mode1, totmodes);
            mode += nmodes2 - i - j;
            mode1 += nmodes2 - i - j;
        }
 
        // increment mode in case order1!=order2
        // (skips base2 columns that have no counterpart in output, so mode
        // and mode1 may diverge from here on)
        mode += (nmodes2 - nmodes1) * (nmodes2 - nmodes1 + 1) / 2;
    }
 
    // fix for modified basis for top singular vertex component
    // Already have evaluated (1+c)/2 (1-b)/2 (1-a)/2
    if (sortTopEdge)
    {
        // Both corrections below use the second column of base2 and are
        // accumulated into coefficient 1 of element n.
        for (int n = 0; n < numElmt; ++n)
        {
            // add in (1+c)/2 (1+b)/2 component
            output[1 + n * totmodes] +=
                Blas::Ddot(nquad2, base2.get() + nquad2, 1,
                           &wsp[nquad2 * numElmt + n * nquad2], 1);
 
            // add in (1+c)/2 (1-b)/2 (1+a)/2 component
            output[1 + n * totmodes] +=
                Blas::Ddot(nquad2, base2.get() + nquad2, 1,
                           &wsp[nquad2 * nmodes1 * numElmt + n * nquad2], 1);
        }
    }
}

References Blas::Ddot(), Blas::Dgemm(), Blas::Dgemv(), Nektar::LibUtilities::StdTetData::getNumberOfCoefficients(), and Vmath::Vmul().

Referenced by Nektar::Collections::IProductWRTDerivBase_SumFac_Tet::operator()(), and Nektar::Collections::IProductWRTBase_SumFac_Tet::operator()().

◆ TriIProduct()

void Nektar::Collections::TriIProduct	(	bool	sortTopVertex,
		int	numElmt,
		int	nquad0,
		int	nquad1,
		int	nmodes0,
		int	nmodes1,
		const Array< OneD, const NekDouble > &	base0,
		const Array< OneD, const NekDouble > &	base1,
		const Array< OneD, const NekDouble > &	jac,
		const Array< OneD, const NekDouble > &	input,
		Array< OneD, NekDouble > &	output,
		Array< OneD, NekDouble > &	wsp
	)

Definition at line 131 of file IProduct.cpp.

{
    // Per-element sizes: expansion coefficients and quadrature points.
    const int coeffsPerElmt =
        LibUtilities::StdTriData::getNumberOfCoefficients(nmodes0, nmodes1);
    const int pointsPerElmt = nquad0 * nquad1;

    // Multiply input by jac point-by-point for all elements; result in wsp.
    Vmath::Vmul(numElmt * pointsPerElmt, jac, 1, input, 1, wsp, 1);

    // Second scratch region: a view into wsp placed after
    // max(points, coefficients) entries per element.
    Array<OneD, NekDouble> scratch =
        wsp + max(pointsPerElmt, coeffsPerElmt) * numElmt;

    // Contraction over direction 0: reads wsp, writes nmodes0 columns of
    // length nquad1 * numElmt into the second scratch region.
    const int rowsDir0 = nquad1 * numElmt;
    Blas::Dgemm('T', 'N', rowsDir0, nmodes0, nquad0, 1.0, &wsp[0], nquad0,
                base0.get(), nquad0, 0.0, &scratch[0], rowsDir0);

    // Contraction over the 'b' direction. For index p only nmodes1 - p
    // columns of base1 take part; coeffOffset tracks both the first base1
    // column used and the position inside each element's block of output.
    int coeffOffset = 0;
    for (int p = 0; p < nmodes0; ++p)
    {
        const int activeModes = nmodes1 - p;

        Blas::Dgemm('T', 'N', activeModes, numElmt, nquad1, 1.0,
                    base1.get() + coeffOffset * nquad1, nquad1,
                    scratch.get() + p * nquad1 * numElmt, nquad1, 0.0,
                    &output[coeffOffset], coeffsPerElmt);

        coeffOffset += activeModes;
    }

    // Modified-basis correction for the split top vertex mode: contract the
    // p = 1 slab with the second column of base1 and accumulate (beta = 1.0)
    // into coefficient 1 of every element.
    if (sortTopVertex)
    {
        Blas::Dgemv('T', nquad1, numElmt, 1.0,
                    scratch.get() + nquad1 * numElmt, nquad1,
                    base1.get() + nquad1, 1, 1.0, &output[1], coeffsPerElmt);
    }
}

References Blas::Dgemm(), Blas::Dgemv(), Nektar::LibUtilities::StdTriData::getNumberOfCoefficients(), and Vmath::Vmul().

Referenced by Nektar::Collections::IProductWRTDerivBase_SumFac_Tri::operator()(), and Nektar::Collections::IProductWRTBase_SumFac_Tri::operator()().

Variable Documentation

◆ GeomDataNull

CoalescedGeomDataSharedPtr Nektar::Collections::GeomDataNull

static

Definition at line 94 of file CoalescedGeomData.h.

◆ ImplementationTypeMap

const char* const Nektar::Collections::ImplementationTypeMap[]

Initial value:

= {"NoImplementationType",
                                             "NoCollection",
                                             "IterPerExp",
                                             "StdMat",
                                             "SumFac",
                                             "MatrixFree"}

Definition at line 94 of file Operator.h.

Referenced by Nektar::Collections::CollectionOptimisation::CollectionOptimisation(), operator<<(), Nektar::Collections::CollectionOptimisation::ReadCollOps(), and Nektar::Collections::CollectionOptimisation::UpdateOptFile().

◆ ImplementationTypeMap1

const char* const Nektar::Collections::ImplementationTypeMap1[]

Initial value:

= {
    "NoImplementationType",
    "IterLocExp", 
    "IterStdExp", 
    "StdMat    ",
    "SumFac    ",
    "MatFree   " 
}

Definition at line 101 of file Operator.h.

Referenced by Nektar::Collections::CollectionOptimisation::SetWithTimings().

◆ OperatorTypeMap

const char* const Nektar::Collections::OperatorTypeMap[]

Initial value:

= {"BwdTrans", "Helmholtz",
                                       "IProductWRTBase",
                                       "IProductWRTDerivBase", "PhysDeriv"}

Definition at line 76 of file Operator.h.

Referenced by Nektar::Collections::CollectionOptimisation::CollectionOptimisation(), Nektar::Collections::Collection::Initialise(), operator<<(), Nektar::Collections::CollectionOptimisation::ReadCollOps(), and Nektar::Collections::CollectionOptimisation::UpdateOptFile().

◆ OperatorTypeMap1

const char* const Nektar::Collections::OperatorTypeMap1[]

Initial value:

= {"BwdTrans", "Helmholtz", "IPWrtBase",

"IPWrtDBase", "PhysDeriv "}

Definition at line 80 of file Operator.h.

Referenced by Nektar::Collections::CollectionOptimisation::SetWithTimings().

Classes

Typedefs

Enumerations

Functions

Variables

Typedef Documentation

◆ CoalescedGeomDataSharedPtr

◆ CollectionVector

◆ CollectionVectorSharedPtr

◆ ExpansionIsNodal

◆ OperatorFactory

◆ OperatorImpMap

◆ OperatorKey

◆ OperatorSharedPtr

◆ vec_t

◆ VecVec_t

Enumeration Type Documentation

◆ GeomData

◆ ImplementationType

◆ OperatorType

Function Documentation

◆ GetOperatorFactory()

◆ HexIProduct()

◆ operator<()

◆ operator<<()

◆ PrismIProduct()

◆ PyrIProduct()

◆ QuadIProduct()

◆ SetFixedImpType()

◆ TetIProduct()

◆ TriIProduct()

Variable Documentation

◆ GeomDataNull

◆ ImplementationTypeMap

◆ ImplementationTypeMap1

◆ OperatorTypeMap

◆ OperatorTypeMap1