Nektar++
BwdTrans.cpp
Go to the documentation of this file.
1///////////////////////////////////////////////////////////////////////////////
2//
3// File: BwdTrans.cpp
4//
5// For more information, please see: http://www.nektar.info
6//
7// The MIT License
8//
9// Copyright (c) 2006 Division of Applied Mathematics, Brown University (USA),
10// Department of Aeronautics, Imperial College London (UK), and Scientific
11// Computing and Imaging Institute, University of Utah (USA).
12//
13// Permission is hereby granted, free of charge, to any person obtaining a
14// copy of this software and associated documentation files (the "Software"),
15// to deal in the Software without restriction, including without limitation
16// the rights to use, copy, modify, merge, publish, distribute, sublicense,
17// and/or sell copies of the Software, and to permit persons to whom the
18// Software is furnished to do so, subject to the following conditions:
19//
20// The above copyright notice and this permission notice shall be included
21// in all copies or substantial portions of the Software.
22//
23// THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS
24// OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
25// FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
26// THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
27// LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
28// FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
29// DEALINGS IN THE SOFTWARE.
30//
31// Description: BwdTrans operator implementations
32//
33///////////////////////////////////////////////////////////////////////////////
34
38
39#include <MatrixFreeOps/Operator.hpp>
40
41using namespace std;
42
44{
45
53
54/**
55 * @brief Backward transform help class to calculate the size of the collection
56 * that is given as an input and as an output to the BwdTrans Operator. The size
57 * evaluation takes into account the conversion from the coefficient space to
58 * the physical space
59 */
60class BwdTrans_Helper : virtual public Operator
61{
62protected:
64 {
65 // expect input to be number of elements by the number of coefficients
66 m_inputSize = m_numElmt * m_stdExp->GetNcoeffs();
67 // expect input to be number of elements by the number of quad points
68 m_outputSize = m_numElmt * m_stdExp->GetTotPoints();
69 }
70};
71
72/**
73 * @brief Backward transform operator using standard matrix approach.
74 */
75class BwdTrans_StdMat final : virtual public Operator,
76 virtual public BwdTrans_Helper
77{
78public:
80
81 ~BwdTrans_StdMat() final = default;
82
83 void operator()(const Array<OneD, const NekDouble> &input,
84 Array<OneD, NekDouble> &output0,
85 [[maybe_unused]] Array<OneD, NekDouble> &output1,
86 [[maybe_unused]] Array<OneD, NekDouble> &output2,
87 [[maybe_unused]] Array<OneD, NekDouble> &wsp) override
88 {
89 Blas::Dgemm('N', 'N', m_mat->GetRows(), m_numElmt, m_mat->GetColumns(),
90 1.0, m_mat->GetRawPtr(), m_mat->GetRows(), input.get(),
91 m_stdExp->GetNcoeffs(), 0.0, output0.get(),
92 m_stdExp->GetTotPoints());
93 }
94
95 void operator()([[maybe_unused]] int dir,
96 [[maybe_unused]] const Array<OneD, const NekDouble> &input,
97 [[maybe_unused]] Array<OneD, NekDouble> &output,
98 [[maybe_unused]] Array<OneD, NekDouble> &wsp) final
99 {
100 ASSERTL0(false, "Not valid for this operator.");
101 }
102
104 [[maybe_unused]] int coll_phys_offset) override
105 {
106 ASSERTL0(false, "Not valid for this operator.");
107 }
108
109protected:
111
112private:
113 BwdTrans_StdMat(vector<StdRegions::StdExpansionSharedPtr> pCollExp,
116 : Operator(pCollExp, pGeomData, factors), BwdTrans_Helper()
117 {
119 m_stdExp->DetShapeType(), *m_stdExp);
120 m_mat = m_stdExp->GetStdMatrix(key);
121 }
122};
123
124/// Factory initialisation for the BwdTrans_StdMat operators
125OperatorKey BwdTrans_StdMat::m_typeArr[] = {
128 BwdTrans_StdMat::create, "BwdTrans_StdMat_Seg"),
131 BwdTrans_StdMat::create, "BwdTrans_StdMat_Tri"),
134 BwdTrans_StdMat::create, "BwdTrans_StdMat_NodalTri"),
137 BwdTrans_StdMat::create, "BwdTrans_StdMat_Quad"),
140 BwdTrans_StdMat::create, "BwdTrans_StdMat_Tet"),
143 BwdTrans_StdMat::create, "BwdTrans_StdMat_NodalTet"),
146 BwdTrans_StdMat::create, "BwdTrans_StdMat_Pyr"),
148 OperatorKey(ePrism, eBwdTrans, eStdMat, false), BwdTrans_StdMat::create,
149 "BwdTrans_StdMat_Prism"),
151 OperatorKey(ePrism, eBwdTrans, eStdMat, true), BwdTrans_StdMat::create,
152 "BwdTrans_StdMat_NodalPrism"),
155 BwdTrans_StdMat::create, "BwdTrans_StdMat_Hex"),
158 BwdTrans_StdMat::create, "BwdTrans_SumFac_Pyr")};
159
160/**
161 * @brief Backward transform operator using matrix free operators.
162 */
163class BwdTrans_MatrixFree final : virtual public Operator,
165 virtual public BwdTrans_Helper
166{
167public:
169
170 ~BwdTrans_MatrixFree() final = default;
171
172 void operator()(const Array<OneD, const NekDouble> &input,
173 Array<OneD, NekDouble> &output0,
174 [[maybe_unused]] Array<OneD, NekDouble> &output1,
175 [[maybe_unused]] Array<OneD, NekDouble> &output2,
176 [[maybe_unused]] Array<OneD, NekDouble> &wsp) final
177 {
178 if (m_isPadded)
179 {
180 // copy into padded vector
181 Vmath::Vcopy(m_nIn, input, 1, m_input, 1);
182 // call op
183 (*m_oper)(m_input, m_output);
184 // copy out of padded vector
185 Vmath::Vcopy(m_nOut, m_output, 1, output0, 1);
186 }
187 else
188 {
189 (*m_oper)(input, output0);
190 }
191 }
192
193 void operator()([[maybe_unused]] int dir,
194 [[maybe_unused]] const Array<OneD, const NekDouble> &input,
195 [[maybe_unused]] Array<OneD, NekDouble> &output,
196 [[maybe_unused]] Array<OneD, NekDouble> &wsp) final
197 {
199 "BwdTrans_MatrixFree: Not valid for this operator.");
200 }
201
203 [[maybe_unused]] int coll_phys_offset) override
204 {
205 ASSERTL0(false, "Not valid for this operator.");
206 }
207
208private:
209 std::shared_ptr<MatrixFree::BwdTrans> m_oper;
210
211 BwdTrans_MatrixFree(vector<StdRegions::StdExpansionSharedPtr> pCollExp,
214 : Operator(pCollExp, pGeomData, factors), BwdTrans_Helper(),
215 MatrixFreeOneInOneOut(pCollExp[0]->GetStdExp()->GetNcoeffs(),
216 pCollExp[0]->GetStdExp()->GetTotPoints(),
217 pCollExp.size())
218 {
219 // Basis vector.
220 const auto dim = pCollExp[0]->GetStdExp()->GetShapeDimension();
221 std::vector<LibUtilities::BasisSharedPtr> basis(dim);
222 for (auto i = 0; i < dim; ++i)
223 {
224 basis[i] = pCollExp[0]->GetBasis(i);
225 }
226
227 // Get shape type
228 auto shapeType = pCollExp[0]->GetStdExp()->DetShapeType();
229
230 // Generate operator string and create operator.
231 std::string op_string = "BwdTrans";
232 op_string += MatrixFree::GetOpstring(shapeType, false);
234 op_string, basis, m_nElmtPad);
235
236 m_oper = std::dynamic_pointer_cast<MatrixFree::BwdTrans>(oper);
237 ASSERTL0(m_oper, "Failed to cast pointer.");
238 }
239};
240
241/// Factory initialisation for the BwdTrans_MatrixFree operators
242OperatorKey BwdTrans_MatrixFree::m_typeArr[] = {
245 BwdTrans_MatrixFree::create, "BwdTrans_MatrixFree_Seg"),
248 BwdTrans_MatrixFree::create, "BwdTrans_MatrixFree_Quad"),
251 BwdTrans_MatrixFree::create, "BwdTrans_MatrixFree_Tri"),
254 BwdTrans_MatrixFree::create, "BwdTrans_MatrixFree_Hex"),
257 BwdTrans_MatrixFree::create, "BwdTrans_MatrixFree_Prism"),
260 BwdTrans_MatrixFree::create, "BwdTrans_MatrixFree_Tet"),
263 BwdTrans_MatrixFree::create, "BwdTrans_MatrixFree_Pyr")};
264
265/**
266 * @brief Backward transform operator using default StdRegions operator
267 */
268class BwdTrans_IterPerExp final : virtual public Operator,
269 virtual public BwdTrans_Helper
270{
271public:
273
274 ~BwdTrans_IterPerExp() final = default;
275
276 void operator()(const Array<OneD, const NekDouble> &input,
277 Array<OneD, NekDouble> &output0,
278 [[maybe_unused]] Array<OneD, NekDouble> &output1,
279 [[maybe_unused]] Array<OneD, NekDouble> &output2,
280 [[maybe_unused]] Array<OneD, NekDouble> &wsp) override
281 {
282 const int nCoeffs = m_stdExp->GetNcoeffs();
283 const int nPhys = m_stdExp->GetTotPoints();
285
286 for (int i = 0; i < m_numElmt; ++i)
287 {
288 m_stdExp->BwdTrans(input + i * nCoeffs, tmp = output0 + i * nPhys);
289 }
290 }
291
292 void operator()([[maybe_unused]] int dir,
293 [[maybe_unused]] const Array<OneD, const NekDouble> &input,
294 [[maybe_unused]] Array<OneD, NekDouble> &output,
295 [[maybe_unused]] Array<OneD, NekDouble> &wsp) final
296 {
297 ASSERTL0(false, "Not valid for this operator.");
298 }
299
301 [[maybe_unused]] int coll_phys_offset) override
302 {
303 ASSERTL0(false, "Not valid for this operator.");
304 }
305
306private:
307 BwdTrans_IterPerExp(vector<StdRegions::StdExpansionSharedPtr> pCollExp,
310 : Operator(pCollExp, pGeomData, factors), BwdTrans_Helper()
311 {
312 }
313};
314
315/// Factory initialisation for the BwdTrans_IterPerExp operators
316OperatorKey BwdTrans_IterPerExp::m_typeArr[] = {
319 BwdTrans_IterPerExp::create, "BwdTrans_IterPerExp_Seg"),
322 BwdTrans_IterPerExp::create, "BwdTrans_IterPerExp_Tri"),
325 BwdTrans_IterPerExp::create, "BwdTrans_IterPerExp_NodalTri"),
328 BwdTrans_IterPerExp::create, "BwdTrans_IterPerExp_Quad"),
331 BwdTrans_IterPerExp::create, "BwdTrans_IterPerExp_Tet"),
334 BwdTrans_IterPerExp::create, "BwdTrans_IterPerExp_NodalTet"),
337 BwdTrans_IterPerExp::create, "BwdTrans_IterPerExp_Pyr"),
340 BwdTrans_IterPerExp::create, "BwdTrans_IterPerExp_Prism"),
343 BwdTrans_IterPerExp::create, "BwdTrans_IterPerExp_NodalPrism"),
346 BwdTrans_IterPerExp::create, "BwdTrans_IterPerExp_Hex"),
347};
348
349/**
350 * @brief Backward transform operator using LocalRegions implementation.
351 */
352class BwdTrans_NoCollection final : virtual public Operator,
353 virtual public BwdTrans_Helper
354{
355public:
357
358 ~BwdTrans_NoCollection() final = default;
359
360 void operator()(const Array<OneD, const NekDouble> &input,
361 Array<OneD, NekDouble> &output0,
362 [[maybe_unused]] Array<OneD, NekDouble> &output1,
363 [[maybe_unused]] Array<OneD, NekDouble> &output2,
364 [[maybe_unused]] Array<OneD, NekDouble> &wsp) override
365 {
366 const int nCoeffs = m_expList[0]->GetNcoeffs();
367 const int nPhys = m_expList[0]->GetTotPoints();
369
370 for (int i = 0; i < m_numElmt; ++i)
371 {
372 m_expList[i]->BwdTrans(input + i * nCoeffs,
373 tmp = output0 + i * nPhys);
374 }
375 }
376
377 void operator()([[maybe_unused]] int dir,
378 [[maybe_unused]] const Array<OneD, const NekDouble> &input,
379 [[maybe_unused]] Array<OneD, NekDouble> &output,
380 [[maybe_unused]] Array<OneD, NekDouble> &wsp) final
381 {
382 ASSERTL0(false, "Not valid for this operator.");
383 }
384
386 [[maybe_unused]] int coll_phys_offset) override
387 {
388 ASSERTL0(false, "Not valid for this operator.");
389 }
390
391protected:
392 vector<StdRegions::StdExpansionSharedPtr> m_expList;
393
394private:
395 BwdTrans_NoCollection(vector<StdRegions::StdExpansionSharedPtr> pCollExp,
398 : Operator(pCollExp, pGeomData, factors), BwdTrans_Helper()
399 {
400 m_expList = pCollExp;
401 }
402};
403
404/// Factory initialisation for the BwdTrans_NoCollection operators
405OperatorKey BwdTrans_NoCollection::m_typeArr[] = {
408 BwdTrans_NoCollection::create, "BwdTrans_NoCollection_Seg"),
411 BwdTrans_NoCollection::create, "BwdTrans_NoCollection_Tri"),
414 BwdTrans_NoCollection::create, "BwdTrans_NoCollection_NodalTri"),
417 BwdTrans_NoCollection::create, "BwdTrans_NoCollection_Quad"),
420 BwdTrans_NoCollection::create, "BwdTrans_NoCollection_Tet"),
423 BwdTrans_NoCollection::create, "BwdTrans_NoCollection_NodalTet"),
426 BwdTrans_NoCollection::create, "BwdTrans_NoCollection_Pyr"),
429 BwdTrans_NoCollection::create, "BwdTrans_NoCollection_Prism"),
432 BwdTrans_NoCollection::create, "BwdTrans_NoCollection_NodalPrism"),
435 BwdTrans_NoCollection::create, "BwdTrans_NoCollection_Hex"),
436};
437
438/**
439 * @brief Backward transform operator using sum-factorisation (Segment)
440 */
441class BwdTrans_SumFac_Seg final : virtual public Operator,
442 virtual public BwdTrans_Helper
443{
444public:
446
447 ~BwdTrans_SumFac_Seg() final = default;
448
449 void operator()(const Array<OneD, const NekDouble> &input,
450 Array<OneD, NekDouble> &output0,
451 [[maybe_unused]] Array<OneD, NekDouble> &output1,
452 [[maybe_unused]] Array<OneD, NekDouble> &output2,
453 [[maybe_unused]] Array<OneD, NekDouble> &wsp) override
454 {
455 if (m_colldir0)
456 {
457 Vmath::Vcopy(m_numElmt * m_nmodes0, input.get(), 1, output0.get(),
458 1);
459 }
460 else
461 {
462 // out = B0*in;
463 Blas::Dgemm('N', 'N', m_nquad0, m_numElmt, m_nmodes0, 1.0,
464 m_base0.get(), m_nquad0, &input[0], m_nmodes0, 0.0,
465 &output0[0], m_nquad0);
466 }
467 }
468
469 void operator()([[maybe_unused]] int dir,
470 [[maybe_unused]] const Array<OneD, const NekDouble> &input,
471 [[maybe_unused]] Array<OneD, NekDouble> &output,
472 [[maybe_unused]] Array<OneD, NekDouble> &wsp) final
473 {
474 ASSERTL0(false, "Not valid for this operator.");
475 }
476
478 [[maybe_unused]] int coll_phys_offset) override
479 {
480 ASSERTL0(false, "Not valid for this operator.");
481 }
482
483protected:
484 const int m_nquad0;
485 const int m_nmodes0;
486 const bool m_colldir0;
488
489private:
490 BwdTrans_SumFac_Seg(vector<StdRegions::StdExpansionSharedPtr> pCollExp,
493 : Operator(pCollExp, pGeomData, factors), BwdTrans_Helper(),
494 m_nquad0(m_stdExp->GetNumPoints(0)),
495 m_nmodes0(m_stdExp->GetBasisNumModes(0)),
496 m_colldir0(m_stdExp->GetBasis(0)->Collocation()),
497 m_base0(m_stdExp->GetBasis(0)->GetBdata())
498 {
499 m_wspSize = 0;
500 }
501};
502
503/// Factory initialisation for the BwdTrans_SumFac_Seg operator
504OperatorKey BwdTrans_SumFac_Seg::m_type =
507 BwdTrans_SumFac_Seg::create, "BwdTrans_SumFac_Seg");
508
509/**
510 * @brief Backward transform operator using sum-factorisation (Quad)
511 */
512class BwdTrans_SumFac_Quad final : virtual public Operator,
513 virtual public BwdTrans_Helper
514{
515public:
517
518 ~BwdTrans_SumFac_Quad() final = default;
519
520 void operator()(const Array<OneD, const NekDouble> &input,
521 Array<OneD, NekDouble> &output0,
522 [[maybe_unused]] Array<OneD, NekDouble> &output1,
523 [[maybe_unused]] Array<OneD, NekDouble> &output2,
524 Array<OneD, NekDouble> &wsp) override
525 {
526 int i = 0;
527 if (m_colldir0 && m_colldir1)
528 {
529 Vmath::Vcopy(m_numElmt * m_nmodes0 * m_nmodes1, input.get(), 1,
530 output0.get(), 1);
531 }
532 else if (m_colldir0)
533 {
534 for (i = 0; i < m_numElmt; ++i)
535 {
536 Blas::Dgemm('N', 'T', m_nquad0, m_nquad1, m_nmodes1, 1.0,
537 &input[i * m_nquad0 * m_nmodes1], m_nquad0,
538 m_base1.get(), m_nquad1, 0.0,
539 &output0[i * m_nquad0 * m_nquad1], m_nquad0);
540 }
541 }
542 else if (m_colldir1)
543 {
545 1.0, m_base0.get(), m_nquad0, &input[0], m_nmodes0, 0.0,
546 &output0[0], m_nquad0);
547 }
548 else
549 {
550 ASSERTL1(wsp.size() == m_wspSize, "Incorrect workspace size");
551
552 // Those two calls correpsond to the operation
553 // out = B0*in*Transpose(B1);
555 1.0, m_base0.get(), m_nquad0, &input[0], m_nmodes0, 0.0,
556 &wsp[0], m_nquad0);
557
558 for (i = 0; i < m_numElmt; ++i)
559 {
560 Blas::Dgemm('N', 'T', m_nquad0, m_nquad1, m_nmodes1, 1.0,
561 &wsp[i * m_nquad0 * m_nmodes1], m_nquad0,
562 m_base1.get(), m_nquad1, 0.0,
563 &output0[i * m_nquad0 * m_nquad1], m_nquad0);
564 }
565 }
566 }
567
568 void operator()([[maybe_unused]] int dir,
569 [[maybe_unused]] const Array<OneD, const NekDouble> &input,
570 [[maybe_unused]] Array<OneD, NekDouble> &output,
571 [[maybe_unused]] Array<OneD, NekDouble> &wsp) final
572 {
573 ASSERTL0(false, "Not valid for this operator.");
574 }
575
577 [[maybe_unused]] int coll_phys_offset) override
578 {
579 ASSERTL0(false, "Not valid for this operator.");
580 }
581
582protected:
583 const int m_nquad0;
584 const int m_nquad1;
585 const int m_nmodes0;
586 const int m_nmodes1;
587 const bool m_colldir0;
588 const bool m_colldir1;
591
592private:
593 BwdTrans_SumFac_Quad(vector<StdRegions::StdExpansionSharedPtr> pCollExp,
596 : Operator(pCollExp, pGeomData, factors), BwdTrans_Helper(),
597 m_nquad0(m_stdExp->GetNumPoints(0)),
598 m_nquad1(m_stdExp->GetNumPoints(1)),
599 m_nmodes0(m_stdExp->GetBasisNumModes(0)),
600 m_nmodes1(m_stdExp->GetBasisNumModes(1)),
601 m_colldir0(m_stdExp->GetBasis(0)->Collocation()),
602 m_colldir1(m_stdExp->GetBasis(1)->Collocation()),
603 m_base0(m_stdExp->GetBasis(0)->GetBdata()),
604 m_base1(m_stdExp->GetBasis(1)->GetBdata())
605 {
607 }
608};
609
610/// Factory initialisation for the BwdTrans_SumFac_Quad operator
611OperatorKey BwdTrans_SumFac_Quad::m_type =
614 BwdTrans_SumFac_Quad::create, "BwdTrans_SumFac_Quad");
615
616/**
617 * @brief Backward transform operator using sum-factorisation (Tri)
618 */
619class BwdTrans_SumFac_Tri final : virtual public Operator,
620 virtual public BwdTrans_Helper
621{
622public:
624
625 ~BwdTrans_SumFac_Tri() final = default;
626
627 void operator()(const Array<OneD, const NekDouble> &input,
628 Array<OneD, NekDouble> &output0,
629 [[maybe_unused]] Array<OneD, NekDouble> &output1,
630 [[maybe_unused]] Array<OneD, NekDouble> &output2,
631 Array<OneD, NekDouble> &wsp) override
632 {
633 ASSERTL1(wsp.size() == m_wspSize, "Incorrect workspace size");
634
635 int ncoeffs = m_stdExp->GetNcoeffs();
636 int i = 0;
637 int mode = 0;
638
639 for (i = mode = 0; i < m_nmodes0; ++i)
640 {
641 Blas::Dgemm('N', 'N', m_nquad1, m_numElmt, m_nmodes1 - i, 1.0,
642 m_base1.get() + mode * m_nquad1, m_nquad1,
643 &input[0] + mode, ncoeffs, 0.0,
644 &wsp[i * m_nquad1 * m_numElmt], m_nquad1);
645 mode += m_nmodes1 - i;
646 }
647
648 // fix for modified basis by splitting top vertex mode
649 if (m_sortTopVertex)
650 {
651 for (i = 0; i < m_numElmt; ++i)
652 {
653 Blas::Daxpy(m_nquad1, input[1 + i * ncoeffs],
654 m_base1.get() + m_nquad1, 1,
655 &wsp[m_nquad1 * m_numElmt] + i * m_nquad1, 1);
656 }
657 }
658
660 m_base0.get(), m_nquad0, &wsp[0], m_nquad1 * m_numElmt, 0.0,
661 &output0[0], m_nquad0);
662 }
663
664 void operator()([[maybe_unused]] int dir,
665 [[maybe_unused]] const Array<OneD, const NekDouble> &input,
666 [[maybe_unused]] Array<OneD, NekDouble> &output,
667 [[maybe_unused]] Array<OneD, NekDouble> &wsp) final
668 {
669 ASSERTL0(false, "Not valid for this operator.");
670 }
671
673 [[maybe_unused]] int coll_phys_offset) override
674 {
675 ASSERTL0(false, "Not valid for this operator.");
676 }
677
678protected:
679 const int m_nquad0;
680 const int m_nquad1;
681 const int m_nmodes0;
682 const int m_nmodes1;
686
687private:
688 BwdTrans_SumFac_Tri(vector<StdRegions::StdExpansionSharedPtr> pCollExp,
691 : Operator(pCollExp, pGeomData, factors),
692 m_nquad0(m_stdExp->GetNumPoints(0)),
693 m_nquad1(m_stdExp->GetNumPoints(1)),
694 m_nmodes0(m_stdExp->GetBasisNumModes(0)),
695 m_nmodes1(m_stdExp->GetBasisNumModes(1)),
696 m_base0(m_stdExp->GetBasis(0)->GetBdata()),
697 m_base1(m_stdExp->GetBasis(1)->GetBdata())
698 {
700 if (m_stdExp->GetBasis(0)->GetBasisType() == LibUtilities::eModified_A)
701 {
702 m_sortTopVertex = true;
703 }
704 else
705 {
706 m_sortTopVertex = false;
707 }
708 }
709};
710
711/// Factory initialisation for the BwdTrans_SumFac_Tri operator
712OperatorKey BwdTrans_SumFac_Tri::m_type =
715 BwdTrans_SumFac_Tri::create, "BwdTrans_SumFac_Tri");
716
717/// Backward transform operator using sum-factorisation (Hex)
718class BwdTrans_SumFac_Hex final : virtual public Operator,
719 virtual public BwdTrans_Helper
720{
721public:
723
724 ~BwdTrans_SumFac_Hex() final = default;
725
726 void operator()(const Array<OneD, const NekDouble> &input,
727 Array<OneD, NekDouble> &output0,
728 [[maybe_unused]] Array<OneD, NekDouble> &output1,
729 [[maybe_unused]] Array<OneD, NekDouble> &output2,
730 Array<OneD, NekDouble> &wsp) override
731 {
733 {
735 input.get(), 1, output0.get(), 1);
736 }
737 else
738 {
739 ASSERTL1(wsp.size() == m_wspSize, "Incorrect workspace size");
740
741 // Assign second half of workspace for 2nd DGEMM operation.
742 int totmodes = m_nmodes0 * m_nmodes1 * m_nmodes2;
743
746
747 // loop over elements and do bwd trans wrt c
748 for (int n = 0; n < m_numElmt; ++n)
749 {
751 m_nmodes2, 1.0, m_base2.get(), m_nquad2,
752 &input[n * totmodes], m_nmodes0 * m_nmodes1, 0.0,
753 &wsp[n * m_nquad2], m_nquad2 * m_numElmt);
754 }
755
756 // trans wrt b
758 m_nmodes1, 1.0, m_base1.get(), m_nquad1, wsp.get(),
759 m_nquad2 * m_numElmt * m_nmodes0, 0.0, wsp2.get(),
760 m_nquad1);
761
762 // trans wrt a
764 m_nmodes0, 1.0, m_base0.get(), m_nquad0, wsp2.get(),
765 m_nquad1 * m_nquad2 * m_numElmt, 0.0, output0.get(),
766 m_nquad0);
767 }
768 }
769
770 void operator()([[maybe_unused]] int dir,
771 [[maybe_unused]] const Array<OneD, const NekDouble> &input,
772 [[maybe_unused]] Array<OneD, NekDouble> &output,
773 [[maybe_unused]] Array<OneD, NekDouble> &wsp) final
774 {
775 ASSERTL0(false, "Not valid for this operator.");
776 }
777
779 [[maybe_unused]] int coll_phys_offset) override
780 {
781 ASSERTL0(false, "Not valid for this operator.");
782 }
783
784protected:
785 const int m_nquad0;
786 const int m_nquad1;
787 const int m_nquad2;
788 const int m_nmodes0;
789 const int m_nmodes1;
790 const int m_nmodes2;
794 const bool m_colldir0;
795 const bool m_colldir1;
796 const bool m_colldir2;
797
798private:
799 BwdTrans_SumFac_Hex(vector<StdRegions::StdExpansionSharedPtr> pCollExp,
802 : Operator(pCollExp, pGeomData, factors), BwdTrans_Helper(),
803 m_nquad0(pCollExp[0]->GetNumPoints(0)),
804 m_nquad1(pCollExp[0]->GetNumPoints(1)),
805 m_nquad2(pCollExp[0]->GetNumPoints(2)),
806 m_nmodes0(pCollExp[0]->GetBasisNumModes(0)),
807 m_nmodes1(pCollExp[0]->GetBasisNumModes(1)),
808 m_nmodes2(pCollExp[0]->GetBasisNumModes(2)),
809 m_base0(pCollExp[0]->GetBasis(0)->GetBdata()),
810 m_base1(pCollExp[0]->GetBasis(1)->GetBdata()),
811 m_base2(pCollExp[0]->GetBasis(2)->GetBdata()),
812 m_colldir0(pCollExp[0]->GetBasis(0)->Collocation()),
813 m_colldir1(pCollExp[0]->GetBasis(1)->Collocation()),
814 m_colldir2(pCollExp[0]->GetBasis(2)->Collocation())
815 {
818 }
819};
820
821/// Factory initialisation for the BwdTrans_SumFac_Hex operator
822OperatorKey BwdTrans_SumFac_Hex::m_type =
825 BwdTrans_SumFac_Hex::create, "BwdTrans_SumFac_Hex");
826
827/**
828 * @brief Backward transform operator using sum-factorisation (Tet)
829 */
830class BwdTrans_SumFac_Tet final : virtual public Operator,
831 virtual public BwdTrans_Helper
832{
833public:
835
836 ~BwdTrans_SumFac_Tet() final = default;
837
838 void operator()(const Array<OneD, const NekDouble> &input,
839 Array<OneD, NekDouble> &output0,
840 [[maybe_unused]] Array<OneD, NekDouble> &output1,
841 [[maybe_unused]] Array<OneD, NekDouble> &output2,
842 Array<OneD, NekDouble> &wsp) final
843 {
844 ASSERTL1(wsp.size() == m_wspSize, "Incorrect workspace size");
845
846 Array<OneD, NekDouble> tmp = wsp;
848 tmp + m_numElmt * m_nquad2 * m_nmodes0 *
849 (2 * m_nmodes1 - m_nmodes0 + 1) / 2;
850
851 int mode = 0;
852 int mode1 = 0;
853 int cnt = 0;
854 int ncoeffs = m_stdExp->GetNcoeffs();
855
856 // Perform summation over '2' direction
857 for (int i = 0; i < m_nmodes0; ++i)
858 {
859 for (int j = 0; j < m_nmodes1 - i; ++j, ++cnt)
860 {
861 Blas::Dgemm('N', 'N', m_nquad2, m_numElmt, m_nmodes2 - i - j,
862 1.0, m_base2.get() + mode * m_nquad2, m_nquad2,
863 input.get() + mode1, ncoeffs, 0.0,
864 tmp.get() + cnt * m_nquad2 * m_numElmt, m_nquad2);
865 mode += m_nmodes2 - i - j;
866 mode1 += m_nmodes2 - i - j;
867 }
868
869 // increment mode in case m_nmodes1!=m_nmodes2
870 mode += (m_nmodes2 - m_nmodes1) * (m_nmodes2 - m_nmodes1 + 1) / 2;
871 }
872
873 // vertex mode - currently (1+c)/2 x (1-b)/2 x (1-a)/2
874 // component is evaluated
875 if (m_sortTopEdge)
876 {
877 for (int i = 0; i < m_numElmt; ++i)
878 {
879 // top singular vertex
880 // (1+c)/2 x (1+b)/2 x (1-a)/2 component
881 Blas::Daxpy(m_nquad2, input[1 + i * ncoeffs],
882 m_base2.get() + m_nquad2, 1,
883 &tmp[m_nquad2 * m_numElmt] + i * m_nquad2, 1);
884
885 // top singular vertex
886 // (1+c)/2 x (1-b)/2 x (1+a)/2 component
888 m_nquad2, input[1 + i * ncoeffs], m_base2.get() + m_nquad2,
889 1, &tmp[m_nmodes1 * m_nquad2 * m_numElmt] + i * m_nquad2,
890 1);
891 }
892 }
893
894 // Perform summation over '1' direction
895 mode = 0;
896 for (int i = 0; i < m_nmodes0; ++i)
897 {
899 1.0, m_base1.get() + mode * m_nquad1, m_nquad1,
900 tmp.get() + mode * m_nquad2 * m_numElmt,
901 m_nquad2 * m_numElmt, 0.0,
902 tmp1.get() + i * m_nquad1 * m_nquad2 * m_numElmt,
903 m_nquad1);
904 mode += m_nmodes1 - i;
905 }
906
907 // fix for modified basis by adding additional split of
908 // top and base singular vertex modes as well as singular
909 // edge
910 if (m_sortTopEdge)
911 {
912 // this could probably be a dgemv or higher if we
913 // made a specialised m_base1[m_nuqad1] array
914 // containing multiply copies
915 for (int i = 0; i < m_numElmt; ++i)
916 {
917 // sort out singular vertices and singular
918 // edge components with (1+b)/2 (1+a)/2 form
919 for (int j = 0; j < m_nquad2; ++j)
920 {
922 tmp[m_nquad2 * m_numElmt + i * m_nquad2 + j],
923 m_base1.get() + m_nquad1, 1,
924 &tmp1[m_nquad1 * m_nquad2 * m_numElmt] +
925 i * m_nquad1 * m_nquad2 + j * m_nquad1,
926 1);
927 }
928 }
929 }
930
931 // Perform summation over '0' direction
933 m_nmodes0, 1.0, m_base0.get(), m_nquad0, tmp1.get(),
934 m_nquad1 * m_nquad2 * m_numElmt, 0.0, output0.get(),
935 m_nquad0);
936 }
937
938 void operator()([[maybe_unused]] int dir,
939 [[maybe_unused]] const Array<OneD, const NekDouble> &input,
940 [[maybe_unused]] Array<OneD, NekDouble> &output,
941 [[maybe_unused]] Array<OneD, NekDouble> &wsp) final
942 {
943 ASSERTL0(false, "Not valid for this operator.");
944 }
945
947 [[maybe_unused]] int coll_phys_offset) override
948 {
949 ASSERTL0(false, "Not valid for this operator.");
950 }
951
952protected:
953 const int m_nquad0;
954 const int m_nquad1;
955 const int m_nquad2;
956 const int m_nmodes0;
957 const int m_nmodes1;
958 const int m_nmodes2;
963
964private:
965 BwdTrans_SumFac_Tet(vector<StdRegions::StdExpansionSharedPtr> pCollExp,
968 : Operator(pCollExp, pGeomData, factors), BwdTrans_Helper(),
969 m_nquad0(m_stdExp->GetNumPoints(0)),
970 m_nquad1(m_stdExp->GetNumPoints(1)),
971 m_nquad2(m_stdExp->GetNumPoints(2)),
972 m_nmodes0(m_stdExp->GetBasisNumModes(0)),
973 m_nmodes1(m_stdExp->GetBasisNumModes(1)),
974 m_nmodes2(m_stdExp->GetBasisNumModes(2)),
975 m_base0(m_stdExp->GetBasis(0)->GetBdata()),
976 m_base1(m_stdExp->GetBasis(1)->GetBdata()),
977 m_base2(m_stdExp->GetBasis(2)->GetBdata())
978 {
980 (2 * m_nmodes1 - m_nmodes0 + 1) / 2 +
982
983 if (m_stdExp->GetBasis(0)->GetBasisType() == LibUtilities::eModified_A)
984 {
985 m_sortTopEdge = true;
986 }
987 else
988 {
989 m_sortTopEdge = false;
990 }
991 }
992};
993
994/// Factory initialisation for the BwdTrans_SumFac_Tet operator
995OperatorKey BwdTrans_SumFac_Tet::m_type =
998 BwdTrans_SumFac_Tet::create, "BwdTrans_SumFac_Tet");
999
1000/**
1001 * @brief Backward transform operator using sum-factorisation (Prism)
1002 */
1003class BwdTrans_SumFac_Prism final : virtual public Operator,
1004 virtual public BwdTrans_Helper
1005{
1006public:
1008
1009 ~BwdTrans_SumFac_Prism() final = default;
1010
1011 void operator()(const Array<OneD, const NekDouble> &input,
1012 Array<OneD, NekDouble> &output0,
1013 [[maybe_unused]] Array<OneD, NekDouble> &output1,
1014 [[maybe_unused]] Array<OneD, NekDouble> &output2,
1015 Array<OneD, NekDouble> &wsp) final
1016 {
1017 ASSERTL1(wsp.size() == m_wspSize, "Incorrect workspace size");
1018
1019 // Assign second half of workspace for 2nd DGEMM operation.
1020 int totmodes = m_stdExp->GetNcoeffs();
1021
1024
1026 int i = 0;
1027 int j = 0;
1028 int mode = 0;
1029 int mode1 = 0;
1030 int cnt = 0;
1031 for (i = mode = mode1 = 0; i < m_nmodes0; ++i)
1032 {
1033 cnt = i * m_nquad2 * m_numElmt;
1034 for (j = 0; j < m_nmodes1; ++j)
1035 {
1036 Blas::Dgemm('N', 'N', m_nquad2, m_numElmt, m_nmodes2 - i, 1.0,
1037 m_base2.get() + mode * m_nquad2, m_nquad2,
1038 input.get() + mode1, totmodes, 0.0,
1039 &wsp[j * m_nquad2 * m_numElmt * m_nmodes0 + cnt],
1040 m_nquad2);
1041 mode1 += m_nmodes2 - i;
1042 }
1043 mode += m_nmodes2 - i;
1044 }
1045
1046 // fix for modified basis by splitting top vertex mode
1047 if (m_sortTopVertex)
1048 {
1049 for (j = 0; j < m_nmodes1; ++j)
1050 {
1051 for (i = 0; i < m_numElmt; ++i)
1052 {
1054 input[1 + i * totmodes + j * m_nmodes2],
1055 m_base2.get() + m_nquad2, 1,
1056 &wsp[j * m_nquad2 * m_numElmt * m_nmodes0 +
1057 m_nquad2 * m_numElmt] +
1058 i * m_nquad2,
1059 1);
1060 }
1061 }
1062 // Believe this could be made into a m_nmodes1
1063 // dgemv if we made an array of m_numElmt copies
1064 // of m_base2[m_quad2] (which are of size
1065 // m_nquad2.
1066 }
1067
1068 // Perform summation over '1' direction
1070 m_nmodes1, 1.0, m_base1.get(), m_nquad1, wsp.get(),
1071 m_nquad2 * m_numElmt * m_nmodes0, 0.0, wsp2.get(),
1072 m_nquad1);
1073
1074 // Perform summation over '0' direction
1076 m_nmodes0, 1.0, m_base0.get(), m_nquad0, wsp2.get(),
1077 m_nquad1 * m_nquad2 * m_numElmt, 0.0, output0.get(),
1078 m_nquad0);
1079 }
1080
1081 void operator()([[maybe_unused]] int dir,
1082 [[maybe_unused]] const Array<OneD, const NekDouble> &input,
1083 [[maybe_unused]] Array<OneD, NekDouble> &output,
1084 [[maybe_unused]] Array<OneD, NekDouble> &wsp) final
1085 {
1086 ASSERTL0(false, "Not valid for this operator.");
1087 }
1088
1090 [[maybe_unused]] int coll_phys_offset) override
1091 {
1092 ASSERTL0(false, "Not valid for this operator.");
1093 }
1094
1095protected:
1096 const int m_nquad0;
1097 const int m_nquad1;
1098 const int m_nquad2;
1099 const int m_nmodes0;
1100 const int m_nmodes1;
1101 const int m_nmodes2;
1106
1107private:
1108 BwdTrans_SumFac_Prism(vector<StdRegions::StdExpansionSharedPtr> pCollExp,
1111 : Operator(pCollExp, pGeomData, factors), BwdTrans_Helper(),
1112 m_nquad0(m_stdExp->GetNumPoints(0)),
1113 m_nquad1(m_stdExp->GetNumPoints(1)),
1114 m_nquad2(m_stdExp->GetNumPoints(2)),
1115 m_nmodes0(m_stdExp->GetBasisNumModes(0)),
1116 m_nmodes1(m_stdExp->GetBasisNumModes(1)),
1117 m_nmodes2(m_stdExp->GetBasisNumModes(2)),
1118 m_base0(m_stdExp->GetBasis(0)->GetBdata()),
1119 m_base1(m_stdExp->GetBasis(1)->GetBdata()),
1120 m_base2(m_stdExp->GetBasis(2)->GetBdata())
1121 {
1124
1125 if (m_stdExp->GetBasis(0)->GetBasisType() == LibUtilities::eModified_A)
1126 {
1127 m_sortTopVertex = true;
1128 }
1129 else
1130 {
1131 m_sortTopVertex = false;
1132 }
1133 }
1134};
1135
1136/// Factory initialisation for the BwdTrans_SumFac_Prism operator
1137OperatorKey BwdTrans_SumFac_Prism::m_type =
1140 BwdTrans_SumFac_Prism::create, "BwdTrans_SumFac_Prism");
1141
1142/**
1143 * @brief Backward transform operator using sum-factorisation (Pyr)
1144 */
1145class BwdTrans_SumFac_Pyr final : virtual public Operator,
1146 virtual public BwdTrans_Helper
1147{
1148public:
1150
1151 ~BwdTrans_SumFac_Pyr() final = default;
1152
1153 void operator()(const Array<OneD, const NekDouble> &input,
1154 Array<OneD, NekDouble> &output0,
1155 [[maybe_unused]] Array<OneD, NekDouble> &output1,
1156 [[maybe_unused]] Array<OneD, NekDouble> &output2,
1157 Array<OneD, NekDouble> &wsp) final
1158 {
1159 ASSERTL1(wsp.size() == m_wspSize, "Incorrect workspace size");
1160
1161 // Assign second half of workspace for 2nd DGEMM operation.
1162 int totmodes = m_stdExp->GetNcoeffs();
1163
1166
1168 int i = 0;
1169 int j = 0;
1170 int mode = 0;
1171 int mode1 = 0;
1172 int cnt = 0;
1173 for (i = 0; i < m_nmodes0; ++i)
1174 {
1175 for (j = 0; j < m_nmodes1; ++j, ++cnt)
1176 {
1177 int ijmax = max(i, j);
1178 Blas::Dgemm('N', 'N', m_nquad2, m_numElmt, m_nmodes2 - ijmax,
1179 1.0, m_base2.get() + mode * m_nquad2, m_nquad2,
1180 input.get() + mode1, totmodes, 0.0,
1181 wsp.get() + cnt * m_nquad2 * m_numElmt, m_nquad2);
1182 mode += m_nmodes2 - ijmax;
1183 mode1 += m_nmodes2 - ijmax;
1184 }
1185
1186 // increment mode in case order1!=order2
1187 for (j = m_nmodes1; j < m_nmodes2 - i; ++j)
1188 {
1189 int ijmax = max(i, j);
1190 mode += m_nmodes2 - ijmax;
1191 }
1192 }
1193
1194 // vertex mode - currently (1+c)/2 x (1-b)/2 x (1-a)/2
1195 // component is evaluated
1196 if (m_sortTopVertex)
1197 {
1198 for (i = 0; i < m_numElmt; ++i)
1199 {
1200 // top singular vertex
1201 // (1+c)/2 x (1+b)/2 x (1-a)/2 component
1202 Blas::Daxpy(m_nquad2, input[1 + i * totmodes],
1203 m_base2.get() + m_nquad2, 1,
1204 &wsp[m_nquad2 * m_numElmt] + i * m_nquad2, 1);
1205
1206 // top singular vertex
1207 // (1+c)/2 x (1-b)/2 x (1+a)/2 component
1209 m_nquad2, input[1 + i * totmodes], m_base2.get() + m_nquad2,
1210 1, &wsp[m_nmodes1 * m_nquad2 * m_numElmt] + i * m_nquad2,
1211 1);
1212
1213 // top singular vertex
1214 // (1+c)/2 x (1+b)/2 x (1+a)/2 component
1215 Blas::Daxpy(m_nquad2, input[1 + i * totmodes],
1216 m_base2.get() + m_nquad2, 1,
1217 &wsp[(m_nmodes1 + 1) * m_nquad2 * m_numElmt] +
1218 i * m_nquad2,
1219 1);
1220 }
1221 }
1222
1223 // Perform summation over '1' direction
1224 mode = 0;
1225 for (i = 0; i < m_nmodes0; ++i)
1226 {
1228 1.0, m_base1.get(), m_nquad1,
1229 wsp.get() + mode * m_nquad2 * m_numElmt,
1230 m_nquad2 * m_numElmt, 0.0,
1231 wsp2.get() + i * m_nquad1 * m_nquad2 * m_numElmt,
1232 m_nquad1);
1233 mode += m_nmodes1;
1234 }
1235
1236 // Perform summation over '0' direction
1238 m_nmodes0, 1.0, m_base0.get(), m_nquad0, wsp2.get(),
1239 m_nquad1 * m_nquad2 * m_numElmt, 0.0, output0.get(),
1240 m_nquad0);
1241 }
1242
1243 void operator()([[maybe_unused]] int dir,
1244 [[maybe_unused]] const Array<OneD, const NekDouble> &input,
1245 [[maybe_unused]] Array<OneD, NekDouble> &output,
1246 [[maybe_unused]] Array<OneD, NekDouble> &wsp) final
1247 {
1248 ASSERTL0(false, "Not valid for this operator.");
1249 }
1250
1252 [[maybe_unused]] int coll_phys_offset) override
1253 {
1254 ASSERTL0(false, "Not valid for this operator.");
1255 }
1256
1257protected:
1258 const int m_nquad0;
1259 const int m_nquad1;
1260 const int m_nquad2;
1261 const int m_nmodes0;
1262 const int m_nmodes1;
1263 const int m_nmodes2;
1268
1269private:
1270 BwdTrans_SumFac_Pyr(vector<StdRegions::StdExpansionSharedPtr> pCollExp,
1273 : Operator(pCollExp, pGeomData, factors), BwdTrans_Helper(),
1274 m_nquad0(m_stdExp->GetNumPoints(0)),
1275 m_nquad1(m_stdExp->GetNumPoints(1)),
1276 m_nquad2(m_stdExp->GetNumPoints(2)),
1277 m_nmodes0(m_stdExp->GetBasisNumModes(0)),
1278 m_nmodes1(m_stdExp->GetBasisNumModes(1)),
1279 m_nmodes2(m_stdExp->GetBasisNumModes(2)),
1280 m_base0(m_stdExp->GetBasis(0)->GetBdata()),
1281 m_base1(m_stdExp->GetBasis(1)->GetBdata()),
1282 m_base2(m_stdExp->GetBasis(2)->GetBdata())
1283 {
1285
1286 if (m_stdExp->GetBasis(0)->GetBasisType() == LibUtilities::eModified_A)
1287 {
1288 m_sortTopVertex = true;
1289 }
1290 else
1291 {
1292 m_sortTopVertex = false;
1293 }
1294 }
1295};
1296
1297/// Factory initialisation for the BwdTrans_SumFac_Pyr operator
1298OperatorKey BwdTrans_SumFac_Pyr::m_type =
1301 BwdTrans_SumFac_Pyr::create, "BwdTrans_SumFac_Pyr");
1302
1303} // namespace Nektar::Collections
#define ASSERTL0(condition, msg)
Definition: ErrorUtil.hpp:208
#define NEKERROR(type, msg)
Assert Level 0 – Fundamental assert which is used whether in FULLDEBUG, DEBUG or OPT compilation mode...
Definition: ErrorUtil.hpp:202
#define ASSERTL1(condition, msg)
Assert Level 1 – Debugging which is used whether in FULLDEBUG or DEBUG compilation mode....
Definition: ErrorUtil.hpp:242
#define OPERATOR_CREATE(cname)
Definition: Operator.h:43
Backward transform help class to calculate the size of the collection that is given as an input and a...
Definition: BwdTrans.cpp:61
Backward transform operator using default StdRegions operator.
Definition: BwdTrans.cpp:270
void operator()(int dir, const Array< OneD, const NekDouble > &input, Array< OneD, NekDouble > &output, Array< OneD, NekDouble > &wsp) final
Definition: BwdTrans.cpp:292
BwdTrans_IterPerExp(vector< StdRegions::StdExpansionSharedPtr > pCollExp, CoalescedGeomDataSharedPtr pGeomData, StdRegions::FactorMap factors)
Definition: BwdTrans.cpp:307
void CheckFactors(StdRegions::FactorMap factors, int coll_phys_offset) override
Check the validity of the supplied factor map.
Definition: BwdTrans.cpp:300
Backward transform operator using matrix free operators.
Definition: BwdTrans.cpp:166
std::shared_ptr< MatrixFree::BwdTrans > m_oper
Definition: BwdTrans.cpp:209
void CheckFactors(StdRegions::FactorMap factors, int coll_phys_offset) override
Check the validity of the supplied factor map.
Definition: BwdTrans.cpp:202
void operator()(int dir, const Array< OneD, const NekDouble > &input, Array< OneD, NekDouble > &output, Array< OneD, NekDouble > &wsp) final
Definition: BwdTrans.cpp:193
BwdTrans_MatrixFree(vector< StdRegions::StdExpansionSharedPtr > pCollExp, CoalescedGeomDataSharedPtr pGeomData, StdRegions::FactorMap factors)
Definition: BwdTrans.cpp:211
Backward transform operator using LocalRegions implementation.
Definition: BwdTrans.cpp:354
BwdTrans_NoCollection(vector< StdRegions::StdExpansionSharedPtr > pCollExp, CoalescedGeomDataSharedPtr pGeomData, StdRegions::FactorMap factors)
Definition: BwdTrans.cpp:395
void CheckFactors(StdRegions::FactorMap factors, int coll_phys_offset) override
Check the validity of the supplied factor map.
Definition: BwdTrans.cpp:385
vector< StdRegions::StdExpansionSharedPtr > m_expList
Definition: BwdTrans.cpp:392
void operator()(int dir, const Array< OneD, const NekDouble > &input, Array< OneD, NekDouble > &output, Array< OneD, NekDouble > &wsp) final
Definition: BwdTrans.cpp:377
Backward transform operator using standard matrix approach.
Definition: BwdTrans.cpp:77
void operator()(int dir, const Array< OneD, const NekDouble > &input, Array< OneD, NekDouble > &output, Array< OneD, NekDouble > &wsp) final
Definition: BwdTrans.cpp:95
BwdTrans_StdMat(vector< StdRegions::StdExpansionSharedPtr > pCollExp, CoalescedGeomDataSharedPtr pGeomData, StdRegions::FactorMap factors)
Definition: BwdTrans.cpp:113
void CheckFactors(StdRegions::FactorMap factors, int coll_phys_offset) override
Check the validity of the supplied factor map.
Definition: BwdTrans.cpp:103
Backward transform operator using sum-factorisation (Hex)
Definition: BwdTrans.cpp:720
Array< OneD, const NekDouble > m_base1
Definition: BwdTrans.cpp:792
void CheckFactors(StdRegions::FactorMap factors, int coll_phys_offset) override
Check the validity of the supplied factor map.
Definition: BwdTrans.cpp:778
Array< OneD, const NekDouble > m_base2
Definition: BwdTrans.cpp:793
Array< OneD, const NekDouble > m_base0
Definition: BwdTrans.cpp:791
BwdTrans_SumFac_Hex(vector< StdRegions::StdExpansionSharedPtr > pCollExp, CoalescedGeomDataSharedPtr pGeomData, StdRegions::FactorMap factors)
Definition: BwdTrans.cpp:799
void operator()(int dir, const Array< OneD, const NekDouble > &input, Array< OneD, NekDouble > &output, Array< OneD, NekDouble > &wsp) final
Definition: BwdTrans.cpp:770
Backward transform operator using sum-factorisation (Prism)
Definition: BwdTrans.cpp:1005
void operator()(int dir, const Array< OneD, const NekDouble > &input, Array< OneD, NekDouble > &output, Array< OneD, NekDouble > &wsp) final
Definition: BwdTrans.cpp:1081
BwdTrans_SumFac_Prism(vector< StdRegions::StdExpansionSharedPtr > pCollExp, CoalescedGeomDataSharedPtr pGeomData, StdRegions::FactorMap factors)
Definition: BwdTrans.cpp:1108
Array< OneD, const NekDouble > m_base0
Definition: BwdTrans.cpp:1102
Array< OneD, const NekDouble > m_base1
Definition: BwdTrans.cpp:1103
void CheckFactors(StdRegions::FactorMap factors, int coll_phys_offset) override
Check the validity of the supplied factor map.
Definition: BwdTrans.cpp:1089
Array< OneD, const NekDouble > m_base2
Definition: BwdTrans.cpp:1104
Backward transform operator using sum-factorisation (Pyr)
Definition: BwdTrans.cpp:1147
Array< OneD, const NekDouble > m_base2
Definition: BwdTrans.cpp:1266
void operator()(int dir, const Array< OneD, const NekDouble > &input, Array< OneD, NekDouble > &output, Array< OneD, NekDouble > &wsp) final
Definition: BwdTrans.cpp:1243
BwdTrans_SumFac_Pyr(vector< StdRegions::StdExpansionSharedPtr > pCollExp, CoalescedGeomDataSharedPtr pGeomData, StdRegions::FactorMap factors)
Definition: BwdTrans.cpp:1270
Array< OneD, const NekDouble > m_base1
Definition: BwdTrans.cpp:1265
Array< OneD, const NekDouble > m_base0
Definition: BwdTrans.cpp:1264
void CheckFactors(StdRegions::FactorMap factors, int coll_phys_offset) override
Check the validity of the supplied factor map.
Definition: BwdTrans.cpp:1251
Backward transform operator using sum-factorisation (Quad)
Definition: BwdTrans.cpp:514
Array< OneD, const NekDouble > m_base1
Definition: BwdTrans.cpp:590
void operator()(int dir, const Array< OneD, const NekDouble > &input, Array< OneD, NekDouble > &output, Array< OneD, NekDouble > &wsp) final
Definition: BwdTrans.cpp:568
Array< OneD, const NekDouble > m_base0
Definition: BwdTrans.cpp:589
BwdTrans_SumFac_Quad(vector< StdRegions::StdExpansionSharedPtr > pCollExp, CoalescedGeomDataSharedPtr pGeomData, StdRegions::FactorMap factors)
Definition: BwdTrans.cpp:593
void CheckFactors(StdRegions::FactorMap factors, int coll_phys_offset) override
Check the validity of the supplied factor map.
Definition: BwdTrans.cpp:576
Backward transform operator using sum-factorisation (Segment)
Definition: BwdTrans.cpp:443
BwdTrans_SumFac_Seg(vector< StdRegions::StdExpansionSharedPtr > pCollExp, CoalescedGeomDataSharedPtr pGeomData, StdRegions::FactorMap factors)
Definition: BwdTrans.cpp:490
Array< OneD, const NekDouble > m_base0
Definition: BwdTrans.cpp:487
void CheckFactors(StdRegions::FactorMap factors, int coll_phys_offset) override
Check the validity of the supplied factor map.
Definition: BwdTrans.cpp:477
void operator()(int dir, const Array< OneD, const NekDouble > &input, Array< OneD, NekDouble > &output, Array< OneD, NekDouble > &wsp) final
Definition: BwdTrans.cpp:469
Backward transform operator using sum-factorisation (Tet)
Definition: BwdTrans.cpp:832
void CheckFactors(StdRegions::FactorMap factors, int coll_phys_offset) override
Check the validity of the supplied factor map.
Definition: BwdTrans.cpp:946
BwdTrans_SumFac_Tet(vector< StdRegions::StdExpansionSharedPtr > pCollExp, CoalescedGeomDataSharedPtr pGeomData, StdRegions::FactorMap factors)
Definition: BwdTrans.cpp:965
Array< OneD, const NekDouble > m_base1
Definition: BwdTrans.cpp:960
Array< OneD, const NekDouble > m_base0
Definition: BwdTrans.cpp:959
void operator()(int dir, const Array< OneD, const NekDouble > &input, Array< OneD, NekDouble > &output, Array< OneD, NekDouble > &wsp) final
Definition: BwdTrans.cpp:938
Array< OneD, const NekDouble > m_base2
Definition: BwdTrans.cpp:961
Backward transform operator using sum-factorisation (Tri)
Definition: BwdTrans.cpp:621
void CheckFactors(StdRegions::FactorMap factors, int coll_phys_offset) override
Check the validity of the supplied factor map.
Definition: BwdTrans.cpp:672
BwdTrans_SumFac_Tri(vector< StdRegions::StdExpansionSharedPtr > pCollExp, CoalescedGeomDataSharedPtr pGeomData, StdRegions::FactorMap factors)
Definition: BwdTrans.cpp:688
Array< OneD, const NekDouble > m_base0
Definition: BwdTrans.cpp:683
Array< OneD, const NekDouble > m_base1
Definition: BwdTrans.cpp:684
void operator()(int dir, const Array< OneD, const NekDouble > &input, Array< OneD, NekDouble > &output, Array< OneD, NekDouble > &wsp) final
Definition: BwdTrans.cpp:664
unsigned int m_nElmtPad
size after padding
Array< OneD, NekDouble > m_input
padded input/output vectors
Base class for operators on a collection of elements.
Definition: Operator.h:133
StdRegions::StdExpansionSharedPtr m_stdExp
Definition: Operator.h:188
unsigned int m_numElmt
number of elements that the operator is applied on
Definition: Operator.h:190
unsigned int m_outputSize
number of modes or quadrature points that are taken as output from an operator
Definition: Operator.h:198
unsigned int m_inputSize
number of modes or quadrature points that are passed as input to an operator
Definition: Operator.h:195
tKey RegisterCreatorFunction(tKey idKey, CreatorFunction classCreator, std::string pDesc="")
Register a class with the factory.
Definition: NekFactory.hpp:197
tBaseSharedPtr CreateInstance(tKey idKey, tParam... args)
Create an instance of the class referred to by idKey.
Definition: NekFactory.hpp:143
static void Dgemm(const char &transa, const char &transb, const int &m, const int &n, const int &k, const double &alpha, const double *a, const int &lda, const double *b, const int &ldb, const double &beta, double *c, const int &ldc)
BLAS level 3: Matrix-matrix multiply C = A x B where op(A)[m x k], op(B)[k x n], C[m x n] DGEMM perfo...
Definition: Blas.hpp:383
static void Daxpy(const int &n, const double &alpha, const double *x, const int &incx, const double *y, const int &incy)
BLAS level 1: y = alpha x plus y.
Definition: Blas.hpp:135
std::tuple< LibUtilities::ShapeType, OperatorType, ImplementationType, ExpansionIsNodal > OperatorKey
Key for describing an Operator.
Definition: Operator.h:115
std::shared_ptr< CoalescedGeomData > CoalescedGeomDataSharedPtr
OperatorFactory & GetOperatorFactory()
Returns the singleton Operator factory object.
Definition: Operator.cpp:44
@ eModified_A
Principle Modified Functions .
Definition: BasisType.h:48
ConstFactorMap FactorMap
Definition: StdRegions.hpp:406
StdRegions::ConstFactorMap factors
std::shared_ptr< DNekMat > DNekMatSharedPtr
Definition: NekTypeDefs.hpp:75
double NekDouble
void Zero(int n, T *x, const int incx)
Zero vector.
Definition: Vmath.hpp:273
void Vcopy(int n, const T *x, const int incx, T *y, const int incy)
Definition: Vmath.hpp:825