doxygen/latest/_vmath_array_8hpp_source.html

///////////////////////////////////////////////////////////////////////////////

//

// File: VmathArray.hpp

//

// For more information, please see: http://www.nektar.info

//

// The MIT License

//

// Copyright (c) 2006 Division of Applied Mathematics, Brown University (USA),

// Department of Aeronautics, Imperial College London (UK), and Scientific

// Computing and Imaging Institute, University of Utah (USA).

//

// Permission is hereby granted, free of charge, to any person obtaining a

// copy of this software and associated documentation files (the "Software"),

// to deal in the Software without restriction, including without limitation

// the rights to use, copy, modify, merge, publish, distribute, sublicense,

// and/or sell copies of the Software, and to permit persons to whom the

// Software is furnished to do so, subject to the following conditions:

//

// The above copyright notice and this permission notice shall be included

// in all copies or substantial portions of the Software.

//

// THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS

// OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,

// FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL

// THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER

// LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING

// FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER

// DEALINGS IN THE SOFTWARE.

//

// Description: Wrappers around Vmath routines using Array<OneD,T> as arguments

//

///////////////////////////////////////////////////////////////////////////////


#ifndef NEKTAR_LIB_LIBUTILITIES_BASSICUTILS_VECTORMATHARRAY_HPP

#define NEKTAR_LIB_LIBUTILITIES_BASSICUTILS_VECTORMATHARRAY_HPP


#include <LibUtilities/BasicUtils/SharedArray.hpp>

#include <LibUtilities/BasicUtils/Vmath.hpp>

#include <LibUtilities/BasicUtils/VmathSIMD.hpp>


namespace Vmath

{

using namespace Nektar;


/***************** Math routines  ***************/

/// \brief Fill a vector with a constant value.
///
/// Array front end: asserts (ASSERTL1) that n * incx does not exceed
/// x.size() + x.GetOffset(), then passes the address of x[0] to the
/// pointer-based Fill overload.
template <class T>
void Fill(int n, const T alpha, Array<OneD, T> &x, const int incx)
{
    ASSERTL1(n * incx <= x.size() + x.GetOffset(), "Out of bounds");

    T *dst = &x[0];
    Fill(n, alpha, dst, incx);
}


/// \brief Fill a vector with white noise.
///
/// Asserts (ASSERTL1) that n * incx does not exceed
/// x.size() + x.GetOffset() and forwards eps, the stride and the seed
/// argument (default 9999) to the pointer-based FillWhiteNoise.
template <class T>
void FillWhiteNoise(int n, const T eps, Array<OneD, T> &x, const int incx,
                    int outseed = 9999)
{
    ASSERTL1(n * incx <= x.size() + x.GetOffset(), "Out of bounds");

    T *dst = &x[0];
    FillWhiteNoise(n, eps, dst, incx, outseed);
}


/// \brief Multiply vector z = x*y
///
/// Each array is checked (ASSERTL1) so that n * inc does not exceed its
/// size() + GetOffset(). Without NEKTAR_ENABLE_SIMD_VMATH the call goes to
/// the strided pointer-based Vmul; with it, all strides are asserted to be
/// 1 and SIMD::Vmul is used (the stride arguments are then otherwise
/// unused, hence [[maybe_unused]]).
template <class T>
void Vmul(int n, const Array<OneD, const T> &x, [[maybe_unused]] const int incx,
          const Array<OneD, const T> &y, [[maybe_unused]] const int incy,
          Array<OneD, T> &z, [[maybe_unused]] const int incz)
{
    ASSERTL1(n * incx <= x.size() + x.GetOffset(), "Array out of bounds");
    ASSERTL1(n * incy <= y.size() + y.GetOffset(), "Array out of bounds");
    ASSERTL1(n * incz <= z.size() + z.GetOffset(), "Array out of bounds");

#ifndef NEKTAR_ENABLE_SIMD_VMATH
    // Generic path: strides are honoured by the pointer routine.
    Vmul(n, &x[0], incx, &y[0], incy, &z[0], incz);
#else
    // SIMD path: the kernel takes no strides, so insist on unit stride.
    ASSERTL1(incx == 1, "Simd vmath requires inc = 1");
    ASSERTL1(incy == 1, "Simd vmath requires inc = 1");
    ASSERTL1(incz == 1, "Simd vmath requires inc = 1");
    SIMD::Vmul(n, &x[0], &y[0], &z[0]);
#endif
}


/// \brief Multiply vector z = x*y, with x given as an
/// Array<TwoD, T>::const_reference.
///
/// x is checked against x.size() only (no offset term) and its data is
/// obtained through x.origin(); y and z are checked against
/// size() + GetOffset(). The product is computed by the pointer-based Vmul.
template <class T>
void Vmul(int n, const typename Array<TwoD, T>::const_reference &x,
          const int incx, const Array<OneD, const T> &y, const int incy,
          Array<OneD, T> &z, const int incz)
{
    ASSERTL1(n * incx <= x.size(), "Array out of bounds");
    ASSERTL1(n * incy <= y.size() + y.GetOffset(), "Array out of bounds");
    ASSERTL1(n * incz <= z.size() + z.GetOffset(), "Array out of bounds");

    const T *rhs = &y[0];
    T *out       = &z[0];
    Vmul(n, x.origin(), incx, rhs, incy, out, incz);
}


/// \brief Scalar multiply y = alpha*x
///
/// Asserts (ASSERTL1) that n * inc, converted to unsigned int, does not
/// exceed size() + GetOffset() of each array, then calls the pointer-based
/// Smul on the addresses of x[0] and y[0].
template <class T>
void Smul(int n, const T alpha, const Array<OneD, const T> &x, const int incx,
          Array<OneD, T> &y, const int incy)
{
    ASSERTL1(static_cast<unsigned int>(n * incx) <= x.size() + x.GetOffset(),
             "Array out of bounds");
    ASSERTL1(static_cast<unsigned int>(n * incy) <= y.size() + y.GetOffset(),
             "Array out of bounds");

    const T *src = &x[0];
    T *dst       = &y[0];
    Smul(n, alpha, src, incx, dst, incy);
}


/// \brief Divide vector z = x/y
///
/// Asserts (ASSERTL1) that n * inc, converted to unsigned int, does not
/// exceed size() + GetOffset() of each array, then calls the pointer-based
/// Vdiv.
template <class T>
void Vdiv(int n, const Array<OneD, const T> &x, const int incx,
          const Array<OneD, const T> &y, const int incy, Array<OneD, T> &z,
          const int incz)
{
    ASSERTL1(static_cast<unsigned int>(n * incx) <= x.size() + x.GetOffset(),
             "Array out of bounds");
    ASSERTL1(static_cast<unsigned int>(n * incy) <= y.size() + y.GetOffset(),
             "Array out of bounds");
    ASSERTL1(static_cast<unsigned int>(n * incz) <= z.size() + z.GetOffset(),
             "Array out of bounds");

    const T *numer = &x[0];
    const T *denom = &y[0];
    T *quot        = &z[0];
    Vdiv(n, numer, incx, denom, incy, quot, incz);
}


/// \brief Scalar divide y = alpha/x
///
/// Asserts (ASSERTL1) that n * inc, converted to unsigned int, does not
/// exceed size() + GetOffset() of each array, then calls the pointer-based
/// Sdiv.
template <class T>
void Sdiv(int n, const T alpha, const Array<OneD, const T> &x, const int incx,
          Array<OneD, T> &y, const int incy)
{
    ASSERTL1(static_cast<unsigned int>(n * incx) <= x.size() + x.GetOffset(),
             "Array out of bounds");
    ASSERTL1(static_cast<unsigned int>(n * incy) <= y.size() + y.GetOffset(),
             "Array out of bounds");

    const T *denom = &x[0];
    T *quot        = &y[0];
    Sdiv(n, alpha, denom, incx, quot, incy);
}


/// \brief Add vector z = x+y
///
/// Each array is checked (ASSERTL1) so that n * inc, converted to unsigned
/// int, does not exceed its size() + GetOffset(). Without
/// NEKTAR_ENABLE_SIMD_VMATH the strided pointer-based Vadd is called; with
/// it, unit strides are asserted and SIMD::Vadd is used.
template <class T>
void Vadd(int n, const Array<OneD, const T> &x, [[maybe_unused]] const int incx,
          const Array<OneD, const T> &y, [[maybe_unused]] const int incy,
          Array<OneD, T> &z, [[maybe_unused]] const int incz)
{
    ASSERTL1(static_cast<unsigned int>(n * incx) <= x.size() + x.GetOffset(),
             "Array out of bounds");
    ASSERTL1(static_cast<unsigned int>(n * incy) <= y.size() + y.GetOffset(),
             "Array out of bounds");
    ASSERTL1(static_cast<unsigned int>(n * incz) <= z.size() + z.GetOffset(),
             "Array out of bounds");

#ifndef NEKTAR_ENABLE_SIMD_VMATH
    // Generic path: strides are honoured by the pointer routine.
    Vadd(n, &x[0], incx, &y[0], incy, &z[0], incz);
#else
    // SIMD path: the kernel takes no strides, so insist on unit stride.
    ASSERTL1(incx == 1, "Simd vmath requires inc = 1");
    ASSERTL1(incy == 1, "Simd vmath requires inc = 1");
    ASSERTL1(incz == 1, "Simd vmath requires inc = 1");
    SIMD::Vadd(n, &x[0], &y[0], &z[0]);
#endif
}


/// \brief Add vector y = alpha + x
///
/// Asserts (ASSERTL1) that n * inc does not exceed size() + GetOffset() of
/// each array, then calls the pointer-based Sadd.
template <class T>
void Sadd(int n, const T alpha, const Array<OneD, const T> &x, const int incx,
          Array<OneD, T> &y, const int incy)
{
    ASSERTL1(n * incx <= x.size() + x.GetOffset(), "Array out of bounds");
    ASSERTL1(n * incy <= y.size() + y.GetOffset(), "Array out of bounds");

    const T *src = &x[0];
    T *dst       = &y[0];
    Sadd(n, alpha, src, incx, dst, incy);
}


/// \brief Subtract vector z = x-y
///
/// Asserts (ASSERTL1) that n * inc does not exceed size() + GetOffset() of
/// each array, then calls the pointer-based Vsub.
template <class T>
void Vsub(int n, const Array<OneD, const T> &x, const int incx,
          const Array<OneD, const T> &y, const int incy, Array<OneD, T> &z,
          const int incz)
{
    ASSERTL1(n * incx <= x.size() + x.GetOffset(), "Array out of bounds");
    ASSERTL1(n * incy <= y.size() + y.GetOffset(), "Array out of bounds");
    ASSERTL1(n * incz <= z.size() + z.GetOffset(), "Array out of bounds");

    const T *minuend    = &x[0];
    const T *subtrahend = &y[0];
    T *diff             = &z[0];
    Vsub(n, minuend, incx, subtrahend, incy, diff, incz);
}


/// \brief Subtract vector y = alpha - x
///
/// Asserts (ASSERTL1) that n * inc does not exceed size() + GetOffset() of
/// each array, then calls the pointer-based Ssub.
template <class T>
void Ssub(int n, const T alpha, const Array<OneD, const T> &x, const int incx,
          Array<OneD, T> &y, const int incy)
{
    ASSERTL1(n * incx <= x.size() + x.GetOffset(), "Array out of bounds");
    ASSERTL1(n * incy <= y.size() + y.GetOffset(), "Array out of bounds");

    const T *src = &x[0];
    T *dst       = &y[0];
    Ssub(n, alpha, src, incx, dst, incy);
}


/// \brief Zero vector
///
/// Asserts (ASSERTL1) that n * incx does not exceed
/// x.size() + x.GetOffset(), then calls the pointer-based Zero.
template <class T>
void Zero(int n, Array<OneD, T> &x, const int incx)
{
    ASSERTL1(n * incx <= x.size() + x.GetOffset(), "Array out of bounds");

    T *dst = &x[0];
    Zero(n, dst, incx);
}


/// \brief Negate x = -x
///
/// Asserts (ASSERTL1) that n * incx does not exceed
/// x.size() + x.GetOffset(), then calls the pointer-based Neg on the
/// storage of x.
template <class T>
void Neg(int n, Array<OneD, T> &x, const int incx)
{
    ASSERTL1(n * incx <= x.size() + x.GetOffset(), "Array out of bounds");

    T *data = &x[0];
    Neg(n, data, incx);
}


/// \brief log y = log(x)
///
/// Asserts (ASSERTL1) that n * inc does not exceed size() + GetOffset() of
/// each array, then calls the pointer-based Vlog.
template <class T>
void Vlog(int n, const Array<OneD, const T> &x, const int incx,
          Array<OneD, T> &y, const int incy)
{
    ASSERTL1(n * incx <= x.size() + x.GetOffset(), "Array out of bounds");
    ASSERTL1(n * incy <= y.size() + y.GetOffset(), "Array out of bounds");

    const T *src = &x[0];
    T *dst       = &y[0];
    Vlog(n, src, incx, dst, incy);
}


/// \brief exp y = exp(x)
///
/// Asserts (ASSERTL1) that n * inc does not exceed size() + GetOffset() of
/// each array, then calls the pointer-based Vexp.
template <class T>
void Vexp(int n, const Array<OneD, const T> &x, const int incx,
          Array<OneD, T> &y, const int incy)
{
    ASSERTL1(n * incx <= x.size() + x.GetOffset(), "Array out of bounds");
    ASSERTL1(n * incy <= y.size() + y.GetOffset(), "Array out of bounds");

    const T *src = &x[0];
    T *dst       = &y[0];
    Vexp(n, src, incx, dst, incy);
}


/// \brief pow y = pow(x, f)
///
/// Asserts (ASSERTL1) that n * inc does not exceed size() + GetOffset() of
/// each array, then calls the pointer-based Vpow with exponent f.
template <class T>
void Vpow(int n, const Array<OneD, const T> &x, const int incx, const T f,
          Array<OneD, T> &y, const int incy)
{
    ASSERTL1(n * incx <= x.size() + x.GetOffset(), "Array out of bounds");
    ASSERTL1(n * incy <= y.size() + y.GetOffset(), "Array out of bounds");

    const T *base = &x[0];
    T *result     = &y[0];
    Vpow(n, base, incx, f, result, incy);
}


/// \brief sqrt y = sqrt(x)
///
/// Asserts (ASSERTL1) that n * inc does not exceed size() + GetOffset() of
/// each array, then calls the pointer-based Vsqrt.
template <class T>
void Vsqrt(int n, const Array<OneD, const T> &x, const int incx,
           Array<OneD, T> &y, const int incy)
{
    ASSERTL1(n * incx <= x.size() + x.GetOffset(), "Array out of bounds");
    ASSERTL1(n * incy <= y.size() + y.GetOffset(), "Array out of bounds");

    const T *src = &x[0];
    T *dst       = &y[0];
    Vsqrt(n, src, incx, dst, incy);
}


/// \brief vabs: y = |x|
///
/// Asserts (ASSERTL1) that n * inc does not exceed size() + GetOffset() of
/// each array, then calls the pointer-based Vabs.
template <class T>
void Vabs(int n, const Array<OneD, const T> &x, const int incx,
          Array<OneD, T> &y, const int incy)
{
    ASSERTL1(n * incx <= x.size() + x.GetOffset(), "Array out of bounds");
    ASSERTL1(n * incy <= y.size() + y.GetOffset(), "Array out of bounds");

    const T *src = &x[0];
    T *dst       = &y[0];
    Vabs(n, src, incx, dst, incy);
}


/********** Triad  routines  ***********************/


/// \brief vvtvp (vector times vector plus vector): z = w*x + y
///
/// Each array is checked (ASSERTL1) so that n * inc does not exceed its
/// size() + GetOffset(). Without NEKTAR_ENABLE_SIMD_VMATH the strided
/// pointer-based Vvtvp is called; with it, unit strides are asserted and
/// SIMD::Vvtvp is used.
template <class T>
void Vvtvp(int n, const Array<OneD, const T> &w,
           [[maybe_unused]] const int incw, const Array<OneD, const T> &x,
           [[maybe_unused]] const int incx, const Array<OneD, const T> &y,
           [[maybe_unused]] const int incy, Array<OneD, T> &z,
           [[maybe_unused]] const int incz)
{
    ASSERTL1(n * incw <= w.size() + w.GetOffset(), "Array out of bounds");
    ASSERTL1(n * incx <= x.size() + x.GetOffset(), "Array out of bounds");
    ASSERTL1(n * incy <= y.size() + y.GetOffset(), "Array out of bounds");
    ASSERTL1(n * incz <= z.size() + z.GetOffset(), "Array out of bounds");

#ifndef NEKTAR_ENABLE_SIMD_VMATH
    // Generic path: strides are honoured by the pointer routine.
    Vvtvp(n, &w[0], incw, &x[0], incx, &y[0], incy, &z[0], incz);
#else
    // SIMD path: the kernel takes no strides, so insist on unit stride.
    ASSERTL1(incw == 1, "Simd vmath requires inc = 1");
    ASSERTL1(incx == 1, "Simd vmath requires inc = 1");
    ASSERTL1(incy == 1, "Simd vmath requires inc = 1");
    ASSERTL1(incz == 1, "Simd vmath requires inc = 1");
    SIMD::Vvtvp(n, &w[0], &x[0], &y[0], &z[0]);
#endif
}


/// \brief Vvtvp (vector times vector plus vector): z = w*x + y, with w
/// given as an Array<TwoD, T>::const_reference.
///
/// w is checked against w.size() only (no offset term) and its data is
/// obtained through w.origin(); x, y and z are checked against
/// size() + GetOffset(). The work is done by the pointer-based Vvtvp.
template <class T>
void Vvtvp(int n, const typename Array<TwoD, T>::const_reference &w,
           const int incw, const Array<OneD, const T> &x, const int incx,
           const Array<OneD, const T> &y, const int incy, Array<OneD, T> &z,
           const int incz)
{
    ASSERTL1(n * incw <= w.size(), "Array out of bounds");
    ASSERTL1(n * incx <= x.size() + x.GetOffset(), "Array out of bounds");
    ASSERTL1(n * incy <= y.size() + y.GetOffset(), "Array out of bounds");
    ASSERTL1(n * incz <= z.size() + z.GetOffset(), "Array out of bounds");

    const T *factor = &x[0];
    const T *addend = &y[0];
    T *out          = &z[0];
    Vvtvp(n, w.origin(), incw, factor, incx, addend, incy, out, incz);
}


/// \brief vvtvm (vector times vector minus vector): z = w*x - y
///
/// Each array is checked (ASSERTL1) so that n * inc does not exceed its
/// size() + GetOffset(). Without NEKTAR_ENABLE_SIMD_VMATH the strided
/// pointer-based Vvtvm is called; with it, unit strides are asserted and
/// SIMD::Vvtvm is used.
template <class T>
void Vvtvm(int n, const Array<OneD, const T> &w,
           [[maybe_unused]] const int incw, const Array<OneD, const T> &x,
           [[maybe_unused]] const int incx, const Array<OneD, const T> &y,
           [[maybe_unused]] const int incy, Array<OneD, T> &z,
           [[maybe_unused]] const int incz)
{
    ASSERTL1(n * incw <= w.size() + w.GetOffset(), "Array out of bounds");
    ASSERTL1(n * incx <= x.size() + x.GetOffset(), "Array out of bounds");
    ASSERTL1(n * incy <= y.size() + y.GetOffset(), "Array out of bounds");
    ASSERTL1(n * incz <= z.size() + z.GetOffset(), "Array out of bounds");

#ifndef NEKTAR_ENABLE_SIMD_VMATH
    // Generic path: strides are honoured by the pointer routine.
    Vvtvm(n, &w[0], incw, &x[0], incx, &y[0], incy, &z[0], incz);
#else
    // SIMD path: the kernel takes no strides, so insist on unit stride.
    ASSERTL1(incw == 1, "Simd vmath requires inc = 1");
    ASSERTL1(incx == 1, "Simd vmath requires inc = 1");
    ASSERTL1(incy == 1, "Simd vmath requires inc = 1");
    ASSERTL1(incz == 1, "Simd vmath requires inc = 1");
    SIMD::Vvtvm(n, &w[0], &x[0], &y[0], &z[0]);
#endif
}


/// \brief svtvp (scalar times vector plus vector): z = alpha*x + y
///
/// Asserts (ASSERTL1) that n * inc does not exceed size() + GetOffset() of
/// each array, then calls the pointer-based Svtvp.
template <class T>
void Svtvp(int n, const T alpha, const Array<OneD, const T> &x, const int incx,
           const Array<OneD, const T> &y, const int incy, Array<OneD, T> &z,
           const int incz)
{
    ASSERTL1(n * incx <= x.size() + x.GetOffset(), "Array out of bounds");
    ASSERTL1(n * incy <= y.size() + y.GetOffset(), "Array out of bounds");
    ASSERTL1(n * incz <= z.size() + z.GetOffset(), "Array out of bounds");

    const T *scaled = &x[0];
    const T *addend = &y[0];
    T *out          = &z[0];
    Svtvp(n, alpha, scaled, incx, addend, incy, out, incz);
}


/// \brief svtvm (scalar times vector minus vector): z = alpha*x - y
///
/// Asserts (ASSERTL1) that n * inc does not exceed size() + GetOffset() of
/// each array, then calls the pointer-based Svtvm.
template <class T>
void Svtvm(int n, const T alpha, const Array<OneD, const T> &x, const int incx,
           const Array<OneD, const T> &y, const int incy, Array<OneD, T> &z,
           const int incz)
{
    ASSERTL1(n * incx <= x.size() + x.GetOffset(), "Array out of bounds");
    ASSERTL1(n * incy <= y.size() + y.GetOffset(), "Array out of bounds");
    ASSERTL1(n * incz <= z.size() + z.GetOffset(), "Array out of bounds");

    const T *scaled     = &x[0];
    const T *subtrahend = &y[0];
    T *out              = &z[0];
    Svtvm(n, alpha, scaled, incx, subtrahend, incy, out, incz);
}


/// \brief vvtvvtp (vector times vector plus vector times vector): z = v*w + x*y
///
/// Each array is checked (ASSERTL1) so that n * inc does not exceed its
/// size() + GetOffset(). Without NEKTAR_ENABLE_SIMD_VMATH the strided
/// pointer-based Vvtvvtp is called. With it, SIMD::Vvtvvtp is used; that
/// kernel takes no stride arguments, so every stride -- including incv --
/// is asserted to be 1.
template <class T>
void Vvtvvtp(int n, const Array<OneD, const T> &v, [[maybe_unused]] int incv,
             const Array<OneD, const T> &w, [[maybe_unused]] int incw,
             const Array<OneD, const T> &x, [[maybe_unused]] int incx,
             const Array<OneD, const T> &y, [[maybe_unused]] int incy,
             Array<OneD, T> &z, [[maybe_unused]] int incz)
{
    ASSERTL1(n * incv <= v.size() + v.GetOffset(), "Array out of bounds");
    ASSERTL1(n * incw <= w.size() + w.GetOffset(), "Array out of bounds");
    ASSERTL1(n * incx <= x.size() + x.GetOffset(), "Array out of bounds");
    ASSERTL1(n * incy <= y.size() + y.GetOffset(), "Array out of bounds");
    ASSERTL1(n * incz <= z.size() + z.GetOffset(), "Array out of bounds");

#ifdef NEKTAR_ENABLE_SIMD_VMATH
    // v is read contiguously by the SIMD kernel just like the other
    // operands, so its stride must be validated as well.
    ASSERTL1(incv == 1, "Simd vmath requires inc = 1");
    ASSERTL1(incw == 1, "Simd vmath requires inc = 1");
    ASSERTL1(incx == 1, "Simd vmath requires inc = 1");
    ASSERTL1(incy == 1, "Simd vmath requires inc = 1");
    ASSERTL1(incz == 1, "Simd vmath requires inc = 1");
    SIMD::Vvtvvtp(n, &v[0], &w[0], &x[0], &y[0], &z[0]);
#else
    Vvtvvtp(n, &v[0], incv, &w[0], incw, &x[0], incx, &y[0], incy, &z[0], incz);
#endif
}


/// \brief vvtvvtm (vector times vector minus vector times vector): z = v*w -
/// x*y
///
/// Each array is checked (ASSERTL1) so that n * inc does not exceed its
/// size() + GetOffset(). Without NEKTAR_ENABLE_SIMD_VMATH the strided
/// pointer-based Vvtvvtm is called. With it, SIMD::Vvtvvtm is used; that
/// kernel takes no stride arguments, so every stride -- including incv --
/// is asserted to be 1.
template <class T>
void Vvtvvtm(int n, const Array<OneD, const T> &v, [[maybe_unused]] int incv,
             const Array<OneD, const T> &w, [[maybe_unused]] int incw,
             const Array<OneD, const T> &x, [[maybe_unused]] int incx,
             const Array<OneD, const T> &y, [[maybe_unused]] int incy,
             Array<OneD, T> &z, [[maybe_unused]] int incz)
{
    ASSERTL1(n * incv <= v.size() + v.GetOffset(), "Array out of bounds");
    ASSERTL1(n * incw <= w.size() + w.GetOffset(), "Array out of bounds");
    ASSERTL1(n * incx <= x.size() + x.GetOffset(), "Array out of bounds");
    ASSERTL1(n * incy <= y.size() + y.GetOffset(), "Array out of bounds");
    ASSERTL1(n * incz <= z.size() + z.GetOffset(), "Array out of bounds");

#ifdef NEKTAR_ENABLE_SIMD_VMATH
    // v is read contiguously by the SIMD kernel just like the other
    // operands, so its stride must be validated as well.
    ASSERTL1(incv == 1, "Simd vmath requires inc = 1");
    ASSERTL1(incw == 1, "Simd vmath requires inc = 1");
    ASSERTL1(incx == 1, "Simd vmath requires inc = 1");
    ASSERTL1(incy == 1, "Simd vmath requires inc = 1");
    ASSERTL1(incz == 1, "Simd vmath requires inc = 1");
    SIMD::Vvtvvtm(n, &v[0], &w[0], &x[0], &y[0], &z[0]);
#else
    Vvtvvtm(n, &v[0], incv, &w[0], incw, &x[0], incx, &y[0], incy, &z[0], incz);
#endif
}


/// \brief svtsvtp (scalar times vector plus scalar times vector):
/// z = alpha*x + beta*y
///
/// Asserts (ASSERTL1) that n * inc does not exceed size() + GetOffset() of
/// each array, then calls the pointer-based Svtsvtp.
template <class T>
void Svtsvtp(int n, const T alpha, const Array<OneD, const T> &x,
             const int incx, const T beta, const Array<OneD, const T> &y,
             const int incy, Array<OneD, T> &z, const int incz)
{
    ASSERTL1(n * incx <= x.size() + x.GetOffset(), "Array out of bounds");
    ASSERTL1(n * incy <= y.size() + y.GetOffset(), "Array out of bounds");
    ASSERTL1(n * incz <= z.size() + z.GetOffset(), "Array out of bounds");

    const T *first  = &x[0];
    const T *second = &y[0];
    T *out          = &z[0];
    Svtsvtp(n, alpha, first, incx, beta, second, incy, out, incz);
}


/************ Misc routine from Veclib (and extras)  ************/


/// \brief Gather vector z[i] = x[y[i]]
///
/// Only enabled for floating-point T and integral I. Asserts (ASSERTL1)
/// that n does not exceed size() + GetOffset() of the index array y and of
/// the output z; x is not checked here. Calls SIMD::Gathr when
/// NEKTAR_ENABLE_SIMD_VMATH is defined and the pointer-based Gathr
/// otherwise.
template <class T, class I,
          typename = std::enable_if_t<std::is_floating_point_v<T> &&
                                      std::is_integral_v<I>>>
void Gathr(I n, const Array<OneD, const T> &x, const Array<OneD, I> &y,
           Array<OneD, T> &z)
{
    ASSERTL1(n <= y.size() + y.GetOffset(), "Array out of bounds");
    ASSERTL1(n <= z.size() + z.GetOffset(), "Array out of bounds");

#ifndef NEKTAR_ENABLE_SIMD_VMATH
    Gathr(n, &x[0], &y[0], &z[0]);
#else
    SIMD::Gathr(n, &x[0], &y[0], &z[0]);
#endif
}


/// \brief Scatter vector z[y[i]] = x[i]
///
/// Asserts (ASSERTL1) that n does not exceed size() + GetOffset() of x and
/// of the index array y; z is not checked here. Calls the pointer-based
/// Scatr.
template <class T>
void Scatr(int n, const Array<OneD, const T> &x,
           const Array<OneD, const int> &y, Array<OneD, T> &z)
{
    ASSERTL1(n <= x.size() + x.GetOffset(), "Array out of bounds");
    ASSERTL1(n <= y.size() + y.GetOffset(), "Array out of bounds");

    const T *values    = &x[0];
    const int *indices = &y[0];
    T *target          = &z[0];
    Scatr(n, values, indices, target);
}


/// \brief Assemble z[y[i]] += x[i]; z should be zero'd first
///
/// Asserts (ASSERTL1) that n does not exceed size() + GetOffset() of x and
/// of the index array y; z is not checked here. Calls the pointer-based
/// Assmb.
template <class T>
void Assmb(int n, const Array<OneD, T> &x, const Array<OneD, int> &y,
           Array<OneD, T> &z)
{
    ASSERTL1(n <= x.size() + x.GetOffset(), "Array out of bounds");
    ASSERTL1(n <= y.size() + y.GetOffset(), "Array out of bounds");

    // auto keeps whatever pointer constness operator[] yields here.
    auto *values  = &x[0];
    auto *indices = &y[0];
    auto *target  = &z[0];
    Assmb(n, values, indices, target);
}


/************* Reduction routines  *****************/


/// \brief Return sum(x)
///
/// Asserts (ASSERTL1) that n * incx does not exceed
/// x.size() + x.GetOffset() and returns the result of the pointer-based
/// Vsum.
template <class T>
T Vsum(int n, const Array<OneD, const T> &x, const int incx)
{
    ASSERTL1(n * incx <= x.size() + x.GetOffset(), "Array out of bounds");

    const T *data = &x[0];
    return Vsum(n, data, incx);
}


/// \brief Return the index of the maximum element in x
///
/// Asserts (ASSERTL1) that n * incx does not exceed
/// x.size() + x.GetOffset() and returns the result of the pointer-based
/// Imax.
template <class T>
int Imax(int n, const Array<OneD, const T> &x, const int incx)
{
    ASSERTL1(n * incx <= x.size() + x.GetOffset(), "Array out of bounds");

    const T *data = &x[0];
    return Imax(n, data, incx);
}


/// \brief Return the maximum element in x -- called vmax to avoid
/// conflict with max
///
/// Asserts (ASSERTL1) that n * incx does not exceed
/// x.size() + x.GetOffset() and returns the result of the pointer-based
/// Vmax.
template <class T>
T Vmax(int n, const Array<OneD, const T> &x, const int incx)
{
    ASSERTL1(n * incx <= x.size() + x.GetOffset(), "Array out of bounds");

    const T *data = &x[0];
    return Vmax(n, data, incx);
}


/// \brief Return the index of the maximum absolute element in x
///
/// Asserts (ASSERTL1) that n * incx does not exceed
/// x.size() + x.GetOffset() and returns the result of the pointer-based
/// Iamax.
template <class T>
int Iamax(int n, const Array<OneD, const T> &x, const int incx)
{
    ASSERTL1(n * incx <= x.size() + x.GetOffset(), "Array out of bounds");

    const T *data = &x[0];
    return Iamax(n, data, incx);
}


/// \brief Return the maximum absolute element in x
/// called vamax to avoid conflict with max
///
/// Asserts (ASSERTL1) that n * incx does not exceed
/// x.size() + x.GetOffset() and returns the result of the pointer-based
/// Vamax.
template <class T>
T Vamax(int n, const Array<OneD, const T> &x, const int incx)
{
    ASSERTL1(n * incx <= x.size() + x.GetOffset(), "Array out of bounds");

    const T *data = &x[0];
    return Vamax(n, data, incx);
}


/// \brief Return the index of the minimum element in x
///
/// Asserts (ASSERTL1) that n * incx does not exceed
/// x.size() + x.GetOffset() and returns the result of the pointer-based
/// Imin.
template <class T>
int Imin(int n, const Array<OneD, const T> &x, const int incx)
{
    ASSERTL1(n * incx <= x.size() + x.GetOffset(), "Array out of bounds");

    const T *data = &x[0];
    return Imin(n, data, incx);
}


/// \brief Return the minimum element in x - called vmin to avoid
/// conflict with min
///
/// Asserts (ASSERTL1) that n * incx does not exceed
/// x.size() + x.GetOffset() and returns the result of the pointer-based
/// Vmin.
template <class T>
T Vmin(int n, const Array<OneD, const T> &x, const int incx)
{
    ASSERTL1(n * incx <= x.size() + x.GetOffset(), "Array out of bounds");

    const T *data = &x[0];
    return Vmin(n, data, incx);
}


/// \brief Return number of NaN elements of x
///
/// Asserts (ASSERTL1) that n * incx does not exceed
/// x.size() + x.GetOffset() and returns the result of the pointer-based
/// Nnan.
template <class T>
int Nnan(int n, const Array<OneD, const T> &x, const int incx)
{
    ASSERTL1(n * incx <= x.size() + x.GetOffset(), "Array out of bounds");

    const T *data = &x[0];
    return Nnan(n, data, incx);
}


/// \brief dot product
///
/// Stride-free overload: asserts (ASSERTL1) that n does not exceed
/// size() + GetOffset() of w and of x, then returns the result of the
/// pointer-based Dot.
template <class T>
T Dot(int n, const Array<OneD, const T> &w, const Array<OneD, const T> &x)
{
    ASSERTL1(n <= w.size() + w.GetOffset(), "Array out of bounds");
    ASSERTL1(n <= x.size() + x.GetOffset(), "Array out of bounds");

    const T *lhs = &w[0];
    const T *rhs = &x[0];
    return Dot(n, lhs, rhs);
}


/// \brief dot product
///
/// Strided overload: asserts (ASSERTL1) that n * inc does not exceed
/// size() + GetOffset() of w and of x, then returns the result of the
/// strided pointer-based Dot.
template <class T>
T Dot(int n, const Array<OneD, const T> &w, const int incw,
      const Array<OneD, const T> &x, const int incx)
{
    ASSERTL1(n * incw <= w.size() + w.GetOffset(), "Array out of bounds");
    ASSERTL1(n * incx <= x.size() + x.GetOffset(), "Array out of bounds");

    const T *lhs = &w[0];
    const T *rhs = &x[0];
    return Dot(n, lhs, incw, rhs, incx);
}


/// \brief dot product
///
/// Variant taking an additional integer array y. Asserts (ASSERTL1) that n
/// does not exceed size() + GetOffset() of w, x and y, then returns the
/// result of the pointer-based Dot2 (see that routine for how y enters the
/// sum).
template <class T>
T Dot2(int n, const Array<OneD, const T> &w, const Array<OneD, const T> &x,
       const Array<OneD, const int> &y)
{
    ASSERTL1(n <= w.size() + w.GetOffset(), "Array out of bounds");
    ASSERTL1(n <= x.size() + x.GetOffset(), "Array out of bounds");
    ASSERTL1(n <= y.size() + y.GetOffset(), "Array out of bounds");

    const T *lhs     = &w[0];
    const T *rhs     = &x[0];
    const int *third = &y[0];
    return Dot2(n, lhs, rhs, third);
}


/// \brief dot product
///
/// Strided variant taking an additional integer array y. Asserts (ASSERTL1)
/// that n * inc does not exceed size() + GetOffset() of w, x and y, then
/// returns the result of the strided pointer-based Dot2.
template <class T>
T Ddot(int n, const Array<OneD, const T> &w, const int incw,
       const Array<OneD, const T> &x, const int incx,
       const Array<OneD, const int> &y, const int incy)
{
    ASSERTL1(n * incw <= w.size() + w.GetOffset(), "Array out of bounds");
    ASSERTL1(n * incx <= x.size() + x.GetOffset(), "Array out of bounds");
    ASSERTL1(n * incy <= y.size() + y.GetOffset(), "Array out of bounds");

    const T *lhs     = &w[0];
    const T *rhs     = &x[0];
    const int *third = &y[0];
    return Dot2(n, lhs, incw, rhs, incx, third, incy);
}


/********** Memory routines  ***********************/


/// \brief copy one vector to another
///
/// Asserts (ASSERTL1) that |n * inc|, converted to unsigned int, does not
/// exceed size() + GetOffset() of each array -- the absolute value is taken
/// before the comparison -- then calls the pointer-based Vcopy.
template <class T>
void Vcopy(int n, const Array<OneD, const T> &x, int incx, Array<OneD, T> &y,
           int const incy)
{
    ASSERTL1(static_cast<unsigned int>(std::abs(n * incx)) <=
                 x.size() + x.GetOffset(),
             "Array out of bounds");
    ASSERTL1(static_cast<unsigned int>(std::abs(n * incy)) <=
                 y.size() + y.GetOffset(),
             "Array out of bounds");

    const T *src = &x[0];
    T *dst       = &y[0];
    Vcopy(n, src, incx, dst, incy);
}


/// \brief reverse the ordering of a vector into another
///
/// Asserts (ASSERTL1) that |n * inc|, converted to unsigned int, does not
/// exceed size() + GetOffset() of each array, then calls the pointer-based
/// Reverse.
template <class T>
void Reverse(int n, const Array<OneD, const T> &x, int incx, Array<OneD, T> &y,
             int const incy)
{
    ASSERTL1(static_cast<unsigned int>(std::abs(n * incx)) <=
                 x.size() + x.GetOffset(),
             "Array out of bounds");
    ASSERTL1(static_cast<unsigned int>(std::abs(n * incy)) <=
                 y.size() + y.GetOffset(),
             "Array out of bounds");

    const T *src = &x[0];
    T *dst       = &y[0];
    Reverse(n, src, incx, dst, incy);
}


} // namespace Vmath

#endif // NEKTAR_LIB_LIBUTILITIES_BASSICUTILS_VECTORMATHARRAY_HPP

SharedArray.hpp

ASSERTL1
#define ASSERTL1(condition, msg)
Assert Level 1 – Debugging which is used whether in FULLDEBUG or DEBUG compilation mode....
Definition: ErrorUtil.hpp:242

Vmath.hpp

VmathSIMD.hpp

Nektar::Array
Definition: BasicUtils/SharedArray.hpp:57

Nektar::LibUtilities::beta
@ beta
Gauss Radau pinned at x=-1,.
Definition: PointsType.h:59

Nektar::UnitTests::w
std::vector< double > w(NPUPPER)

Nektar::UnitTests::z
std::vector< double > z(NPUPPER)

Nektar
Definition: CoupledSolver.h:2

Vmath::SIMD::Vvtvp
void Vvtvp(const size_t n, const T *w, const T *x, const T *y, T *z)
vvtvp (vector times vector plus vector): z = w*x + y
Definition: VmathSIMD.hpp:259

Vmath::SIMD::Vadd
void Vadd(const size_t n, const T *x, const T *y, T *z)
Add vector z = x + y.
Definition: VmathSIMD.hpp:47

Vmath::SIMD::Vvtvm
void Vvtvm(const size_t n, const T *w, const T *x, const T *y, T *z)
vvtvm (vector times vector minus vector): z = w*x - y
Definition: VmathSIMD.hpp:307

Vmath::SIMD::Vvtvvtm
void Vvtvvtm(const size_t n, const T *v, const T *w, const T *x, const T *y, T *z)
vvtvvtm (vector times vector minus vector times vector):
Definition: VmathSIMD.hpp:414

Vmath::SIMD::Gathr
void Gathr(const I n, const T *x, const I *y, T *z)
Gather vector z[i] = x[y[i]].
Definition: VmathSIMD.hpp:472

Vmath::SIMD::Vvtvvtp
void Vvtvvtp(const size_t n, const T *v, const T *w, const T *x, const T *y, T *z)
vvtvvtp (vector times vector plus vector times vector):
Definition: VmathSIMD.hpp:356

Vmath::SIMD::Vmul
void Vmul(const size_t n, const T *x, const T *y, T *z)
Multiply vector z = x * y.
Definition: VmathSIMD.hpp:153

Vmath
Definition: Vmath.cpp:38

Vmath::Vsqrt
void Vsqrt(int n, const T *x, const int incx, T *y, const int incy)
sqrt y = sqrt(x)
Definition: Vmath.hpp:340

Vmath::Ssub
void Ssub(int n, const T alpha, const T *x, const int incx, T *y, const int incy)
Subtract vector y = alpha - x.
Definition: Vmath.hpp:248

Vmath::Svtsvtp
void Svtsvtp(int n, const T alpha, const T *x, int incx, const T beta, const T *y, int incy, T *z, int incz)
Svtsvtp (scalar times vector plus scalar times vector):
Definition: Vmath.hpp:473

Vmath::Vmul
void Vmul(int n, const T *x, const int incx, const T *y, const int incy, T *z, const int incz)
Multiply vector z = x*y.
Definition: Vmath.hpp:72

Vmath::Gathr
void Gathr(I n, const T *x, const I *y, T *z)
Gather vector z[i] = x[y[i]].
Definition: Vmath.hpp:507

Vmath::Vlog
void Vlog(int n, const T *x, const int incx, T *y, const int incy)
log y = log(x)
Definition: Vmath.hpp:303

Vmath::Vexp
void Vexp(int n, const T *x, const int incx, T *y, const int incy)
exp y = exp(x)
Definition: Vmath.hpp:315

Vmath::Svtvp
void Svtvp(int n, const T alpha, const T *x, const int incx, const T *y, const int incy, T *z, const int incz)
Svtvp (scalar times vector plus vector): z = alpha*x + y.
Definition: Vmath.hpp:396

Vmath::Vabs
void Vabs(int n, const T *x, const int incx, T *y, const int incy)
vabs: y = |x|
Definition: Vmath.hpp:352

Vmath::Dot2
T Dot2(int n, const T *w, const T *x, const int *y)
dot product
Definition: Vmath.hpp:790

Vmath::Neg
void Neg(int n, T *x, const int incx)
Negate x = -x.
Definition: Vmath.hpp:292

Vmath::Vmin
T Vmin(int n, const T *x, const int incx)
Return the minimum element in x - called vmin to avoid conflict with min.
Definition: Vmath.hpp:725

Vmath::Ddot
T Ddot(int n, const Array< OneD, const T > &w, const int incw, const Array< OneD, const T > &x, const int incx, const Array< OneD, const int > &y, const int incy)
dot product
Definition: VmathArray.hpp:577

Vmath::Vvtvp
void Vvtvp(int n, const T *w, const int incw, const T *x, const int incx, const T *y, const int incy, T *z, const int incz)
vvtvp (vector times vector plus vector): z = w*x + y
Definition: Vmath.hpp:366

Vmath::Vsum
T Vsum(int n, const T *x, const int incx)
Return sum(x)
Definition: Vmath.hpp:608

Vmath::Scatr
void Scatr(int n, const T *x, const int *y, T *z)
Scatter vector z[y[i]] = x[i].
Definition: Vmath.hpp:539

Vmath::Dot
T Dot(int n, const T *w, const T *x)
dot product
Definition: Vmath.hpp:761

Vmath::Assmb
void Assmb(int n, const T *x, const int *y, T *z)
Assemble z[y[i]] += x[i]; z should be zero'd first.
Definition: Vmath.hpp:577

Vmath::Svtvm
void Svtvm(int n, const T alpha, const T *x, const int incx, const T *y, const int incy, T *z, const int incz)
Svtvm (scalar times vector minus vector): z = alpha*x - y.
Definition: Vmath.hpp:424

Vmath::Vadd
void Vadd(int n, const T *x, const int incx, const T *y, const int incy, T *z, const int incz)
Add vector z = x+y.
Definition: Vmath.hpp:180

Vmath::Vvtvm
void Vvtvm(int n, const T *w, const int incw, const T *x, const int incx, const T *y, const int incy, T *z, const int incz)
vvtvm (vector times vector minus vector): z = w*x - y
Definition: Vmath.hpp:381

Vmath::Vvtvvtm
void Vvtvvtm(int n, const T *v, int incv, const T *w, int incw, const T *x, int incx, const T *y, int incy, T *z, int incz)
vvtvvtm (vector times vector minus vector times vector):
Definition: Vmath.hpp:456

Vmath::Smul
void Smul(int n, const T alpha, const T *x, const int incx, T *y, const int incy)
Scalar multiply y = alpha*x.
Definition: Vmath.hpp:100

Vmath::Sdiv
void Sdiv(int n, const T alpha, const T *x, const int incx, T *y, const int incy)
Scalar multiply y = alpha/x.
Definition: Vmath.hpp:154

Vmath::Imax
int Imax(int n, const T *x, const int incx)
Return the index of the maximum element in x.
Definition: Vmath.hpp:623

Vmath::Vdiv
void Vdiv(int n, const T *x, const int incx, const T *y, const int incy, T *z, const int incz)
Multiply vector z = x/y.
Definition: Vmath.hpp:126

Vmath::Imin
int Imin(int n, const T *x, const int incx)
Return the index of the minimum element in x.
Definition: Vmath.hpp:704

Vmath::Zero
void Zero(int n, T *x, const int incx)
Zero vector.
Definition: Vmath.hpp:273

Vmath::Fill
void Fill(int n, const T alpha, T *x, const int incx)
Fill a vector with a constant value.
Definition: Vmath.hpp:54

Vmath::FillWhiteNoise
void FillWhiteNoise(int n, const T eps, T *x, const int incx, int outseed)
Fills a vector with white noise.
Definition: Vmath.cpp:154

Vmath::Nnan
int Nnan(int n, const T *x, const int incx)
Return number of NaN elements of x.
Definition: Vmath.hpp:743

Vmath::Vamax
T Vamax(int n, const T *x, const int incx)
Return the maximum absolute element in x called vamax to avoid conflict with max.
Definition: Vmath.hpp:685

Vmath::Sadd
void Sadd(int n, const T alpha, const T *x, const int incx, T *y, const int incy)
Add vector y = alpha + x.
Definition: Vmath.hpp:194

Vmath::Reverse
void Reverse(int n, const T *x, const int incx, T *y, const int incy)
Definition: Vmath.hpp:844

Vmath::Vmax
T Vmax(int n, const T *x, const int incx)
Return the maximum element in x – called vmax to avoid conflict with max.
Definition: Vmath.hpp:644

Vmath::Vvtvvtp
void Vvtvvtp(int n, const T *v, int incv, const T *w, int incw, const T *x, int incx, const T *y, int incy, T *z, int incz)
vvtvvtp (vector times vector plus vector times vector):
Definition: Vmath.hpp:439

Vmath::Vcopy
void Vcopy(int n, const T *x, const int incx, T *y, const int incy)
Definition: Vmath.hpp:825

Vmath::Vsub
void Vsub(int n, const T *x, const int incx, const T *y, const int incy, T *z, const int incz)
Subtract vector z = x-y.
Definition: Vmath.hpp:220

Vmath::Vpow
void Vpow(int n, const T *x, const int incx, const T f, T *y, const int incy)
pow y = pow(x, f)
Definition: Vmath.hpp:327

Vmath::Iamax
int Iamax(int n, const T *x, const int incx)
Return the index of the maximum absolute element in x.
Definition: Vmath.hpp:662

tinysimd::abs
scalarT< T > abs(scalarT< T > in)
Definition: scalar.hpp:289