doxygen/html/m256_8hpp_source.html

// Copyright (c) 2010-2024, Lawrence Livermore National Security, LLC. Produced

// at the Lawrence Livermore National Laboratory. All Rights reserved. See files

// LICENSE and NOTICE for details. LLNL-CODE-806117.

//

// This file is part of the MFEM library. For more information and source code

// availability visit https://mfem.org.

//

// MFEM is free software; you can redistribute it and/or modify it under the

// terms of the BSD-3 license. We welcome feedback and contributions, see file

// CONTRIBUTING.md for details.


#ifndef MFEM_SIMD_M256_HPP

#define MFEM_SIMD_M256_HPP


#ifdef __AVX__


#include "../../config/tconfig.hpp"

#if defined(__x86_64__)

#include <x86intrin.h>

#else // assuming MSVC with _M_X64 or _M_IX86

#include <intrin.h>

#endif


namespace mfem

{


// Declaration of the generic AutoSIMD class template (parameters, in the order
// used by the specialization in this header: scalar type, number of lanes,
// alignment in bytes). Only declared here so it can be specialized below.
template <typename, int, int> struct AutoSIMD;


/** @brief Specialization of AutoSIMD for four doubles stored in one 256-bit
    AVX register.

    The anonymous union exposes the same 32 bytes both as the intrinsic vector
    type (@a m256d), used by all arithmetic, and as a plain array (@a vec),
    used for per-lane access through operator[]. All arithmetic is lane-wise;
    every overload that takes a @c double broadcasts that scalar to all four
    lanes first.

    @note Lane access reads @a vec after @a m256d was written (and vice versa),
    i.e. it relies on the compiler supporting type punning through a union. */
template <> struct AutoSIMD<double,4,32>
{
   typedef double scalar_type;
   static constexpr int size = 4;          ///< Number of lanes.
   static constexpr int align_bytes = 32;  ///< Alignment template argument.

   union
   {
      __m256d m256d;     ///< Vector view of the four lanes.
      double vec[size];  ///< Per-lane view of the same storage.
   };

   /// Defaulted: default-initialization leaves the lanes indeterminate.
   AutoSIMD() = default;

   AutoSIMD(const AutoSIMD &) = default;

   /// Mutable access to lane @a i; no bounds checking is performed.
   inline MFEM_ALWAYS_INLINE double &operator[](int i)
   {
      return vec[i];
   }

   /// Read-only access to lane @a i; no bounds checking is performed.
   inline MFEM_ALWAYS_INLINE const double &operator[](int i) const
   {
      return vec[i];
   }

   /// Copy all four lanes from @a v.
   inline MFEM_ALWAYS_INLINE AutoSIMD &operator=(const AutoSIMD &v)
   {
      m256d = v.m256d;
      return *this;
   }

   /// Set every lane to the scalar @a e.
   inline MFEM_ALWAYS_INLINE AutoSIMD &operator=(const double &e)
   {
      m256d = _mm256_set1_pd(e);
      return *this;
   }

   /// @name In-place lane-wise arithmetic; each returns *this.
   ///@{
   inline MFEM_ALWAYS_INLINE AutoSIMD &operator+=(const AutoSIMD &v)
   {
      m256d = _mm256_add_pd(m256d,v.m256d);
      return *this;
   }

   inline MFEM_ALWAYS_INLINE AutoSIMD &operator+=(const double &e)
   {
      m256d = _mm256_add_pd(m256d,_mm256_set1_pd(e));
      return *this;
   }

   inline MFEM_ALWAYS_INLINE AutoSIMD &operator-=(const AutoSIMD &v)
   {
      m256d = _mm256_sub_pd(m256d,v.m256d);
      return *this;
   }

   inline MFEM_ALWAYS_INLINE AutoSIMD &operator-=(const double &e)
   {
      m256d = _mm256_sub_pd(m256d,_mm256_set1_pd(e));
      return *this;
   }

   inline MFEM_ALWAYS_INLINE AutoSIMD &operator*=(const AutoSIMD &v)
   {
      m256d = _mm256_mul_pd(m256d,v.m256d);
      return *this;
   }

   inline MFEM_ALWAYS_INLINE AutoSIMD &operator*=(const double &e)
   {
      m256d = _mm256_mul_pd(m256d,_mm256_set1_pd(e));
      return *this;
   }

   inline MFEM_ALWAYS_INLINE AutoSIMD &operator/=(const AutoSIMD &v)
   {
      m256d = _mm256_div_pd(m256d,v.m256d);
      return *this;
   }

   inline MFEM_ALWAYS_INLINE AutoSIMD &operator/=(const double &e)
   {
      m256d = _mm256_div_pd(m256d,_mm256_set1_pd(e));
      return *this;
   }
   ///@}

   /// Lane-wise negation.
   inline MFEM_ALWAYS_INLINE AutoSIMD operator-() const
   {
      AutoSIMD r;
      // XOR with -0.0 toggles only the sign bit of every lane.
      r.m256d = _mm256_xor_pd(_mm256_set1_pd(-0.0), m256d);
      return r;
   }

   /// Unary plus: returns a copy of *this.
   inline MFEM_ALWAYS_INLINE AutoSIMD operator+() const
   {
      return *this;
   }

   /// @name Lane-wise binary arithmetic with *this as the left operand.
   ///@{
   inline MFEM_ALWAYS_INLINE AutoSIMD operator+(const AutoSIMD &v) const
   {
      AutoSIMD r;
      r.m256d = _mm256_add_pd(m256d,v.m256d);
      return r;
   }

   inline MFEM_ALWAYS_INLINE AutoSIMD operator+(const double &e) const
   {
      AutoSIMD r;
      r.m256d = _mm256_add_pd(m256d, _mm256_set1_pd(e));
      return r;
   }

   inline MFEM_ALWAYS_INLINE AutoSIMD operator-(const AutoSIMD &v) const
   {
      AutoSIMD r;
      r.m256d = _mm256_sub_pd(m256d,v.m256d);
      return r;
   }

   inline MFEM_ALWAYS_INLINE AutoSIMD operator-(const double &e) const
   {
      AutoSIMD r;
      r.m256d = _mm256_sub_pd(m256d, _mm256_set1_pd(e));
      return r;
   }

   inline MFEM_ALWAYS_INLINE AutoSIMD operator*(const AutoSIMD &v) const
   {
      AutoSIMD r;
      r.m256d = _mm256_mul_pd(m256d,v.m256d);
      return r;
   }

   inline MFEM_ALWAYS_INLINE AutoSIMD operator*(const double &e) const
   {
      AutoSIMD r;
      r.m256d = _mm256_mul_pd(m256d, _mm256_set1_pd(e));
      return r;
   }

   inline MFEM_ALWAYS_INLINE AutoSIMD operator/(const AutoSIMD &v) const
   {
      AutoSIMD r;
      r.m256d = _mm256_div_pd(m256d,v.m256d);
      return r;
   }

   inline MFEM_ALWAYS_INLINE AutoSIMD operator/(const double &e) const
   {
      AutoSIMD r;
      r.m256d = _mm256_div_pd(m256d, _mm256_set1_pd(e));
      return r;
   }
   ///@}

   /// Lane-wise a*b + c; implementation helper shared by the fma() overloads.
   /** A fused multiply-add is emitted only when the compiler reports that the
       FMA extension is enabled. FMA is a separate ISA extension from AVX2, so
       keying on __AVX2__ alone fails to build with AVX2 enabled but FMA
       disabled, and never uses FMA on AVX-only targets that do have it. MSVC
       does not define __FMA__, so for that compiler __AVX2__ (/arch:AVX2) is
       kept as the indicator. Otherwise a separate multiply and add is used. */
   static inline MFEM_ALWAYS_INLINE
   __m256d MulAdd(const __m256d &a, const __m256d &b, const __m256d &c)
   {
#if defined(__FMA__) || \
    (defined(_MSC_VER) && !defined(__clang__) && defined(__AVX2__))
      return _mm256_fmadd_pd(a,b,c);
#else
      return _mm256_add_pd(_mm256_mul_pd(a,b),c);
#endif
   }

   /// In-place multiply-add: *this += v*w (lane-wise). Returns *this.
   inline MFEM_ALWAYS_INLINE AutoSIMD &fma(const AutoSIMD &v, const AutoSIMD &w)
   {
      m256d = MulAdd(w.m256d,v.m256d,m256d);
      return *this;
   }

   /// In-place multiply-add: *this += v*e, with @a e broadcast to all lanes.
   inline MFEM_ALWAYS_INLINE AutoSIMD &fma(const AutoSIMD &v, const double &e)
   {
      m256d = MulAdd(_mm256_set1_pd(e),v.m256d,m256d);
      return *this;
   }

   /// In-place multiply-add: *this += e*v, with @a e broadcast to all lanes.
   inline MFEM_ALWAYS_INLINE AutoSIMD &fma(const double &e, const AutoSIMD &v)
   {
      m256d = MulAdd(v.m256d,_mm256_set1_pd(e),m256d);
      return *this;
   }

   /// Overwrite *this with the lane-wise product v*w. Returns *this.
   inline MFEM_ALWAYS_INLINE AutoSIMD &mul(const AutoSIMD &v, const AutoSIMD &w)
   {
      m256d = _mm256_mul_pd(v.m256d,w.m256d);
      return *this;
   }

   /// Overwrite *this with v*e, with @a e broadcast to all lanes.
   inline MFEM_ALWAYS_INLINE AutoSIMD &mul(const AutoSIMD &v, const double &e)
   {
      m256d = _mm256_mul_pd(v.m256d,_mm256_set1_pd(e));
      return *this;
   }

   /// Overwrite *this with e*v, with @a e broadcast to all lanes.
   inline MFEM_ALWAYS_INLINE AutoSIMD &mul(const double &e, const AutoSIMD &v)
   {
      m256d = _mm256_mul_pd(_mm256_set1_pd(e),v.m256d);
      return *this;
   }
};


/// Scalar-plus-vector: returns a vector whose lane i holds e + v[i].
inline MFEM_ALWAYS_INLINE
AutoSIMD<double,4,32> operator+(const double &e,
                                const AutoSIMD<double,4,32> &v)
{
   AutoSIMD<double,4,32> sum;
   sum = e;    // broadcast the scalar into all four lanes (left operand)
   sum += v;   // lane-wise add with v as the right operand
   return sum;
}


/// Scalar-minus-vector: returns a vector whose lane i holds e - v[i].
inline MFEM_ALWAYS_INLINE
AutoSIMD<double,4,32> operator-(const double &e,
                                const AutoSIMD<double,4,32> &v)
{
   AutoSIMD<double,4,32> diff;
   diff = e;    // broadcast the scalar into all four lanes (minuend)
   diff -= v;   // lane-wise subtract v (subtrahend)
   return diff;
}


/// Scalar-times-vector: returns a vector whose lane i holds e * v[i].
inline MFEM_ALWAYS_INLINE
AutoSIMD<double,4,32> operator*(const double &e,
                                const AutoSIMD<double,4,32> &v)
{
   AutoSIMD<double,4,32> prod;
   prod = e;    // broadcast the scalar into all four lanes (left factor)
   prod *= v;   // lane-wise multiply with v as the right factor
   return prod;
}


/// Scalar-over-vector: returns a vector whose lane i holds e / v[i].
inline MFEM_ALWAYS_INLINE
AutoSIMD<double,4,32> operator/(const double &e,
                                const AutoSIMD<double,4,32> &v)
{
   AutoSIMD<double,4,32> quot;
   quot = e;    // broadcast the scalar into all four lanes (dividend)
   quot /= v;   // lane-wise divide by v (divisor)
   return quot;
}


} // namespace mfem


#endif // __AVX__


#endif // MFEM_SIMD_M256_HPP

mfem
Definition: CodeDocumentation.dox:1

mfem::operator*
MemoryClass operator*(MemoryClass mc1, MemoryClass mc2)
Return a suitable MemoryClass from a pair of MemoryClasses.
Definition: mem_manager.cpp:130

mfem::operator+
MFEM_ALWAYS_INLINE AutoSIMD< scalar_t, S, A > operator+(const scalar_t &e, const AutoSIMD< scalar_t, S, A > &v)
Definition: auto.hpp:238

mfem::operator-
MFEM_ALWAYS_INLINE AutoSIMD< scalar_t, S, A > operator-(const scalar_t &e, const AutoSIMD< scalar_t, S, A > &v)
Definition: auto.hpp:249

mfem::operator/
MFEM_ALWAYS_INLINE AutoSIMD< scalar_t, S, A > operator/(const scalar_t &e, const AutoSIMD< scalar_t, S, A > &v)
Definition: auto.hpp:271

mfem::AutoSIMD< double, 4, 32 >::operator=
MFEM_ALWAYS_INLINE AutoSIMD & operator=(const double &e)
Definition: m256.hpp:61

mfem::AutoSIMD< double, 4, 32 >::operator*
MFEM_ALWAYS_INLINE AutoSIMD operator*(const double &e) const
Definition: m256.hpp:162

mfem::AutoSIMD< double, 4, 32 >::operator[]
MFEM_ALWAYS_INLINE const double & operator[](int i) const
Definition: m256.hpp:50

mfem::AutoSIMD< double, 4, 32 >::fma
MFEM_ALWAYS_INLINE AutoSIMD & fma(const double &e, const AutoSIMD &v)
Definition: m256.hpp:203

mfem::AutoSIMD< double, 4, 32 >::operator/
MFEM_ALWAYS_INLINE AutoSIMD operator/(const AutoSIMD &v) const
Definition: m256.hpp:169

mfem::AutoSIMD< double, 4, 32 >::operator/
MFEM_ALWAYS_INLINE AutoSIMD operator/(const double &e) const
Definition: m256.hpp:176

mfem::AutoSIMD< double, 4, 32 >::AutoSIMD
AutoSIMD(const AutoSIMD &)=default

mfem::AutoSIMD< double, 4, 32 >::operator+=
MFEM_ALWAYS_INLINE AutoSIMD & operator+=(const AutoSIMD &v)
Definition: m256.hpp:67

mfem::AutoSIMD< double, 4, 32 >::operator*
MFEM_ALWAYS_INLINE AutoSIMD operator*(const AutoSIMD &v) const
Definition: m256.hpp:155

mfem::AutoSIMD< double, 4, 32 >::operator/=
MFEM_ALWAYS_INLINE AutoSIMD & operator/=(const double &e)
Definition: m256.hpp:109

mfem::AutoSIMD< double, 4, 32 >::scalar_type
double scalar_type
Definition: m256.hpp:31

mfem::AutoSIMD< double, 4, 32 >::operator-=
MFEM_ALWAYS_INLINE AutoSIMD & operator-=(const AutoSIMD &v)
Definition: m256.hpp:79

mfem::AutoSIMD< double, 4, 32 >::m256d
__m256d m256d
Definition: m256.hpp:37

mfem::AutoSIMD< double, 4, 32 >::operator+
MFEM_ALWAYS_INLINE AutoSIMD operator+(const double &e) const
Definition: m256.hpp:134

mfem::AutoSIMD< double, 4, 32 >::operator*=
MFEM_ALWAYS_INLINE AutoSIMD & operator*=(const AutoSIMD &v)
Definition: m256.hpp:91

mfem::AutoSIMD< double, 4, 32 >::mul
MFEM_ALWAYS_INLINE AutoSIMD & mul(const AutoSIMD &v, const double &e)
Definition: m256.hpp:219

mfem::AutoSIMD< double, 4, 32 >::operator/=
MFEM_ALWAYS_INLINE AutoSIMD & operator/=(const AutoSIMD &v)
Definition: m256.hpp:103

mfem::AutoSIMD< double, 4, 32 >::operator=
MFEM_ALWAYS_INLINE AutoSIMD & operator=(const AutoSIMD &v)
Definition: m256.hpp:55

mfem::AutoSIMD< double, 4, 32 >::operator*=
MFEM_ALWAYS_INLINE AutoSIMD & operator*=(const double &e)
Definition: m256.hpp:97

mfem::AutoSIMD< double, 4, 32 >::operator-
MFEM_ALWAYS_INLINE AutoSIMD operator-(const double &e) const
Definition: m256.hpp:148

mfem::AutoSIMD< double, 4, 32 >::fma
MFEM_ALWAYS_INLINE AutoSIMD & fma(const AutoSIMD &v, const AutoSIMD &w)
Definition: m256.hpp:183

mfem::AutoSIMD< double, 4, 32 >::operator[]
MFEM_ALWAYS_INLINE double & operator[](int i)
Definition: m256.hpp:45

mfem::AutoSIMD< double, 4, 32 >::fma
MFEM_ALWAYS_INLINE AutoSIMD & fma(const AutoSIMD &v, const double &e)
Definition: m256.hpp:193

mfem::AutoSIMD< double, 4, 32 >::operator-
MFEM_ALWAYS_INLINE AutoSIMD operator-() const
Definition: m256.hpp:115

mfem::AutoSIMD< double, 4, 32 >::operator-
MFEM_ALWAYS_INLINE AutoSIMD operator-(const AutoSIMD &v) const
Definition: m256.hpp:141

mfem::AutoSIMD< double, 4, 32 >::operator+
MFEM_ALWAYS_INLINE AutoSIMD operator+(const AutoSIMD &v) const
Definition: m256.hpp:127

mfem::AutoSIMD< double, 4, 32 >::operator-=
MFEM_ALWAYS_INLINE AutoSIMD & operator-=(const double &e)
Definition: m256.hpp:85

mfem::AutoSIMD< double, 4, 32 >::mul
MFEM_ALWAYS_INLINE AutoSIMD & mul(const AutoSIMD &v, const AutoSIMD &w)
Definition: m256.hpp:213

mfem::AutoSIMD< double, 4, 32 >::mul
MFEM_ALWAYS_INLINE AutoSIMD & mul(const double &e, const AutoSIMD &v)
Definition: m256.hpp:225

mfem::AutoSIMD< double, 4, 32 >::operator+=
MFEM_ALWAYS_INLINE AutoSIMD & operator+=(const double &e)
Definition: m256.hpp:73

mfem::AutoSIMD< double, 4, 32 >::operator+
MFEM_ALWAYS_INLINE AutoSIMD operator+() const
Definition: m256.hpp:122

mfem::AutoSIMD< double, 4, 32 >::AutoSIMD
AutoSIMD()=default

mfem::AutoSIMD
Definition: auto.hpp:25

mfem::AutoSIMD::vec
scalar_t vec[size]
Definition: auto.hpp:30

mfem::AutoSIMD::size
static const int size
Definition: auto.hpp:27

mfem::AutoSIMD::align_bytes
static const int align_bytes
Definition: auto.hpp:28