doc/v606/avx_2math_8h_source.html

 /*  This file is part of the Vc library.


     Copyright (C) 2009-2012 Matthias Kretz <kretz@kde.org>


     Vc is free software: you can redistribute it and/or modify

     it under the terms of the GNU Lesser General Public License as

     published by the Free Software Foundation, either version 3 of

     the License, or (at your option) any later version.


     Vc is distributed in the hope that it will be useful, but

     WITHOUT ANY WARRANTY; without even the implied warranty of

     MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the

     GNU Lesser General Public License for more details.


     You should have received a copy of the GNU Lesser General Public

     License along with Vc.  If not, see <http://www.gnu.org/licenses/>.


 */


 #ifndef VC_AVX_MATH_H

 #define VC_AVX_MATH_H


 #include "const.h"

 #include "limits.h"

 #include "macros.h"


 namespace ROOT {

 namespace Vc

 {

 namespace AVX

 {

     /**
      * Splits every entry of \p v into a fraction and a power-of-two exponent.
      * The sign is kept with the fraction.
      *
      * The returned fraction will be in the range [0.5, 1.0[.
      *
      * \param v  the values to decompose
      * \param e  receives the integer power-of-two exponent. It is computed with a
      *           64-bit shift, i.e. once per 64-bit lane of \p e.
      *           NOTE(review): confirm which int_v entries callers are expected
      *           to read for the four double lanes.
      * \return the fraction. Entries of \p v that are NaN, not finite or zero are
      *         handed back unchanged; \p e is additionally cleared where \p v is
      *         zero.
      */
     inline double_v frexp(double_v::AsArg v, int_v *e) {
         const m256d expMask = Const<double>::exponentMask().dataD();

         // Isolate the biased exponent field and move it down to bit 0 of each
         // 64-bit lane. Subtracting 0x3fe (one less than the IEEE-754 double bias
         // 0x3ff) matches a fraction normalised to [0.5, 1.0[.
         const m256i isolatedExp = avx_cast<m256i>(_mm256_and_pd(v.data(), expMask));
         const m256i biasedExp = _mm256_srli_epi64(isolatedExp, 52);
         e->data() = _mm256_sub_epi32(biasedExp, _mm256_set1_epi32(0x3fe));

         // Set all exponent bits first, then let frexpMask select the bits that
         // make up the fraction.
         const m256d fractionMask = _mm256_broadcast_sd(reinterpret_cast<const double *>(&c_general::frexpMask));
         double_v fraction = _mm256_and_pd(_mm256_or_pd(v.data(), expMask), fractionMask);

         // Special inputs pass through untouched; a zero input also gets exponent 0.
         double_m isZero = v == double_v::Zero();
         fraction(isnan(v) || !isfinite(v) || isZero) = v;
         e->setZero(isZero.data());
         return fraction;
     }

     /**
      * Single-precision frexp: splits every entry of \p v into a fraction (sign
      * kept with the fraction) and a power-of-two exponent written to \p e.
      *
      * \param v  the values to decompose
      * \param e  receives the integer exponent of each entry
      * \return the fraction. Entries of \p v that are NaN, not finite or zero are
      *         handed back unchanged; \p e is additionally cleared where \p v is
      *         zero.
      */
     inline float_v frexp(float_v::AsArg v, int_v *e) {
         const m256 expMask = Const<float>::exponentMask().data();

         // Biased exponent moved down to bit 0 of each 32-bit lane. 0x7e is one
         // less than the IEEE-754 single bias 0x7f.
         const m256i isolatedExp = avx_cast<m256i>(_mm256_and_ps(v.data(), expMask));
         e->data() = _mm256_sub_epi32(_mm256_srli_epi32(isolatedExp, 23), _mm256_set1_epi32(0x7e));

         // 0xbf7fffff keeps sign and mantissa and leaves 0x7e in the exponent
         // field once all exponent bits have been set.
         const m256 keepBits = avx_cast<m256>(_mm256_set1_epi32(0xbf7fffffu));
         float_v fraction = _mm256_and_ps(_mm256_or_ps(v.data(), expMask), keepBits);

         // Special inputs pass through untouched; a zero input also gets exponent 0.
         fraction(isnan(v) || !isfinite(v) || v == float_v::Zero()) = v;
         e->setZero(v == float_v::Zero());
         return fraction;
     }

     /**
      * frexp for sfloat_v: splits every entry of \p v into a fraction (sign kept
      * with the fraction) and a power-of-two exponent stored as 16-bit integers.
      *
      * \param v  the values to decompose
      * \param e  receives the integer exponent of each entry
      * \return the fraction. Entries of \p v that are NaN, not finite or zero are
      *         handed back unchanged; \p e is additionally cleared where \p v is
      *         zero.
      */
     inline sfloat_v frexp(sfloat_v::AsArg v, short_v *e) {
         const m256 expMask = Const<float>::exponentMask().data();
         const m256 isolatedExp = _mm256_and_ps(v.data(), expMask);

         // Shift the exponent of each 128-bit half down to bit 0, then narrow the
         // eight 32-bit results to 16 bit before removing the offset 0x7e.
         const m128i lowHalf = _mm_srli_epi32(avx_cast<m128i>(isolatedExp), 23);
         const m128i highHalf = _mm_srli_epi32(avx_cast<m128i>(hi128(isolatedExp)), 23);
         e->data() = _mm_sub_epi16(_mm_packs_epi32(lowHalf, highHalf), _mm_set1_epi16(0x7e));

         // 0xbf7fffff keeps sign and mantissa and leaves 0x7e in the exponent
         // field once all exponent bits have been set.
         const m256 keepBits = avx_cast<m256>(_mm256_set1_epi32(0xbf7fffffu));
         sfloat_v fraction = _mm256_and_ps(_mm256_or_ps(v.data(), expMask), keepBits);

         // Special inputs pass through untouched; a zero input also gets exponent 0.
         fraction(isnan(v) || !isfinite(v) || v == sfloat_v::Zero()) = v;
         e->setZero(v == sfloat_v::Zero());
         return fraction;
     }


     /**
      * Scales every entry of \p v by two to the power of the matching exponent.
      *
      *             -> x * 2^e
      * x == NaN    -> NaN
      * x == (-)inf -> (-)inf
      *
      * The scaling is an integer addition of the exponent to the exponent field
      * of \p v; no overflow or underflow of the exponent field is detected.
      *
      * \param v   the values to scale
      * \param _e  the power-of-two exponents. The shift works on 64-bit lanes, so
      *            only the low 32 bits of each lane contribute.
      *            NOTE(review): confirm this lane layout against the callers.
      * \return \p v * 2^\p _e; zero, NaN and infinite entries of \p v are returned
      *         unchanged.
      */
     inline double_v ldexp(double_v::AsArg v, int_v::AsArg _e) {
         int_v e = _e;
         // Zero has to stay zero, so nothing may be added to its exponent field.
         e.setZero((v == double_v::Zero()).dataI());
         const m256i exponentBits = _mm256_slli_epi64(e.data(), 52);
         double_v ret = avx_cast<m256d>(_mm256_add_epi64(avx_cast<m256i>(v.data()), exponentBits));
         // NaN and +-inf carry an all-ones exponent field. The integer add above
         // would carry into the sign bit (e > 0) or produce a finite exponent
         // (e < 0), so restore the input for those entries.
         ret(isnan(v) || !isfinite(v)) = v;
         return ret;
     }

     /**
      * Single-precision ldexp: scales every entry of \p v by two to the power of
      * the matching entry of \p _e.
      *
      * The scaling is an integer addition of the exponent to the exponent field
      * of \p v; no overflow or underflow of the exponent field is detected.
      *
      * \param v   the values to scale
      * \param _e  the power-of-two exponents
      * \return \p v * 2^\p _e; zero, NaN and infinite entries of \p v are returned
      *         unchanged.
      */
     inline float_v ldexp(float_v::AsArg v, int_v::AsArg _e) {
         int_v e = _e;
         // Zero has to stay zero, so nothing may be added to its exponent field.
         e.setZero(static_cast<int_m>(v == float_v::Zero()));
         float_v ret = (v.reinterpretCast<int_v>() + (e << 23)).reinterpretCast<float_v>();
         // NaN and +-inf carry an all-ones exponent field. The integer add above
         // would carry into the sign bit (e > 0) or produce a finite exponent
         // (e < 0), so restore the input for those entries.
         ret(isnan(v) || !isfinite(v)) = v;
         return ret;
     }

     /**
      * ldexp for sfloat_v: scales every entry of \p v by two to the power of the
      * matching 16-bit entry of \p _e.
      *
      * The scaling is an integer addition of the exponent to the exponent field
      * of \p v; no overflow or underflow of the exponent field is detected.
      *
      * \param v   the values to scale
      * \param _e  the power-of-two exponents
      * \return \p v * 2^\p _e; zero, NaN and infinite entries of \p v are returned
      *         unchanged.
      */
     inline sfloat_v ldexp(sfloat_v::AsArg v, short_v::AsArg _e) {
         short_v e = _e;
         // Zero has to stay zero, so nothing may be added to its exponent field.
         e.setZero(static_cast<short_m>(v == sfloat_v::Zero()));
         // Shift by 7 inside the 16-bit entries; the interleave below places each
         // entry in the upper half of a 32-bit lane, which adds the remaining 16
         // bits for a total shift of 23.
         e = e << (23 - 16);
         const m256i exponentBits = concat(_mm_unpacklo_epi16(_mm_setzero_si128(), e.data()),
                 _mm_unpackhi_epi16(_mm_setzero_si128(), e.data()));
         sfloat_v ret = (v.reinterpretCast<int_v>() + int_v(exponentBits)).reinterpretCast<sfloat_v>();
         // NaN and +-inf carry an all-ones exponent field. The integer add above
         // would carry into the sign bit (e > 0) or produce a finite exponent
         // (e < 0), so restore the input for those entries.
         ret(isnan(v) || !isfinite(v)) = v;
         return ret;
     }


     // trunc: rounds every entry of v with rounding control 0x3, which is the
     // value of _MM_FROUND_TO_ZERO (round toward zero) for the AVX round
     // intrinsics.
     static Vc_ALWAYS_INLINE float_v trunc(float_v::AsArg v)
     {
         return _mm256_round_ps(v.data(), 0x3);
     }

     static Vc_ALWAYS_INLINE sfloat_v trunc(sfloat_v::AsArg v)
     {
         return _mm256_round_ps(v.data(), 0x3);
     }

     static Vc_ALWAYS_INLINE double_v trunc(double_v::AsArg v)
     {
         return _mm256_round_pd(v.data(), 0x3);
     }


     // floor: forwards every entry of v to the AVX floor intrinsic of the
     // matching precision.
     static Vc_ALWAYS_INLINE float_v floor(float_v::AsArg v)
     {
         return _mm256_floor_ps(v.data());
     }

     static Vc_ALWAYS_INLINE sfloat_v floor(sfloat_v::AsArg v)
     {
         return _mm256_floor_ps(v.data());
     }

     static Vc_ALWAYS_INLINE double_v floor(double_v::AsArg v)
     {
         return _mm256_floor_pd(v.data());
     }


     // ceil: forwards every entry of v to the AVX ceil intrinsic of the
     // matching precision.
     static Vc_ALWAYS_INLINE float_v ceil(float_v::AsArg v)
     {
         return _mm256_ceil_ps(v.data());
     }

     static Vc_ALWAYS_INLINE sfloat_v ceil(sfloat_v::AsArg v)
     {
         return _mm256_ceil_ps(v.data());
     }

     static Vc_ALWAYS_INLINE double_v ceil(double_v::AsArg v)
     {
         return _mm256_ceil_pd(v.data());
     }

 } // namespace AVX

 } // namespace Vc

 } // namespace ROOT


 #include "undomacros.h"

 #define VC__USE_NAMESPACE AVX

 #include "../common/trigonometric.h"

 #define VC__USE_NAMESPACE AVX

 #include "../common/logarithm.h"

 #define VC__USE_NAMESPACE AVX

 #include "../common/exponential.h"

 #undef VC__USE_NAMESPACE


 #endif // VC_AVX_MATH_H

ROOT::Vc::AVX::sfloat_v
Vector< sfloat > sfloat_v
Definition: vector.h:418

macros.h

ROOT::Vc::sfloat_v
VECTOR_NAMESPACE::sfloat_v sfloat_v
Definition: vector.h:82

ROOT::Vc::AVX::ldexp
double_v ldexp(double_v::AsArg v, int_v::AsArg _e)
Definition: math.h:75

ROOT
Namespace for new ROOT classes and functions.
Definition: ROOT.py:1

ROOT::Vc::AVX::trunc
static Vc_ALWAYS_INLINE float_v trunc(float_v::AsArg v)
Definition: math.h:95

ROOT::Vc::AVX::avx_cast
static Vc_INTRINSIC_L T avx_cast(param128 v) Vc_INTRINSIC_R
Definition: casts.h:49

ROOT::Vc::AVX::Mask< Size, sizeof(VectorType)>

ROOT::Vc::AVX::Vector
Definition: const.h:32

ROOT::Vc::AVX::short_v
Vector< short > short_v
Definition: vector.h:421

ROOT::Vc::AVX::m256d
__m256d m256d
Definition: intrinsics.h:114

ROOT::Vc::AVX::hi128
Vc_INTRINSIC Vc_CONST m128 hi128(param256 v)
Definition: casts.h:118

ROOT::Vc::AVX::isfinite
static Vc_ALWAYS_INLINE Vector< T >::Mask isfinite(const Vector< T > &x)
Definition: vector.h:454

ROOT::Vc::AVX::Vector::setZero
Vc_INTRINSIC_L void setZero() Vc_INTRINSIC_R

ROOT::Vc::AVX::frexp
double_v frexp(double_v::AsArg v, int_v *e)
splits v into exponent and mantissa, the sign is kept with the mantissa
Definition: math.h:38

limits.h

ROOT::Vc::AVX::concat
Vc_INTRINSIC Vc_CONST m256 concat(param128 a, param128 b)
Definition: casts.h:123

ROOT::Vc::AVX::floor
static Vc_ALWAYS_INLINE float_v floor(float_v::AsArg v)
Definition: math.h:99

ROOT::Vc::AVX::ceil
static Vc_ALWAYS_INLINE float_v ceil(float_v::AsArg v)
Definition: math.h:103

ROOT::Vc::AVX::Vector::Zero
static Vc_INTRINSIC_L Vc_CONST_L Vector Zero() Vc_INTRINSIC_R Vc_CONST_R

AVX
#define AVX
Definition: global.h:90

ROOT::Vc::int_v
VECTOR_NAMESPACE::int_v int_v
Definition: vector.h:86

ROOT::Vc::AVX::double_v
Vector< double > double_v
Definition: vector.h:416

v
SVector< double, 2 > v
Definition: Dict.h:5

ROOT::Vc::AVX::m256i
__m256i m256i
Definition: intrinsics.h:115

const.h

undomacros.h

ROOT::Vc::AVX::isnan
static Vc_ALWAYS_INLINE Vector< T >::Mask isnan(const Vector< T > &x)
Definition: vector.h:455

Vc_ALWAYS_INLINE
#define Vc_ALWAYS_INLINE
Definition: macros.h:130

ROOT::Vc::AVX::Vector::AsArg
Vector< T > AsArg
Definition: vector.h:67

ROOT::Vc::AVX::m256
__m256 m256
Definition: intrinsics.h:113

ROOT::Vc::AVX::_mm256_set1_epi32
static Vc_INTRINSIC m256i Vc_CONST _mm256_set1_epi32(int a)
Definition: intrinsics.h:157

ROOT::Vc::float_v
VECTOR_NAMESPACE::float_v float_v
Definition: vector.h:84

ROOT::Vc::AVX::int_v
Vector< int > int_v
Definition: vector.h:419

ROOT::Vc
Definition: casts.h:28

ROOT::Vc::AVX::Const::exponentMask
static Vc_ALWAYS_INLINE Vc_CONST M exponentMask()
Definition: const.h:88

ROOT::Vc::AVX::Vector::data
Vc_ALWAYS_INLINE VectorType & data()
Definition: vector.h:322