root/html606/arithmetics_8cpp_source.html

 /*  This file is part of the Vc library.


     Copyright (C) 2009-2012 Matthias Kretz <kretz@kde.org>


     Vc is free software: you can redistribute it and/or modify

     it under the terms of the GNU Lesser General Public License as

     published by the Free Software Foundation, either version 3 of

     the License, or (at your option) any later version.


     Vc is distributed in the hope that it will be useful, but

     WITHOUT ANY WARRANTY; without even the implied warranty of

     MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the

     GNU Lesser General Public License for more details.


     You should have received a copy of the GNU Lesser General Public

     License along with Vc.  If not, see <http://www.gnu.org/licenses/>.


 */


 #include "unittest.h"

 #include <iostream>

 #include <limits>

 #include <Vc/limits>

 #include <Vc/common/macros.h>


 using namespace Vc;


 template<typename Vec> void testZero()

 {

     Vec a(Zero), b(Zero);

     COMPARE(a, b);

     Vec c, d(1);

     c.setZero();

     COMPARE(a, c);

     d.setZero();

     COMPARE(a, d);

     d = static_cast<typename Vec::EntryType>(0);

     COMPARE(a, d);

     const typename Vec::EntryType zero = 0;

     COMPARE(a, Vec(zero));

     COMPARE(b, Vec(zero));

     COMPARE(c, Vec(zero));

     COMPARE(d, Vec(zero));

 }


 template<typename Vec> void testCmp()

 {

     typedef typename Vec::EntryType T;

     Vec a(Zero), b(Zero);

     COMPARE(a, b);

     if (!(a != b).isEmpty()) {

         std::cerr << a << " != " << b << ", (a != b) = " << (a != b) << ", (a == b) = " << (a == b) << std::endl;

     }

     VERIFY((a != b).isEmpty());


     Vec c(1);

     VERIFY((a < c).isFull());

     VERIFY((c > a).isFull());

     VERIFY((a <= b).isFull());

     VERIFY((a <= c).isFull());

     VERIFY((b >= a).isFull());

     VERIFY((c >= a).isFull());


     {

         const T max = static_cast<T>(std::numeric_limits<T>::max() * 0.95);

         const T min = 0;

         const T step = max / 200;

         T j = min;

         VERIFY(Vec(Zero) == Vec(j));

         VERIFY(!(Vec(Zero) < Vec(j)));

         VERIFY(!(Vec(Zero) > Vec(j)));

         VERIFY(!(Vec(Zero) != Vec(j)));

         j += step;

         for (int i = 0; i < 200; ++i, j += step) {

             if(Vec(Zero) >= Vec(j)) {

                 std::cout << j << " " << Vec(j) << " " << (Vec(Zero) >= Vec(j)) << std::endl;

             }

             VERIFY(Vec(Zero) < Vec(j));

             VERIFY(Vec(j) > Vec(Zero));

             VERIFY(!(Vec(Zero) >= Vec(j)));

             VERIFY(!(Vec(j) <= Vec(Zero)));

             VERIFY(!static_cast<bool>(Vec(Zero) >= Vec(j)));

             VERIFY(!static_cast<bool>(Vec(j) <= Vec(Zero)));

         }

     }

     if (std::numeric_limits<T>::min() <= 0) {

         const T min = static_cast<T>(std::numeric_limits<T>::min() * 0.95);

         if (min == 0) {

             return;

         }

         const T step = min / T(-201);

         T j = min;

         for (int i = 0; i < 200; ++i, j += step) {

             VERIFY(Vec(j) < Vec(Zero));

             VERIFY(Vec(Zero) > Vec(j));

             VERIFY(!(Vec(Zero) <= Vec(j)));

             VERIFY(!(Vec(j) >= Vec(Zero)));

         }

     }

 }


 template<typename Vec> void testIsMix()

 {

     Vec a(IndexesFromZero);

     Vec b(Zero);

     Vec c(One);

     if (Vec::Size > 1) {

         VERIFY((a == b).isMix());

         VERIFY((a != b).isMix());

         VERIFY((a == c).isMix());

         VERIFY((a != c).isMix());

         VERIFY(!(a == a).isMix());

         VERIFY(!(a != a).isMix());

     } else { // masks of size 1 can never be a mix of 0 and 1

         VERIFY(!(a == b).isMix());

         VERIFY(!(a != b).isMix());

         VERIFY(!(a == c).isMix());

         VERIFY(!(a != c).isMix());

         VERIFY(!(a == a).isMix());

         VERIFY(!(a != a).isMix());

     }

 }


 template<typename Vec> void testAdd()

 {

     Vec a(Zero), b(Zero);

     COMPARE(a, b);


     a += 1;

     Vec c(1);

     COMPARE(a, c);


     COMPARE(a, b + 1);

     COMPARE(a, b + c);

     Vec x(Zero);

 }


 template<typename Vec> void testSub()

 {

     Vec a(2), b(2);

     COMPARE(a, b);


     a -= 1;

     Vec c(1);

     COMPARE(a, c);


     COMPARE(a, b - 1);

     COMPARE(a, b - c);

 }


 template<typename V> void testMul()

 {

     for (int i = 0; i < 10000; ++i) {

         V a = V::Random();

         V b = V::Random();

         V reference = a;

         for (int j = 0; j < V::Size; ++j) {

             // this could overflow - but at least the compiler can't know about it so it doesn't

             // matter that it's undefined behavior in C++. The only thing that matters is what the

             // hardware does...

             reference[j] *= b[j];

         }

         COMPARE(a * b, reference) << a << " * " << b;

     }

 }


 template<typename Vec> void testMulAdd()

 {

     for (unsigned int i = 0; i < 0xffff; ++i) {

         const Vec i2(i * i + 1);

         Vec a(i);


         FUZZY_COMPARE(a * a + 1, i2);

     }

 }


 template<typename Vec> void testMulSub()

 {

     typedef typename Vec::EntryType T;

     for (unsigned int i = 0; i < 0xffff; ++i) {

         const T j = static_cast<T>(i);

         const Vec test(j);


         FUZZY_COMPARE(test * test - test, Vec(j * j - j));

     }

 }


 template<typename Vec> void testDiv()

 {

     typedef typename Vec::EntryType T;

     // If this test fails for ICC see here:

     // http://software.intel.com/en-us/forums/topic/488995


     const T stepsize = std::max(T(1), T(std::numeric_limits<T>::max() / 1024));

     for (T divisor = 1; divisor < 5; ++divisor) {

         for (T scalar = std::numeric_limits<T>::min(); scalar < std::numeric_limits<T>::max() - stepsize + 1; scalar += stepsize) {

             Vec vector(scalar);

             Vec reference(scalar / divisor);


             COMPARE(vector / divisor, reference) << '\n' << vector << " / " << divisor

                 << ", reference: " << scalar << " / " << divisor << " = " << scalar / divisor;

             vector /= divisor;

             COMPARE(vector, reference);

         }

     }

 }


 template<typename Vec> void testAnd()

 {

     Vec a(0x7fff);

     Vec b(0xf);

     COMPARE((a & 0xf), b);

     Vec c(IndexesFromZero);

     COMPARE(c, (c & 0xf));

     const typename Vec::EntryType zero = 0;

     COMPARE((c & 0x7ff0), Vec(zero));

 }


 template<typename Vec> void testShift()

 {

     typedef typename Vec::EntryType T;

     const T step = std::max<T>(1, std::numeric_limits<T>::max() / 1000);

     enum {

         NShifts = sizeof(T) * 8

     };

     for (Vec x = std::numeric_limits<Vec>::min() + Vec::IndexesFromZero();

             x <  std::numeric_limits<Vec>::max() - step;

             x += step) {

         for (size_t shift = 0; shift < NShifts; ++shift) {

             const Vec rightShift = x >> shift;

             const Vec leftShift  = x << shift;

             for (size_t k = 0; k < Vec::Size; ++k) {

                 COMPARE(rightShift[k], T(x[k] >> shift)) << ", x[k] = " << x[k] << ", shift = " << shift;

                 COMPARE(leftShift [k], T(x[k] << shift)) << ", x[k] = " << x[k] << ", shift = " << shift;

             }

         }

     }


     Vec a(1);

     Vec b(2);


     // left shifts

     COMPARE((a << 1), b);

     COMPARE((a << 2), (a << 2));

     COMPARE((a << 2), (b << 1));


     Vec shifts(IndexesFromZero);

     a <<= shifts;

     for (typename Vec::EntryType i = 0, x = 1; i < Vec::Size; ++i, x <<= 1) {

         COMPARE(a[i], x);

     }


     // right shifts

     a = Vec(4);

     COMPARE((a >> 1), b);

     COMPARE((a >> 2), (a >> 2));

     COMPARE((a >> 2), (b >> 1));


     a = Vec(16);

     a >>= shifts;

     for (typename Vec::EntryType i = 0, x = 16; i < Vec::Size; ++i, x >>= 1) {

         COMPARE(a[i], x);

     }

 }


 template<typename Vec> void testOnesComplement()

 {

     Vec a(One);

     Vec b = ~a;

     COMPARE(~a, b);

     COMPARE(~b, a);

     COMPARE(~(a + b), Vec(Zero));

 }


 template<typename T> struct NegateRangeHelper

 {

     typedef int Iterator;

     static const Iterator Start;

     static const Iterator End;

 };

 template<> struct NegateRangeHelper<unsigned int> {

     typedef unsigned int Iterator;

     static const Iterator Start;

     static const Iterator End;

 };

 template<> const int NegateRangeHelper<float>::Start = -0xffffff;

 template<> const int NegateRangeHelper<float>::End   =  0xffffff - 133;

 template<> const int NegateRangeHelper<double>::Start = -0xffffff;

 template<> const int NegateRangeHelper<double>::End   =  0xffffff - 133;

 template<> const int NegateRangeHelper<int>::Start = -0x7fffffff;

 template<> const int NegateRangeHelper<int>::End   = 0x7fffffff - 0xee;

 const unsigned int NegateRangeHelper<unsigned int>::Start = 0;

 const unsigned int NegateRangeHelper<unsigned int>::End = 0xffffffff - 0xee;

 template<> const int NegateRangeHelper<short>::Start = -0x7fff;

 template<> const int NegateRangeHelper<short>::End = 0x7fff - 0xee;

 template<> const int NegateRangeHelper<unsigned short>::Start = 0;

 template<> const int NegateRangeHelper<unsigned short>::End = 0xffff - 0xee;


 template<typename Vec> void testNegate()

 {

     typedef typename Vec::EntryType T;

     typedef NegateRangeHelper<T> Range;

     for (typename Range::Iterator i = Range::Start; i < Range::End; i += 0xef) {

         T i2 = static_cast<T>(i);

         Vec a(i2);


         COMPARE(static_cast<Vec>(-a), Vec(-i2)) << " i2: " << i2;

     }

 }


 template<typename Vec> void testMin()

 {

     typedef typename Vec::EntryType T;

     typedef typename Vec::Mask Mask;

     typedef typename Vec::IndexType I;


     Vec v(I::IndexesFromZero());


     COMPARE(v.min(), static_cast<T>(0));

     COMPARE((T(Vec::Size) - v).min(), static_cast<T>(1));


     int j = 0;

     Mask m;

     do {

         m = allMasks<Vec>(j++);

         if (m.isEmpty()) {

             break;

         }

         COMPARE(v.min(m), static_cast<T>(m.firstOne())) << m << v;

     } while (true);

 }


 template<typename Vec> void testMax()

 {

     typedef typename Vec::EntryType T;

     typedef typename Vec::Mask Mask;

     typedef typename Vec::IndexType I;


     Vec v(I::IndexesFromZero());


     COMPARE(v.max(), static_cast<T>(Vec::Size - 1));

     v = T(Vec::Size) - v;

     COMPARE(v.max(), static_cast<T>(Vec::Size));


     int j = 0;

     Mask m;

     do {

         m = allMasks<Vec>(j++);

         if (m.isEmpty()) {

             break;

         }

         COMPARE(v.max(m), static_cast<T>(Vec::Size - m.firstOne())) << m << v;

     } while (true);

 }


 template<typename Vec> void testProduct()

 {

     typedef typename Vec::EntryType T;

     typedef typename Vec::Mask Mask;


     for (int i = 0; i < 10; ++i) {

         T x = static_cast<T>(i);

         Vec v(x);

         T x2 = x;

         for (int k = Vec::Size; k > 1; k /= 2) {

             x2 *= x2;

         }

         COMPARE(v.product(), x2);


         int j = 0;

         Mask m;

         do {

             m = allMasks<Vec>(j++);

             if (m.isEmpty()) {

                 break;

             }

             if (std::numeric_limits<T>::is_exact) {

                 x2 = x;

                 for (int k = m.count(); k > 1; --k) {

                     x2 *= x;

                 }

             } else {

                 x2 = static_cast<T>(pow(static_cast<double>(x), m.count()));

             }

             COMPARE(v.product(m), x2) << m << v;

         } while (true);

     }

 }


 template<typename Vec> void testSum()

 {

     typedef typename Vec::EntryType T;

     typedef typename Vec::Mask Mask;


     for (int i = 0; i < 10; ++i) {

         T x = static_cast<T>(i);

         Vec v(x);

         COMPARE(v.sum(), x * Vec::Size);


         int j = 0;

         Mask m;

         do {

             m = allMasks<Vec>(j++);

             COMPARE(v.sum(m), x * m.count()) << m << v;

         } while (!m.isEmpty());

     }

 }


 template<typename V> void fma()

 {

     for (int i = 0; i < 1000; ++i) {

         V a = V::Random();

         const V b = V::Random();

         const V c = V::Random();

         const V reference = a * b + c;

         a.fusedMultiplyAdd(b, c);

         COMPARE(a, reference) << ", a = " << a << ", b = " << b << ", c = " << c;

     }

 }


 template<> void fma<float_v>()

 {

     float_v b = Vc_buildFloat(1, 0x000001, 0);

     float_v c = Vc_buildFloat(1, 0x000000, -24);

     float_v a = b;

     /*a *= b;

     a += c;

     COMPARE(a, float_v(Vc_buildFloat(1, 0x000002, 0)));

     a = b;*/

     a.fusedMultiplyAdd(b, c);

     COMPARE(a, float_v(Vc_buildFloat(1, 0x000003, 0)));


     a = Vc_buildFloat(1, 0x000002, 0);

     b = Vc_buildFloat(1, 0x000002, 0);

     c = Vc_buildFloat(-1, 0x000000, 0);

     /*a *= b;

     a += c;

     COMPARE(a, float_v(Vc_buildFloat(1, 0x000000, -21)));

     a = b;*/

     a.fusedMultiplyAdd(b, c); // 1 + 2^-21 + 2^-44 - 1 == (1 + 2^-20)*2^-18

     COMPARE(a, float_v(Vc_buildFloat(1, 0x000001, -21)));

 }


 template<> void fma<sfloat_v>()

 {

     sfloat_v b = Vc_buildFloat(1, 0x000001, 0);

     sfloat_v c = Vc_buildFloat(1, 0x000000, -24);

     sfloat_v a = b;

     /*a *= b;

     a += c;

     COMPARE(a, sfloat_v(Vc_buildFloat(1, 0x000002, 0)));

     a = b;*/

     a.fusedMultiplyAdd(b, c);

     COMPARE(a, sfloat_v(Vc_buildFloat(1, 0x000003, 0)));


     a = Vc_buildFloat(1, 0x000002, 0);

     b = Vc_buildFloat(1, 0x000002, 0);

     c = Vc_buildFloat(-1, 0x000000, 0);

     /*a *= b;

     a += c;

     COMPARE(a, sfloat_v(Vc_buildFloat(1, 0x000000, -21)));

     a = b;*/

     a.fusedMultiplyAdd(b, c); // 1 + 2^-21 + 2^-44 - 1 == (1 + 2^-20)*2^-18

     COMPARE(a, sfloat_v(Vc_buildFloat(1, 0x000001, -21)));

 }


 template<> void fma<double_v>()

 {

     double_v b = Vc_buildDouble(1, 0x0000000000001, 0);

     double_v c = Vc_buildDouble(1, 0x0000000000000, -53);

     double_v a = b;

     a.fusedMultiplyAdd(b, c);

     COMPARE(a, double_v(Vc_buildDouble(1, 0x0000000000003, 0)));


     a = Vc_buildDouble(1, 0x0000000000002, 0);

     b = Vc_buildDouble(1, 0x0000000000002, 0);

     c = Vc_buildDouble(-1, 0x0000000000000, 0);

     a.fusedMultiplyAdd(b, c); // 1 + 2^-50 + 2^-102 - 1

     COMPARE(a, double_v(Vc_buildDouble(1, 0x0000000000001, -50)));

 }


 int main(int argc, char **argv)

 {

     initTest(argc, argv);


     testAllTypes(fma);


     runTest(testZero<int_v>);

     runTest(testZero<uint_v>);

     runTest(testZero<float_v>);

     runTest(testZero<double_v>);

     runTest(testZero<short_v>);

     runTest(testZero<ushort_v>);

     runTest(testZero<sfloat_v>);


     runTest(testCmp<int_v>);

     runTest(testCmp<uint_v>);

     runTest(testCmp<float_v>);

     runTest(testCmp<double_v>);

     runTest(testCmp<short_v>);

     runTest(testCmp<ushort_v>);

     runTest(testCmp<sfloat_v>);


     runTest(testIsMix<int_v>);

     runTest(testIsMix<uint_v>);

     //runTest(testIsMix<float_v>);

     //runTest(testIsMix<double_v>);

     runTest(testIsMix<short_v>);

     runTest(testIsMix<ushort_v>);

     //runTest(testIsMix<sfloat_v>);


     runTest(testAdd<int_v>);

     runTest(testAdd<uint_v>);

     runTest(testAdd<float_v>);

     runTest(testAdd<double_v>);

     runTest(testAdd<short_v>);

     runTest(testAdd<ushort_v>);

     runTest(testAdd<sfloat_v>);


     runTest(testSub<int_v>);

     runTest(testSub<uint_v>);

     runTest(testSub<float_v>);

     runTest(testSub<double_v>);

     runTest(testSub<short_v>);

     runTest(testSub<ushort_v>);

     runTest(testSub<sfloat_v>);


     runTest(testMul<int_v>);

     runTest(testMul<uint_v>);

     runTest(testMul<float_v>);

     runTest(testMul<double_v>);

     runTest(testMul<short_v>);

     runTest(testMul<ushort_v>);

     runTest(testMul<sfloat_v>);


     runTest(testDiv<int_v>);

     runTest(testDiv<uint_v>);

     runTest(testDiv<float_v>);

     runTest(testDiv<double_v>);

     runTest(testDiv<short_v>);

     runTest(testDiv<ushort_v>);

     runTest(testDiv<sfloat_v>);


     runTest(testAnd<int_v>);

     runTest(testAnd<uint_v>);

     runTest(testAnd<short_v>);

     runTest(testAnd<ushort_v>);

     // no operator& for float/double


     runTest(testShift<int_v>);

     runTest(testShift<uint_v>);

     runTest(testShift<short_v>);

     runTest(testShift<ushort_v>);


     runTest(testMulAdd<int_v>);

     runTest(testMulAdd<uint_v>);

     runTest(testMulAdd<float_v>);

     runTest(testMulAdd<double_v>);

     runTest(testMulAdd<short_v>);

     runTest(testMulAdd<ushort_v>);

     runTest(testMulAdd<sfloat_v>);


     runTest(testMulSub<int_v>);

     runTest(testMulSub<uint_v>);

     runTest(testMulSub<float_v>);

     runTest(testMulSub<double_v>);

     runTest(testMulSub<short_v>);

     runTest(testMulSub<ushort_v>);

     runTest(testMulSub<sfloat_v>);


     runTest(testOnesComplement<int_v>);

     runTest(testOnesComplement<uint_v>);

     runTest(testOnesComplement<short_v>);

     runTest(testOnesComplement<ushort_v>);


     testAllTypes(testNegate);

     testAllTypes(testMin);

     testAllTypes(testMax);

     testAllTypes(testProduct);

     testAllTypes(testSum);


     return 0;

 }

ROOT::Vc::AVX::sfloat_v
Vector< sfloat > sfloat_v
Definition: vector.h:418

ROOT::Vc::sfloat_v
VECTOR_NAMESPACE::sfloat_v sfloat_v
Definition: vector.h:82

ROOT::Vc::AVX::min
static Vc_ALWAYS_INLINE int_v min(const int_v &x, const int_v &y)
Definition: vector.h:433

testMulSub
void testMulSub()
Definition: arithmetics.cpp:177

FUZZY_COMPARE
#define FUZZY_COMPARE(a, b)
Definition: unittest.h:506

initTest
void initTest(int argc, char **argv)
Definition: unittest.h:169

main
int main(int argc, char **argv)
Definition: arithmetics.cpp:482

xmlio::Size
const char * Size
Definition: TXMLSetup.cxx:56

ROOT::Math::Chebyshev::T
double T(double x)
Definition: ChebyshevPol.h:34

test
Definition: testInversion.cxx:24

fma< sfloat_v >
void fma< sfloat_v >()
Definition: arithmetics.cpp:444

a
TArc * a
Definition: textangle.C:12

fma< double_v >
void fma< double_v >()
Definition: arithmetics.cpp:467

testOnesComplement
void testOnesComplement()
Definition: arithmetics.cpp:266

testMulAdd
void testMulAdd()
Definition: arithmetics.cpp:167

ROOT::Vc::VectorSpecialInitializerIndexesFromZero::IndexesFromZero
Definition: types.h:45

fma< float_v >
void fma< float_v >()
Definition: arithmetics.cpp:421

x2
static const double x2[5]
Definition: RooGaussKronrodIntegrator1D.cxx:344

x
Double_t x[n]
Definition: legend1.C:17

COMPARE
#define COMPARE(a, b)
Definition: unittest.h:509

ROOT::Vc::VectorSpecialInitializerOne::One
Definition: types.h:44

pow
double pow(double, double)

ROOT::Vc::VectorSpecialInitializerZero::Zero
Definition: types.h:43

testAllTypes
#define testAllTypes(name)
Definition: unittest.h:43

testMul
void testMul()
Definition: arithmetics.cpp:151

Vc_buildDouble
#define Vc_buildDouble(sign, mantissa, exponent)
Definition: macros.h:283

ROOT::Vc::AVX::double_v
Vector< double > double_v
Definition: vector.h:416

v
SVector< double, 2 > v
Definition: Dict.h:5

testSum
void testSum()
Definition: arithmetics.cpp:390

ROOT::Vc::double_v
VECTOR_NAMESPACE::double_v double_v
Definition: vector.h:80

testAdd
void testAdd()
Definition: arithmetics.cpp:124

m
TMarker * m
Definition: textangle.C:8

unittest.h

testDiv
void testDiv()
Definition: arithmetics.cpp:188

testZero
void testZero()
Definition: arithmetics.cpp:28

testIsMix
void testIsMix()
Definition: arithmetics.cpp:102

VERIFY
#define VERIFY(cond)
Definition: unittest.h:515

macros.h

Vc_buildFloat
#define Vc_buildFloat(sign, mantissa, exponent)
Definition: macros.h:294

Random
void Random()
Definition: utils.cpp:154

testSub
void testSub()
Definition: arithmetics.cpp:138

ROOT::Vc::float_v
VECTOR_NAMESPACE::float_v float_v
Definition: vector.h:84

ROOT::Vc::AVX::max
static Vc_ALWAYS_INLINE int_v max(const int_v &x, const int_v &y)
Definition: vector.h:440

Range
Ta Range(0, 0, 1, 1)

sample_config.c
tuple c
Definition: sample_config.py:3

Rgl::Pad::End
void End()
Definition: TGLPadUtils.cxx:620

ROOT::Vc
Definition: casts.h:28

testMax
void testMax()
Definition: arithmetics.cpp:333

I
#define I(x, y, z)

testShift
void testShift()
Definition: arithmetics.cpp:219

testMin
void testMin()
Definition: arithmetics.cpp:311

testProduct
void testProduct()
Definition: arithmetics.cpp:356

testNegate
void testNegate()
Definition: arithmetics.cpp:299

testCmp
void testCmp()
Definition: arithmetics.cpp:46

testAnd
void testAnd()
Definition: arithmetics.cpp:208

fma
void fma()
Definition: arithmetics.cpp:409

runTest
#define runTest(name)
Definition: unittest.h:42

ROOT::Vc::AVX::float_v
Vector< float > float_v
Definition: vector.h:417