From 44861dcbfeee041223c4aac1ee075e92fa4daa01 Mon Sep 17 00:00:00 2001 From: Stanislaw Halik Date: Sun, 18 Sep 2016 12:42:15 +0200 Subject: update --- eigen/test/packetmath.cpp | 385 ++++++++++++++++++++++++++++++++++++++++++++++ 1 file changed, 385 insertions(+) create mode 100644 eigen/test/packetmath.cpp (limited to 'eigen/test/packetmath.cpp') diff --git a/eigen/test/packetmath.cpp b/eigen/test/packetmath.cpp new file mode 100644 index 0000000..38aa256 --- /dev/null +++ b/eigen/test/packetmath.cpp @@ -0,0 +1,385 @@ +// This file is part of Eigen, a lightweight C++ template library +// for linear algebra. +// +// Copyright (C) 2008-2009 Gael Guennebaud +// Copyright (C) 2006-2008 Benoit Jacob +// +// This Source Code Form is subject to the terms of the Mozilla +// Public License v. 2.0. If a copy of the MPL was not distributed +// with this file, You can obtain one at http://mozilla.org/MPL/2.0/. + +#include "main.h" + +// using namespace Eigen; + +namespace Eigen { +namespace internal { +template T negate(const T& x) { return -x; } +} +} + +template bool isApproxAbs(const Scalar& a, const Scalar& b, const typename NumTraits::Real& refvalue) +{ + return internal::isMuchSmallerThan(a-b, refvalue); +} + +template bool areApproxAbs(const Scalar* a, const Scalar* b, int size, const typename NumTraits::Real& refvalue) +{ + for (int i=0; i >(a,size) << "]" << " != " << Map >(b,size) << "\n"; + return false; + } + } + return true; +} + +template bool areApprox(const Scalar* a, const Scalar* b, int size) +{ + for (int i=0; i >(a,size) << "]" << " != " << Map >(b,size) << "\n"; + return false; + } + } + return true; +} + + +#define CHECK_CWISE2(REFOP, POP) { \ + for (int i=0; i(data1), internal::pload(data1+PacketSize))); \ + VERIFY(areApprox(ref, data2, PacketSize) && #POP); \ +} + +#define CHECK_CWISE1(REFOP, POP) { \ + for (int i=0; i(data1))); \ + VERIFY(areApprox(ref, data2, PacketSize) && #POP); \ +} + +template +struct packet_helper +{ + template + inline Packet load(const T* from) const { return internal::pload(from); } + + template + inline void store(T* to, const Packet& x) const { internal::pstore(to,x); } +}; + +template +struct packet_helper +{ + template + inline T load(const T* from) const { return *from; } + + template + inline void store(T* to, const T& x) const { *to = x; } +}; + +#define CHECK_CWISE1_IF(COND, REFOP, POP) if(COND) { \ + packet_helper h; \ + for (int i=0; i void packetmath() +{ + using std::abs; + typedef typename internal::packet_traits::type Packet; + const int PacketSize = internal::packet_traits::size; + typedef typename NumTraits::Real RealScalar; + + const int size = PacketSize*4; + EIGEN_ALIGN16 Scalar data1[internal::packet_traits::size*4]; + EIGEN_ALIGN16 Scalar data2[internal::packet_traits::size*4]; + EIGEN_ALIGN16 Packet packets[PacketSize*2]; + EIGEN_ALIGN16 Scalar ref[internal::packet_traits::size*4]; + RealScalar refvalue = 0; + for (int i=0; i()/RealScalar(PacketSize); + data2[i] = internal::random()/RealScalar(PacketSize); + refvalue = (std::max)(refvalue,abs(data1[i])); + } + + internal::pstore(data2, internal::pload(data1)); + VERIFY(areApprox(data1, data2, PacketSize) && "aligned load/store"); + + for (int offset=0; offset(data1+offset)); + VERIFY(areApprox(data1+offset, data2, PacketSize) && "internal::ploadu"); + } + + for (int offset=0; offset(data1)); + VERIFY(areApprox(data1, data2+offset, PacketSize) && "internal::pstoreu"); + } + + for (int offset=0; offset(data1); + packets[1] = internal::pload(data1+PacketSize); + if (offset==0) internal::palign<0>(packets[0], packets[1]); + else if (offset==1) internal::palign<1>(packets[0], packets[1]); + else if (offset==2) internal::palign<2>(packets[0], packets[1]); + else if (offset==3) internal::palign<3>(packets[0], packets[1]); + internal::pstore(data2, packets[0]); + + for (int i=0; i::value) + CHECK_CWISE2(REF_DIV, internal::pdiv); + #endif + CHECK_CWISE1(internal::negate, internal::pnegate); + CHECK_CWISE1(numext::conj, internal::pconj); + + for(int offset=0;offset<3;++offset) + { + for (int i=0; i(data1[offset])); + VERIFY(areApprox(ref, data2, PacketSize) && "internal::pset1"); + } + + VERIFY(internal::isApprox(data1[0], internal::pfirst(internal::pload(data1))) && "internal::pfirst"); + + if(PacketSize>1) + { + for(int offset=0;offset<4;++offset) + { + for(int i=0;i(data1+offset)); + VERIFY(areApprox(ref, data2, PacketSize) && "ploaddup"); + } + } + + ref[0] = 0; + for (int i=0; i(data1)), refvalue) && "internal::predux"); + + ref[0] = 1; + for (int i=0; i(data1))) && "internal::predux_mul"); + + for (int j=0; j(data1+j*PacketSize); + } + internal::pstore(data2, internal::preduxp(packets)); + VERIFY(areApproxAbs(ref, data2, PacketSize, refvalue) && "internal::preduxp"); + + for (int i=0; i(data1))); + VERIFY(areApprox(ref, data2, PacketSize) && "internal::preverse"); +} + +template void packetmath_real() +{ + using std::abs; + typedef typename internal::packet_traits::type Packet; + const int PacketSize = internal::packet_traits::size; + + const int size = PacketSize*4; + EIGEN_ALIGN16 Scalar data1[internal::packet_traits::size*4]; + EIGEN_ALIGN16 Scalar data2[internal::packet_traits::size*4]; + EIGEN_ALIGN16 Scalar ref[internal::packet_traits::size*4]; + + for (int i=0; i(-1,1) * std::pow(Scalar(10), internal::random(-3,3)); + data2[i] = internal::random(-1,1) * std::pow(Scalar(10), internal::random(-3,3)); + } + CHECK_CWISE1_IF(internal::packet_traits::HasSin, std::sin, internal::psin); + CHECK_CWISE1_IF(internal::packet_traits::HasCos, std::cos, internal::pcos); + CHECK_CWISE1_IF(internal::packet_traits::HasTan, std::tan, internal::ptan); + + for (int i=0; i(-1,1); + data2[i] = internal::random(-1,1); + } + CHECK_CWISE1_IF(internal::packet_traits::HasASin, std::asin, internal::pasin); + CHECK_CWISE1_IF(internal::packet_traits::HasACos, std::acos, internal::pacos); + + for (int i=0; i(-87,88); + data2[i] = internal::random(-87,88); + } + CHECK_CWISE1_IF(internal::packet_traits::HasExp, std::exp, internal::pexp); + { + data1[0] = std::numeric_limits::quiet_NaN(); + packet_helper::HasExp,Packet> h; + h.store(data2, internal::pexp(h.load(data1))); + VERIFY(isNaN(data2[0])); + } + + for (int i=0; i(0,1) * std::pow(Scalar(10), internal::random(-6,6)); + data2[i] = internal::random(0,1) * std::pow(Scalar(10), internal::random(-6,6)); + } + if(internal::random(0,1)<0.1) + data1[internal::random(0, PacketSize)] = 0; + CHECK_CWISE1_IF(internal::packet_traits::HasSqrt, std::sqrt, internal::psqrt); + CHECK_CWISE1_IF(internal::packet_traits::HasLog, std::log, internal::plog); + { + data1[0] = std::numeric_limits::quiet_NaN(); + packet_helper::HasLog,Packet> h; + h.store(data2, internal::plog(h.load(data1))); + VERIFY(isNaN(data2[0])); + data1[0] = -1.0f; + h.store(data2, internal::plog(h.load(data1))); + VERIFY(isNaN(data2[0])); +#if !EIGEN_FAST_MATH + h.store(data2, internal::psqrt(h.load(data1))); + VERIFY(isNaN(data2[0])); + VERIFY(isNaN(data2[1])); +#endif + } +} + +template void packetmath_notcomplex() +{ + using std::abs; + typedef typename internal::packet_traits::type Packet; + const int PacketSize = internal::packet_traits::size; + + EIGEN_ALIGN16 Scalar data1[internal::packet_traits::size*4]; + EIGEN_ALIGN16 Scalar data2[internal::packet_traits::size*4]; + EIGEN_ALIGN16 Scalar ref[internal::packet_traits::size*4]; + + Array::Map(data1, internal::packet_traits::size*4).setRandom(); + + ref[0] = data1[0]; + for (int i=0; i(data1))) && "internal::predux_min"); + + CHECK_CWISE2((std::min), internal::pmin); + CHECK_CWISE2((std::max), internal::pmax); + CHECK_CWISE1(abs, internal::pabs); + + ref[0] = data1[0]; + for (int i=0; i(data1))) && "internal::predux_max"); + + for (int i=0; i void test_conj_helper(Scalar* data1, Scalar* data2, Scalar* ref, Scalar* pval) +{ + typedef typename internal::packet_traits::type Packet; + const int PacketSize = internal::packet_traits::size; + + internal::conj_if cj0; + internal::conj_if cj1; + internal::conj_helper cj; + internal::conj_helper pcj; + + for(int i=0;i(data1),internal::pload(data2))); + VERIFY(areApprox(ref, pval, PacketSize) && "conj_helper pmul"); + + for(int i=0;i(data1),internal::pload(data2),internal::pload(pval))); + VERIFY(areApprox(ref, pval, PacketSize) && "conj_helper pmadd"); +} + +template void packetmath_complex() +{ + typedef typename internal::packet_traits::type Packet; + const int PacketSize = internal::packet_traits::size; + + const int size = PacketSize*4; + EIGEN_ALIGN16 Scalar data1[PacketSize*4]; + EIGEN_ALIGN16 Scalar data2[PacketSize*4]; + EIGEN_ALIGN16 Scalar ref[PacketSize*4]; + EIGEN_ALIGN16 Scalar pval[PacketSize*4]; + + for (int i=0; i() * Scalar(1e2); + data2[i] = internal::random() * Scalar(1e2); + } + + test_conj_helper (data1,data2,ref,pval); + test_conj_helper (data1,data2,ref,pval); + test_conj_helper (data1,data2,ref,pval); + test_conj_helper (data1,data2,ref,pval); + + { + for(int i=0;i(data1))); + VERIFY(areApprox(ref, pval, PacketSize) && "pcplxflip"); + } + + +} + +void test_packetmath() +{ + for(int i = 0; i < g_repeat; i++) { + CALL_SUBTEST_1( packetmath() ); + CALL_SUBTEST_2( packetmath() ); + CALL_SUBTEST_3( packetmath() ); + CALL_SUBTEST_1( packetmath >() ); + CALL_SUBTEST_2( packetmath >() ); + + CALL_SUBTEST_1( packetmath_notcomplex() ); + CALL_SUBTEST_2( packetmath_notcomplex() ); + CALL_SUBTEST_3( packetmath_notcomplex() ); + + CALL_SUBTEST_1( packetmath_real() ); + CALL_SUBTEST_2( packetmath_real() ); + + CALL_SUBTEST_1( packetmath_complex >() ); + CALL_SUBTEST_2( packetmath_complex >() ); + } +} -- cgit v1.2.3