// test/blasutil.cpp - eigen - Git at Google

 // This file is part of Eigen, a lightweight C++ template library
 // for linear algebra.
 //
 // Copyright (C) 2020 Everton Constantino <everton.constantino@ibm.com>
 //
 // This Source Code Form is subject to the terms of the Mozilla
 // Public License v. 2.0. If a copy of the MPL was not distributed
 // with this file, You can obtain one at http://mozilla.org/MPL/2.0/

 #include "main.h"

 // Disable "ignoring attributes on template argument"
 // for packet_traits<Packet*>
 // => The only workaround would be to wrap _m128 and the likes
 //    within wrappers.
 #if EIGEN_GNUC_AT_LEAST(6,0)
     #pragma GCC diagnostic ignored "-Wignored-attributes"
 #endif

 // Linear-offset helpers for a 2-D buffer. Both macros read `StorageOrder` and
 // `stride` from the scope in which they are expanded, so they can only be used
 // where those two names are visible.
 //
 // GET(i,j): offset of element (i,j) -- i*stride + j when StorageOrder is
 // RowMajor, i + j*stride otherwise.
 #define GET(i,j) (StorageOrder == RowMajor ? (i)*stride + (j) : (i) + (j)*stride)
 // SCATTER(i,j,k): offset of the element k steps away from (i,j) along the
 // strided direction -- (i+k, j) when RowMajor, (i, j+k) otherwise.
 #define SCATTER(i,j,k) (StorageOrder == RowMajor ? ((i)+(k))*stride + (j) : (i) + ((j)+(k))*stride)

 /**
  * Checks that two packets hold the same values, lane by lane.
  *
  * Both packets are written to scratch buffers with an unaligned store, then
  * each of the internal::packet_traits<Scalar>::size entries is compared with
  * VERIFY_IS_EQUAL.
  *
  * \tparam Scalar element type; selects how many lanes are compared
  * \tparam Packet packet type of \a a and \a b
  * \param a first packet
  * \param b second packet
  */
 template<typename Scalar, typename Packet>
 void compare(const Packet& a, const Packet& b)
 {
     // The lane count is used as a compile-time constant here so the scratch
     // space can live on the stack: this helper is called from the innermost
     // test loops and used to pay two heap allocations per call.
     enum { PacketSize = internal::packet_traits<Scalar>::size };
     Scalar buffA[PacketSize];
     Scalar buffB[PacketSize];

     internal::pstoreu<Scalar, Packet>(buffA, a);
     internal::pstoreu<Scalar, Packet>(buffB, b);

     for(int i = 0; i < int(PacketSize); i++)
     {
         VERIFY_IS_EQUAL(buffA[i], buffB[i]);
     }
 }

 template<typename Scalar, int StorageOrder, int n>
 struct PacketBlockSet
 {
     typedef typename internal::packet_traits<Scalar>::type Packet;

     void setPacketBlock(internal::PacketBlock<Packet,n>& block, Scalar value)
     {
         for(int idx = 0; idx < n; idx++)
         {
             block.packet[idx] = internal::pset1<Packet>(value);
         }
     }

     void comparePacketBlock(Scalar *data, int i, int j, int stride, internal::PacketBlock<Packet, n>& block)
     {
         for(int idx = 0; idx < n; idx++)
         {
             Packet line = internal::ploadu<Packet>(data + SCATTER(i,j,idx));
             compare<Scalar, Packet>(block.packet[idx], line);
         }
     }
 };

 template<typename Scalar, int StorageOrder, int BlockSize>
 void run_bdmp_spec_1()
 {
     typedef internal::blas_data_mapper<Scalar, int, StorageOrder> BlasDataMapper;
     int packetSize = internal::packet_traits<Scalar>::size;
     int minSize = std::max<int>(packetSize, BlockSize);
     typedef typename internal::packet_traits<Scalar>::type Packet;

     int szm = internal::random<int>(minSize,500), szn = internal::random<int>(minSize,500);
     int stride = StorageOrder == RowMajor ? szn : szm;
     Scalar *d = new Scalar[szn*szm];

     // Initializing with random entries
     for(int i = 0; i < szm*szn; i++)
     {
         d[i] = internal::random<Scalar>(static_cast<Scalar>(3), static_cast<Scalar>(10));
     }

     BlasDataMapper bdm(d, stride);

     // Testing operator()
     for(int i = 0; i < szm; i++)
     {
         for(int j = 0; j < szn; j++)
         {
             VERIFY_IS_EQUAL(d[GET(i,j)], bdm(i,j));
         }
     }

     // Testing getSubMapper and getLinearMapper
     int i0 = internal::random<int>(0,szm-2);
     int j0 = internal::random<int>(0,szn-2);
     for(int i = i0; i < szm; i++)
     {
         for(int j = j0; j < szn; j++)
         {
             const BlasDataMapper& bdmSM = bdm.getSubMapper(i0,j0);
             const internal::BlasLinearMapper<Scalar, int, 0>& bdmLM = bdm.getLinearMapper(i0,j0);

             Scalar v = bdmSM(i - i0, j - j0);
             Scalar vd = d[GET(i,j)];
             VERIFY_IS_EQUAL(vd, v);
             VERIFY_IS_EQUAL(vd, bdmLM(GET(i-i0, j-j0)));
         }
     }

     // Testing loadPacket
     for(int i = 0; i < szm - minSize; i++)
     {
         for(int j = 0; j < szn - minSize; j++)
         {
             Packet pktBDM = bdm.template loadPacket<Packet>(i,j);
             Packet pktD = internal::ploadu<Packet>(d + GET(i,j));

             compare<Scalar, Packet>(pktBDM, pktD);
         }
     }

     // Testing gatherPacket
     Scalar *buff = new Scalar[packetSize];
     for(int i = 0; i < szm - minSize; i++)
     {
         for(int j = 0; j < szn - minSize; j++)
         {
             Packet p = bdm.template gatherPacket<Packet>(i,j);
             internal::pstoreu<Scalar, Packet>(buff, p);

             for(int k = 0; k < packetSize; k++)
             {
                 VERIFY_IS_EQUAL(d[SCATTER(i,j,k)], buff[k]);
             }

         }
     }
     delete[] buff;

     // Testing scatterPacket
     for(int i = 0; i < szm - minSize; i++)
     {
         for(int j = 0; j < szn - minSize; j++)
         {
             Packet p = internal::pset1<Packet>(static_cast<Scalar>(1));
             bdm.template scatterPacket<Packet>(i,j,p);
             for(int k = 0; k < packetSize; k++)
             {
                 VERIFY_IS_EQUAL(d[SCATTER(i,j,k)], static_cast<Scalar>(1));
             }
         }
     }

     //Testing storePacketBlock
     internal::PacketBlock<Packet, BlockSize> block;

     PacketBlockSet<Scalar, StorageOrder, BlockSize> pbs;
     pbs.setPacketBlock(block, static_cast<Scalar>(2));

     for(int i = 0; i < szm - minSize; i++)
     {
         for(int j = 0; j < szn - minSize; j++)
         {
             bdm.template storePacketBlock<Packet, BlockSize>(i, j, block);

             pbs.comparePacketBlock(d, i, j, stride, block);
         }
     }

     delete[] d;
 }

 /** Runs run_bdmp_spec_1 for one block size: row-major first, then column-major. */
 template<typename Scalar, int BlockSize>
 void run_bdmp_spec_1_both_orders()
 {
     run_bdmp_spec_1<Scalar, RowMajor, BlockSize>();
     run_bdmp_spec_1<Scalar, ColMajor, BlockSize>();
 }

 /**
  * Runs the data-mapper checks for \a Scalar with block sizes 1, 2, 4, 8 and 16,
  * each in both storage orders.
  */
 template<typename Scalar>
 void run_test()
 {
     run_bdmp_spec_1_both_orders<Scalar, 1>();
     run_bdmp_spec_1_both_orders<Scalar, 2>();
     run_bdmp_spec_1_both_orders<Scalar, 4>();
     run_bdmp_spec_1_both_orders<Scalar, 8>();
     run_bdmp_spec_1_both_orders<Scalar, 16>();
 }

 // Test entry point: runs the data-mapper checks g_repeat times for the 8-, 16-
 // and 32-bit integer types, a 64-bit-capable integer type, float, double and
 // their std::complex counterparts.
 EIGEN_DECLARE_TEST(blasutil)
 {
     for(int i = 0; i < g_repeat; i++)
     {
         CALL_SUBTEST_1(run_test<numext::int8_t>());
         CALL_SUBTEST_2(run_test<numext::int16_t>());
         CALL_SUBTEST_3(run_test<numext::int32_t>());

 // TODO: Replace this by a call to numext::int64_t as soon as we have a way to
 // detect the typedef for int64_t on all platforms
 #if EIGEN_HAS_CXX11
         CALL_SUBTEST_4(run_test<signed long long>());
 #else
         CALL_SUBTEST_4(run_test<signed long>());
 #endif

         // Use float/double directly: float_t and double_t are the C library's
         // evaluation-format typedefs and may name wider types (e.g. long double)
         // depending on FLT_EVAL_METHOD, in which case float and double would
         // not be the types under test.
         CALL_SUBTEST_5(run_test<float>());
         CALL_SUBTEST_6(run_test<double>());
         CALL_SUBTEST_7(run_test<std::complex<float> >());
         CALL_SUBTEST_8(run_test<std::complex<double> >());
     }
 }
	// This file is part of Eigen, a lightweight C++ template library
	// for linear algebra.
	//
	// Copyright (C) 2020 Everton Constantino <everton.constantino@ibm.com>
	//
	// This Source Code Form is subject to the terms of the Mozilla
	// Public License v. 2.0. If a copy of the MPL was not distributed
	// with this file, You can obtain one at http://mozilla.org/MPL/2.0/

	#include "main.h"

	// Disable "ignoring attributes on template argument"
	// for packet_traits<Packet*>
	// => The only workaround would be to wrap _m128 and the likes
	// within wrappers.
	#if EIGEN_GNUC_AT_LEAST(6,0)
	#pragma GCC diagnostic ignored "-Wignored-attributes"
	#endif

	// Linear-offset helpers for a 2-D buffer. Both macros read `StorageOrder` and
	// `stride` from the scope in which they are expanded, so they can only be used
	// where those two names are visible.
	//
	// GET(i,j): offset of element (i,j) -- i*stride + j when StorageOrder is
	// RowMajor, i + j*stride otherwise.
	#define GET(i,j) (StorageOrder == RowMajor ? (i)*stride + (j) : (i) + (j)*stride)
	// SCATTER(i,j,k): offset of the element k steps away from (i,j) along the
	// strided direction -- (i+k, j) when RowMajor, (i, j+k) otherwise.
	#define SCATTER(i,j,k) (StorageOrder == RowMajor ? ((i)+(k))*stride + (j) : (i) + ((j)+(k))*stride)

	/**
	 * Checks that two packets hold the same values, lane by lane.
	 *
	 * Both packets are written to scratch buffers with an unaligned store, then
	 * each of the internal::packet_traits<Scalar>::size entries is compared with
	 * VERIFY_IS_EQUAL.
	 *
	 * \tparam Scalar element type; selects how many lanes are compared
	 * \tparam Packet packet type of \a a and \a b
	 * \param a first packet
	 * \param b second packet
	 */
	template<typename Scalar, typename Packet>
	void compare(const Packet& a, const Packet& b)
	{
	    // The lane count is used as a compile-time constant here so the scratch
	    // space can live on the stack: this helper is called from the innermost
	    // test loops and used to pay two heap allocations per call.
	    enum { PacketSize = internal::packet_traits<Scalar>::size };
	    Scalar buffA[PacketSize];
	    Scalar buffB[PacketSize];

	    internal::pstoreu<Scalar, Packet>(buffA, a);
	    internal::pstoreu<Scalar, Packet>(buffB, b);

	    for(int i = 0; i < int(PacketSize); i++)
	    {
	        VERIFY_IS_EQUAL(buffA[i], buffB[i]);
	    }
	}

	template<typename Scalar, int StorageOrder, int n>
	struct PacketBlockSet
	{
	typedef typename internal::packet_traits<Scalar>::type Packet;

	void setPacketBlock(internal::PacketBlock<Packet,n>& block, Scalar value)
	{
	for(int idx = 0; idx < n; idx++)
	{
	block.packet[idx] = internal::pset1<Packet>(value);
	}
	}

	void comparePacketBlock(Scalar *data, int i, int j, int stride, internal::PacketBlock<Packet, n>& block)
	{
	for(int idx = 0; idx < n; idx++)
	{
	Packet line = internal::ploadu<Packet>(data + SCATTER(i,j,idx));
	compare<Scalar, Packet>(block.packet[idx], line);
	}
	}
	};

	template<typename Scalar, int StorageOrder, int BlockSize>
	void run_bdmp_spec_1()
	{
	typedef internal::blas_data_mapper<Scalar, int, StorageOrder> BlasDataMapper;
	int packetSize = internal::packet_traits<Scalar>::size;
	int minSize = std::max<int>(packetSize, BlockSize);
	typedef typename internal::packet_traits<Scalar>::type Packet;

	int szm = internal::random<int>(minSize,500), szn = internal::random<int>(minSize,500);
	int stride = StorageOrder == RowMajor ? szn : szm;
	Scalar d = new Scalar[sznszm];

	// Initializing with random entries
	for(int i = 0; i < szm*szn; i++)
	{
	d[i] = internal::random<Scalar>(static_cast<Scalar>(3), static_cast<Scalar>(10));
	}

	BlasDataMapper bdm(d, stride);

	// Testing operator()
	for(int i = 0; i < szm; i++)
	{
	for(int j = 0; j < szn; j++)
	{
	VERIFY_IS_EQUAL(d[GET(i,j)], bdm(i,j));
	}
	}

	// Testing getSubMapper and getLinearMapper
	int i0 = internal::random<int>(0,szm-2);
	int j0 = internal::random<int>(0,szn-2);
	for(int i = i0; i < szm; i++)
	{
	for(int j = j0; j < szn; j++)
	{
	const BlasDataMapper& bdmSM = bdm.getSubMapper(i0,j0);
	const internal::BlasLinearMapper<Scalar, int, 0>& bdmLM = bdm.getLinearMapper(i0,j0);

	Scalar v = bdmSM(i - i0, j - j0);
	Scalar vd = d[GET(i,j)];
	VERIFY_IS_EQUAL(vd, v);
	VERIFY_IS_EQUAL(vd, bdmLM(GET(i-i0, j-j0)));
	}
	}

	// Testing loadPacket
	for(int i = 0; i < szm - minSize; i++)
	{
	for(int j = 0; j < szn - minSize; j++)
	{
	Packet pktBDM = bdm.template loadPacket<Packet>(i,j);
	Packet pktD = internal::ploadu<Packet>(d + GET(i,j));

	compare<Scalar, Packet>(pktBDM, pktD);
	}
	}

	// Testing gatherPacket
	Scalar *buff = new Scalar[packetSize];
	for(int i = 0; i < szm - minSize; i++)
	{
	for(int j = 0; j < szn - minSize; j++)
	{
	Packet p = bdm.template gatherPacket<Packet>(i,j);
	internal::pstoreu<Scalar, Packet>(buff, p);

	for(int k = 0; k < packetSize; k++)
	{
	VERIFY_IS_EQUAL(d[SCATTER(i,j,k)], buff[k]);
	}

	}
	}
	delete[] buff;

	// Testing scatterPacket
	for(int i = 0; i < szm - minSize; i++)
	{
	for(int j = 0; j < szn - minSize; j++)
	{
	Packet p = internal::pset1<Packet>(static_cast<Scalar>(1));
	bdm.template scatterPacket<Packet>(i,j,p);
	for(int k = 0; k < packetSize; k++)
	{
	VERIFY_IS_EQUAL(d[SCATTER(i,j,k)], static_cast<Scalar>(1));
	}
	}
	}

	//Testing storePacketBlock
	internal::PacketBlock<Packet, BlockSize> block;

	PacketBlockSet<Scalar, StorageOrder, BlockSize> pbs;
	pbs.setPacketBlock(block, static_cast<Scalar>(2));

	for(int i = 0; i < szm - minSize; i++)
	{
	for(int j = 0; j < szn - minSize; j++)
	{
	bdm.template storePacketBlock<Packet, BlockSize>(i, j, block);

	pbs.comparePacketBlock(d, i, j, stride, block);
	}
	}

	delete[] d;
	}

	/** Runs run_bdmp_spec_1 for one block size: row-major first, then column-major. */
	template<typename Scalar, int BlockSize>
	void run_bdmp_spec_1_both_orders()
	{
	    run_bdmp_spec_1<Scalar, RowMajor, BlockSize>();
	    run_bdmp_spec_1<Scalar, ColMajor, BlockSize>();
	}

	/**
	 * Runs the data-mapper checks for \a Scalar with block sizes 1, 2, 4, 8 and 16,
	 * each in both storage orders.
	 */
	template<typename Scalar>
	void run_test()
	{
	    run_bdmp_spec_1_both_orders<Scalar, 1>();
	    run_bdmp_spec_1_both_orders<Scalar, 2>();
	    run_bdmp_spec_1_both_orders<Scalar, 4>();
	    run_bdmp_spec_1_both_orders<Scalar, 8>();
	    run_bdmp_spec_1_both_orders<Scalar, 16>();
	}

	// Test entry point: runs the data-mapper checks g_repeat times for the 8-, 16-
	// and 32-bit integer types, a 64-bit-capable integer type, float, double and
	// their std::complex counterparts.
	EIGEN_DECLARE_TEST(blasutil)
	{
	    for(int i = 0; i < g_repeat; i++)
	    {
	        CALL_SUBTEST_1(run_test<numext::int8_t>());
	        CALL_SUBTEST_2(run_test<numext::int16_t>());
	        CALL_SUBTEST_3(run_test<numext::int32_t>());

	// TODO: Replace this by a call to numext::int64_t as soon as we have a way to
	// detect the typedef for int64_t on all platforms
	#if EIGEN_HAS_CXX11
	        CALL_SUBTEST_4(run_test<signed long long>());
	#else
	        CALL_SUBTEST_4(run_test<signed long>());
	#endif

	        // Use float/double directly: float_t and double_t are the C library's
	        // evaluation-format typedefs and may name wider types (e.g. long double)
	        // depending on FLT_EVAL_METHOD, in which case float and double would
	        // not be the types under test.
	        CALL_SUBTEST_5(run_test<float>());
	        CALL_SUBTEST_6(run_test<double>());
	        CALL_SUBTEST_7(run_test<std::complex<float> >());
	        CALL_SUBTEST_8(run_test<std::complex<double> >());
	    }
	}