LIVE / thrust /testing /tuple_scan.cu
Xu Ma
update
1c3c0d9
raw
history blame
2.34 kB
#include <unittest/unittest.h>
#include <thrust/tuple.h>
#include <thrust/scan.h>
#include <thrust/transform.h>
#if THRUST_DEVICE_SYSTEM == THRUST_DEVICE_SYSTEM_CUDA
#include <unittest/cuda/testframework.h>
#endif
using namespace unittest;
struct SumTupleFunctor
{
template <typename Tuple>
__host__ __device__
Tuple operator()(const Tuple &lhs, const Tuple &rhs)
{
using thrust::get;
return thrust::make_tuple(get<0>(lhs) + get<0>(rhs),
get<1>(lhs) + get<1>(rhs));
}
};
struct MakeTupleFunctor
{
template<typename T1, typename T2>
__host__ __device__
thrust::tuple<T1,T2> operator()(T1 &lhs, T2 &rhs)
{
return thrust::make_tuple(lhs, rhs);
}
};
template <typename T>
struct TestTupleScan
{
void operator()(const size_t n)
{
using namespace thrust;
host_vector<T> h_t1 = unittest::random_integers<T>(n);
host_vector<T> h_t2 = unittest::random_integers<T>(n);
// initialize input
host_vector< tuple<T,T> > h_input(n);
transform(h_t1.begin(), h_t1.end(), h_t2.begin(), h_input.begin(), MakeTupleFunctor());
device_vector< tuple<T,T> > d_input = h_input;
// allocate output
tuple<T,T> zero(0,0);
host_vector < tuple<T,T> > h_output(n, zero);
device_vector< tuple<T,T> > d_output(n, zero);
// inclusive_scan
inclusive_scan(h_input.begin(), h_input.end(), h_output.begin(), SumTupleFunctor());
inclusive_scan(d_input.begin(), d_input.end(), d_output.begin(), SumTupleFunctor());
ASSERT_EQUAL_QUIET(h_output, d_output);
// The tests below get miscompiled on Tesla hw for 8b types
#if THRUST_DEVICE_SYSTEM == THRUST_DEVICE_SYSTEM_CUDA
if(const CUDATestDriver *driver = dynamic_cast<const CUDATestDriver*>(&UnitTestDriver::s_driver()))
{
if(sizeof(T) == sizeof(unittest::uint8_t) && driver->current_device_architecture() < 200)
{
KNOWN_FAILURE;
} // end if
} // end if
#endif
// exclusive_scan
tuple<T,T> init(13,17);
exclusive_scan(h_input.begin(), h_input.end(), h_output.begin(), init, SumTupleFunctor());
exclusive_scan(d_input.begin(), d_input.end(), d_output.begin(), init, SumTupleFunctor());
ASSERT_EQUAL_QUIET(h_output, d_output);
}
};
VariableUnitTest<TestTupleScan, IntegralTypes> TestTupleScanInstance;