compute/test/test_merge_sort_gpu.cpp
2016-07-10 18:38:23 +02:00

375 lines
10 KiB
C++

//---------------------------------------------------------------------------//
// Copyright (c) 2016 Jakub Szuppe <j.szuppe@gmail.com>
//
// Distributed under the Boost Software License, Version 1.0
// See accompanying file LICENSE_1_0.txt or copy at
// http://www.boost.org/LICENSE_1_0.txt
//
// See http://boostorg.github.com/compute for more information.
//---------------------------------------------------------------------------//
#define BOOST_TEST_MODULE TestMergeSortOnGPU
#include <boost/test/unit_test.hpp>
#include <iostream>
#include <boost/compute/system.hpp>
#include <boost/compute/algorithm/is_sorted.hpp>
#include <boost/compute/algorithm/detail/merge_sort_on_gpu.hpp>
#include <boost/compute/container/vector.hpp>
#include "quirks.hpp"
#include "check_macros.hpp"
#include "context_setup.hpp"
namespace bc = boost::compute;
BOOST_AUTO_TEST_CASE(sort_small_vector_char)
{
if(is_apple_cpu_device(device)) {
std::cerr
<< "skipping all merge_sort_on_gpu tests due to Apple platform"
<< " behavior when local memory is used on a CPU device"
<< std::endl;
return;
}
using boost::compute::char_;
::boost::compute::greater<char_> greater;
::boost::compute::less<char_> less;
char_ data[] = { 'c', 'a', '0', '7', 'B', 'F', '\0', '$' };
boost::compute::vector<char_> vector(data, data + 8, queue);
BOOST_CHECK_EQUAL(vector.size(), size_t(8));
BOOST_CHECK(boost::compute::is_sorted(vector.begin(), vector.end(), queue) == false);
// <
boost::compute::detail::merge_sort_on_gpu(
vector.begin(), vector.end(), less, queue
);
BOOST_CHECK(
boost::compute::is_sorted(vector.begin(), vector.end(), less, queue)
);
CHECK_RANGE_EQUAL(char_, 8, vector, ('\0', '$', '0', '7', 'B', 'F', 'a', 'c'));
// >
boost::compute::detail::merge_sort_on_gpu(
vector.begin(), vector.end(), greater, queue
);
BOOST_CHECK(
boost::compute::is_sorted(vector.begin(), vector.end(), greater, queue)
);
CHECK_RANGE_EQUAL(char_, 8, vector, ('c', 'a', 'F', 'B', '7', '0', '$', '\0'));
}
BOOST_AUTO_TEST_CASE(sort_mid_vector_int)
{
if(is_apple_cpu_device(device)) {
return;
}
using boost::compute::int_;
::boost::compute::greater<int_> greater;
::boost::compute::less<int_> less;
const int_ size = 748;
std::vector<int_> data(size);
for(int_ i = 0; i < size; i++){
data[i] = i%2 ? i : -i;
}
boost::compute::vector<int_> vector(data.begin(), data.end(), queue);
BOOST_CHECK_EQUAL(vector.size(), size);
BOOST_CHECK(!boost::compute::is_sorted(vector.begin(), vector.end(), queue));
// <
boost::compute::detail::merge_sort_on_gpu(
vector.begin(), vector.end(), less, queue
);
BOOST_CHECK(
boost::compute::is_sorted(vector.begin(), vector.end(), less, queue)
);
// >
boost::compute::detail::merge_sort_on_gpu(
vector.begin(), vector.end(), greater, queue
);
BOOST_CHECK(
boost::compute::is_sorted(vector.begin(), vector.end(), greater, queue)
);
}
BOOST_AUTO_TEST_CASE(sort_mid_vector_ulong)
{
if(is_apple_cpu_device(device)) {
return;
}
using boost::compute::ulong_;
::boost::compute::greater<ulong_> greater;
::boost::compute::less<ulong_> less;
const ulong_ size = 260;
std::vector<ulong_> data(size);
for(ulong_ i = 0; i < size; i++){
data[i] = i%2 ? i : i * i;
}
boost::compute::vector<ulong_> vector(data.begin(), data.end(), queue);
BOOST_CHECK_EQUAL(vector.size(), size);
BOOST_CHECK(!boost::compute::is_sorted(vector.begin(), vector.end(), queue));
// <
boost::compute::detail::merge_sort_on_gpu(
vector.begin(), vector.end(), less, queue
);
BOOST_CHECK(
boost::compute::is_sorted(vector.begin(), vector.end(), less, queue)
);
// >
boost::compute::detail::merge_sort_on_gpu(
vector.begin(), vector.end(), greater, queue
);
BOOST_CHECK(
boost::compute::is_sorted(vector.begin(), vector.end(), greater, queue)
);
}
BOOST_AUTO_TEST_CASE(sort_mid_vector_float)
{
if(is_apple_cpu_device(device)) {
return;
}
using boost::compute::float_;
::boost::compute::greater<float_> greater;
::boost::compute::less<float_> less;
const int size = 513;
std::vector<float_> data(size);
for(int i = 0; i < size; i++){
data[i] = float_(i%2 ? i : -i);
}
boost::compute::vector<float_> vector(data.begin(), data.end(), queue);
BOOST_CHECK_EQUAL(vector.size(), size);
BOOST_CHECK(!boost::compute::is_sorted(vector.begin(), vector.end(), queue));
// <
boost::compute::detail::merge_sort_on_gpu(
vector.begin(), vector.end(), less, queue
);
BOOST_CHECK(
boost::compute::is_sorted(vector.begin(), vector.end(), less, queue)
);
// >
boost::compute::detail::merge_sort_on_gpu(
vector.begin(), vector.end(), greater, queue
);
queue.finish();
BOOST_CHECK(
boost::compute::is_sorted(vector.begin(), vector.end(), greater, queue)
);
}
BOOST_AUTO_TEST_CASE(sort_mid_vector_double)
{
if(is_apple_cpu_device(device)) {
return;
}
if(!device.supports_extension("cl_khr_fp64")){
std::cout << "skipping test: device does not support double" << std::endl;
return;
}
using boost::compute::double_;
::boost::compute::greater<double_> greater;
::boost::compute::less<double_> less;
const int size = 1023;
std::vector<double_> data(size);
for(int i = 0; i < size; i++){
data[i] = double_(i%2 ? i : -i);
}
boost::compute::vector<double_> vector(data.begin(), data.end(), queue);
BOOST_CHECK_EQUAL(vector.size(), size);
BOOST_CHECK(!boost::compute::is_sorted(vector.begin(), vector.end(), queue));
// <
boost::compute::detail::merge_sort_on_gpu(
vector.begin(), vector.end(), less, queue
);
BOOST_CHECK(
boost::compute::is_sorted(vector.begin(), vector.end(), less, queue)
);
// >
boost::compute::detail::merge_sort_on_gpu(
vector.begin(), vector.end(), greater, queue
);
queue.finish();
BOOST_CHECK(
boost::compute::is_sorted(vector.begin(), vector.end(), greater, queue)
);
}
BOOST_AUTO_TEST_CASE(sort_mid_vector_int_custom_comparison_func)
{
if(is_apple_cpu_device(device)) {
return;
}
using boost::compute::int_;
::boost::compute::greater<int_> greater;
::boost::compute::less<int_> less;
const int_ size = 1024;
std::vector<int_> data(size);
for(int_ i = 0; i < size; i++){
data[i] = i%2 ? size - i : i - size;
}
BOOST_COMPUTE_FUNCTION(bool, abs_sort, (int_ a, int_ b),
{
return abs(a) < abs(b);
});
boost::compute::vector<int_> vector(data.begin(), data.end(), queue);
BOOST_CHECK_EQUAL(vector.size(), size);
BOOST_CHECK(
!boost::compute::is_sorted(vector.begin(), vector.end(), abs_sort, queue)
);
boost::compute::detail::merge_sort_on_gpu(
vector.begin(), vector.end(), abs_sort, queue
);
BOOST_CHECK(
boost::compute::is_sorted(vector.begin(), vector.end(), abs_sort, queue)
);
}
BOOST_AUTO_TEST_CASE(sort_mid_vector_int2)
{
if(is_apple_cpu_device(device)) {
return;
}
using boost::compute::int2_;
using boost::compute::int_;
::boost::compute::greater<int2_> greater;
::boost::compute::less<int2_> less;
const int_ size = 1024;
std::vector<int2_> data(size);
for(int_ i = 0; i < size; i++){
data[i] = i%2 ? int2_(i, i) : int2_(i - size, i - size);
}
BOOST_COMPUTE_FUNCTION(bool, abs_sort, (int2_ a, int2_ b),
{
return abs(a.x + a.y) < abs(b.x + b.y);
});
boost::compute::vector<int2_> vector(data.begin(), data.end(), queue);
BOOST_CHECK_EQUAL(vector.size(), size);
BOOST_CHECK(
!boost::compute::is_sorted(vector.begin(), vector.end(), abs_sort, queue)
);
boost::compute::detail::merge_sort_on_gpu(
vector.begin(), vector.end(), abs_sort, queue
);
BOOST_CHECK(
boost::compute::is_sorted(vector.begin(), vector.end(), abs_sort, queue)
);
}
BOOST_AUTO_TEST_CASE(sort_mid_vector_long8)
{
if(is_apple_cpu_device(device)) {
return;
}
using boost::compute::long8_;
using boost::compute::long_;
::boost::compute::greater<long8_> greater;
::boost::compute::less<long8_> less;
const long_ size = 256;
std::vector<long8_> data(size);
for(long_ i = 0; i < size; i++){
data[i] = i%2 ? long8_(i) : long8_(i * i);
}
BOOST_COMPUTE_FUNCTION(bool, comp, (long8_ a, long8_ b),
{
return a.s0 < b.s3;
});
boost::compute::vector<long8_> vector(data.begin(), data.end(), queue);
BOOST_CHECK_EQUAL(vector.size(), size);
BOOST_CHECK(
!boost::compute::is_sorted(vector.begin(), vector.end(), comp, queue)
);
boost::compute::detail::merge_sort_on_gpu(
vector.begin(), vector.end(), comp, queue
);
BOOST_CHECK(
boost::compute::is_sorted(vector.begin(), vector.end(), comp, queue)
);
}
BOOST_AUTO_TEST_CASE(stable_sort_vector_int2)
{
if(is_apple_cpu_device(device)) {
return;
}
using boost::compute::int2_;
int2_ data[] = {
int2_(8, 3), int2_(5, 1),
int2_(2, 1), int2_(6, 1),
int2_(8, 1), int2_(7, 1),
int2_(4, 1), int2_(8, 2)
};
BOOST_COMPUTE_FUNCTION(bool, comp, (int2_ a, int2_ b),
{
return a.x < b.x;
});
boost::compute::vector<int2_> vector(data, data + 8, queue);
BOOST_CHECK_EQUAL(vector.size(), 8);
BOOST_CHECK(
!boost::compute::is_sorted(vector.begin(), vector.end(), comp, queue)
);
//
boost::compute::detail::merge_sort_on_gpu(
vector.begin(), vector.end(), comp, true /*stable*/, queue
);
BOOST_CHECK(
boost::compute::is_sorted(vector.begin(), vector.end(), comp, queue)
);
CHECK_RANGE_EQUAL(
int2_, 8, vector,
(
int2_(2, 1), int2_(4, 1),
int2_(5, 1), int2_(6, 1),
int2_(7, 1), int2_(8, 3),
int2_(8, 1), int2_(8, 2)
)
);
}
BOOST_AUTO_TEST_SUITE_END()