compute/test/test_scan.cpp
2016-07-25 22:37:17 +02:00

491 lines
16 KiB
C++

//---------------------------------------------------------------------------//
// Copyright (c) 2013 Kyle Lutz <kyle.r.lutz@gmail.com>
//
// Distributed under the Boost Software License, Version 1.0
// See accompanying file LICENSE_1_0.txt or copy at
// http://www.boost.org/LICENSE_1_0.txt
//
// See http://boostorg.github.com/compute for more information.
//---------------------------------------------------------------------------//
// Undefining the BOOST_COMPUTE_USE_OFFLINE_CACHE macro, as we want to modify
// cached parameters for the scan algorithm without any undesirable
// consequences (like saving the modified values of those parameters).
#ifdef BOOST_COMPUTE_USE_OFFLINE_CACHE
#undef BOOST_COMPUTE_USE_OFFLINE_CACHE
#endif
#define BOOST_TEST_MODULE TestScan
#include <boost/test/unit_test.hpp>
#include <numeric>
#include <functional>
#include <vector>
#include <boost/compute/functional.hpp>
#include <boost/compute/lambda.hpp>
#include <boost/compute/system.hpp>
#include <boost/compute/command_queue.hpp>
#include <boost/compute/algorithm/copy.hpp>
#include <boost/compute/algorithm/exclusive_scan.hpp>
#include <boost/compute/algorithm/inclusive_scan.hpp>
#include <boost/compute/container/vector.hpp>
#include <boost/compute/iterator/counting_iterator.hpp>
#include <boost/compute/iterator/transform_iterator.hpp>
#include "check_macros.hpp"
#include "context_setup.hpp"
namespace bc = boost::compute;
// Runs inclusive_scan over the twelve ints 0..11, both into a separate
// result vector and in place. The same checks are then repeated with the
// cached "serial_scan_threshold" parameter set to 0.
BOOST_AUTO_TEST_CASE(inclusive_scan_int)
{
    using boost::compute::int_;
    using boost::compute::uint_;

    int_ data[] = { 0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11 };

    bc::vector<int_> vector(data, data + 12, queue);
    BOOST_CHECK_EQUAL(vector.size(), size_t(12));

    bc::vector<int_> result(12, context);
    BOOST_CHECK_EQUAL(result.size(), size_t(12));

    // out-of-place: vector -> result
    bc::inclusive_scan(vector.begin(), vector.end(), result.begin(), queue);
    CHECK_RANGE_EQUAL(int_, 12, result, (0, 1, 3, 6, 10, 15, 21, 28, 36, 45, 55, 66));

    // in-place: the input must still hold its original values at this point
    CHECK_RANGE_EQUAL(int_, 12, vector, (0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11));
    bc::inclusive_scan(vector.begin(), vector.end(), vector.begin(), queue);
    CHECK_RANGE_EQUAL(int_, 12, vector, (0, 1, 3, 6, 10, 15, 21, 28, 36, 45, 55, 66));

    // second pass (scan_on_cpu): reload the original input first
    bc::copy(data, data + 12, vector.begin(), queue);

    const std::string scan_key = "__boost_scan_cpu_4";
    boost::shared_ptr<bc::detail::parameter_cache> cache =
        bc::detail::parameter_cache::get_global_cache(device);

    // remember the current threshold so it can be put back at the end
    const uint_ saved_threshold =
        cache->get(scan_key, "serial_scan_threshold", 0);

    // threshold 0: intended to select the parallel scan_on_cpu path
    // instead of serial_scan
    cache->set(scan_key, "serial_scan_threshold", 0);

    // out-of-place
    bc::inclusive_scan(vector.begin(), vector.end(), result.begin(), queue);
    CHECK_RANGE_EQUAL(int_, 12, result, (0, 1, 3, 6, 10, 15, 21, 28, 36, 45, 55, 66));

    // in-place
    CHECK_RANGE_EQUAL(int_, 12, vector, (0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11));
    bc::inclusive_scan(vector.begin(), vector.end(), vector.begin(), queue);
    CHECK_RANGE_EQUAL(int_, 12, vector, (0, 1, 3, 6, 10, 15, 21, 28, 36, 45, 55, 66));

    // put the saved threshold back
    cache->set(scan_key, "serial_scan_threshold", saved_threshold);
}
// Runs exclusive_scan over the twelve ints 0..11, both into a separate
// result vector and in place. The same checks are then repeated with the
// cached "serial_scan_threshold" parameter set to 0.
BOOST_AUTO_TEST_CASE(exclusive_scan_int)
{
    using boost::compute::int_;
    using boost::compute::uint_;

    int_ data[] = { 0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11 };

    bc::vector<int_> vector(data, data + 12, queue);
    BOOST_CHECK_EQUAL(vector.size(), size_t(12));

    // result starts out zero-filled
    bc::vector<int_> result(size_t(12), int_(0), queue);
    BOOST_CHECK_EQUAL(result.size(), size_t(12));

    // out-of-place: vector -> result
    bc::exclusive_scan(vector.begin(), vector.end(), result.begin(), queue);
    CHECK_RANGE_EQUAL(int_, 12, result, (0, 0, 1, 3, 6, 10, 15, 21, 28, 36, 45, 55));

    // in-place: the input must still hold its original values at this point
    CHECK_RANGE_EQUAL(int_, 12, vector, (0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11));
    bc::exclusive_scan(vector.begin(), vector.end(), vector.begin(), queue);
    CHECK_RANGE_EQUAL(int_, 12, vector, (0, 0, 1, 3, 6, 10, 15, 21, 28, 36, 45, 55));

    // second pass (scan_on_cpu): reload the original input first
    bc::copy(data, data + 12, vector.begin(), queue);

    const std::string scan_key = "__boost_scan_cpu_4";
    boost::shared_ptr<bc::detail::parameter_cache> cache =
        bc::detail::parameter_cache::get_global_cache(device);

    // remember the current threshold so it can be put back at the end
    const uint_ saved_threshold =
        cache->get(scan_key, "serial_scan_threshold", 0);

    // threshold 0: intended to select the parallel scan_on_cpu path
    // instead of serial_scan
    cache->set(scan_key, "serial_scan_threshold", 0);

    // out-of-place
    bc::exclusive_scan(vector.begin(), vector.end(), result.begin(), queue);
    CHECK_RANGE_EQUAL(int_, 12, result, (0, 0, 1, 3, 6, 10, 15, 21, 28, 36, 45, 55));

    // in-place
    CHECK_RANGE_EQUAL(int_, 12, vector, (0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11));
    bc::exclusive_scan(vector.begin(), vector.end(), vector.begin(), queue);
    CHECK_RANGE_EQUAL(int_, 12, vector, (0, 0, 1, 3, 6, 10, 15, 21, 28, 36, 45, 55));

    // put the saved threshold back
    cache->set(scan_key, "serial_scan_threshold", saved_threshold);
}
// Runs inclusive_scan over five int2_ values (component-wise running sums),
// once with the cached scan parameters as found and once with
// "serial_scan_threshold" set to 0.
BOOST_AUTO_TEST_CASE(inclusive_scan_int2)
{
    using boost::compute::uint_;
    using boost::compute::int2_;

    // The host data is declared as int2_ values directly. Viewing an int_
    // array through a reinterpret_cast'ed int2_* is type punning that the
    // language does not guarantee to work; real int2_ objects avoid it.
    int2_ data[] = {
        int2_(1, 2),
        int2_(3, 4),
        int2_(5, 6),
        int2_(7, 8),
        int2_(9, 0)
    };

    boost::compute::vector<int2_> input(data, data + 5, queue);
    BOOST_CHECK_EQUAL(input.size(), size_t(5));

    boost::compute::vector<int2_> output(5, context);
    boost::compute::inclusive_scan(input.begin(), input.end(), output.begin(),
                                   queue);
    CHECK_RANGE_EQUAL(
        int2_, 5, output,
        (int2_(1, 2), int2_(4, 6), int2_(9, 12), int2_(16, 20), int2_(25, 20))
    );

    // scan_on_cpu
    // make sure parallel scan_on_cpu is used, no serial_scan
    std::string cache_key =
        "__boost_scan_cpu_8";
    boost::shared_ptr<bc::detail::parameter_cache> parameters =
        bc::detail::parameter_cache::get_global_cache(device);

    // save the current threshold so it can be restored below
    uint_ saved_threshold =
        parameters->get(cache_key, "serial_scan_threshold", 0);

    // force parallel scan_on_cpu
    parameters->set(cache_key, "serial_scan_threshold", 0);

    boost::compute::inclusive_scan(input.begin(), input.end(), output.begin(),
                                   queue);
    CHECK_RANGE_EQUAL(
        int2_, 5, output,
        (int2_(1, 2), int2_(4, 6), int2_(9, 12), int2_(16, 20), int2_(25, 20))
    );

    // restore
    parameters->set(cache_key, "serial_scan_threshold", saved_threshold);
}
// Runs inclusive_scan directly over the counting range [1, 11) and checks
// the ten running sums; repeated with the cached "serial_scan_threshold"
// parameter set to 0.
BOOST_AUTO_TEST_CASE(inclusive_scan_counting_iterator)
{
    using boost::compute::int_;
    using boost::compute::uint_;

    bc::vector<int_> result(10, context);

    bc::inclusive_scan(
        bc::make_counting_iterator(1), bc::make_counting_iterator(11),
        result.begin(), queue
    );
    CHECK_RANGE_EQUAL(int_, 10, result, (1, 3, 6, 10, 15, 21, 28, 36, 45, 55));

    // second pass (scan_on_cpu)
    const std::string scan_key = "__boost_scan_cpu_4";
    boost::shared_ptr<bc::detail::parameter_cache> cache =
        bc::detail::parameter_cache::get_global_cache(device);

    // remember the current threshold so it can be put back at the end
    const uint_ saved_threshold =
        cache->get(scan_key, "serial_scan_threshold", 0);

    // threshold 0: intended to select the parallel scan_on_cpu path
    // instead of serial_scan
    cache->set(scan_key, "serial_scan_threshold", 0);

    bc::inclusive_scan(
        bc::make_counting_iterator(1), bc::make_counting_iterator(11),
        result.begin(), queue
    );
    CHECK_RANGE_EQUAL(int_, 10, result, (1, 3, 6, 10, 15, 21, 28, 36, 45, 55));

    // put the saved threshold back
    cache->set(scan_key, "serial_scan_threshold", saved_threshold);
}
// Runs exclusive_scan directly over the counting range [1, 11) and checks
// the ten running sums; repeated with the cached "serial_scan_threshold"
// parameter set to 0.
BOOST_AUTO_TEST_CASE(exclusive_scan_counting_iterator)
{
    using boost::compute::int_;
    using boost::compute::uint_;

    bc::vector<int_> result(10, context);

    bc::exclusive_scan(
        bc::make_counting_iterator(1), bc::make_counting_iterator(11),
        result.begin(), queue
    );
    CHECK_RANGE_EQUAL(int_, 10, result, (0, 1, 3, 6, 10, 15, 21, 28, 36, 45));

    // second pass (scan_on_cpu)
    const std::string scan_key = "__boost_scan_cpu_4";
    boost::shared_ptr<bc::detail::parameter_cache> cache =
        bc::detail::parameter_cache::get_global_cache(device);

    // remember the current threshold so it can be put back at the end
    const uint_ saved_threshold =
        cache->get(scan_key, "serial_scan_threshold", 0);

    // threshold 0: intended to select the parallel scan_on_cpu path
    // instead of serial_scan
    cache->set(scan_key, "serial_scan_threshold", 0);

    bc::exclusive_scan(
        bc::make_counting_iterator(1), bc::make_counting_iterator(11),
        result.begin(), queue
    );
    CHECK_RANGE_EQUAL(int_, 10, result, (0, 1, 3, 6, 10, 15, 21, 28, 36, 45));

    // put the saved threshold back
    cache->set(scan_key, "serial_scan_threshold", saved_threshold);
}
// Scans five floats twice: once as they are, and once through a transform
// iterator that squares each element (pown(_1, 2)) before it is summed.
BOOST_AUTO_TEST_CASE(inclusive_scan_transform_iterator)
{
    float data[] = { 1.0f, 2.0f, 3.0f, 4.0f, 5.0f };
    bc::vector<float> input(data, data + 5, queue);
    bc::vector<float> output(5, context);

    // plain running sums of the input
    bc::inclusive_scan(input.begin(), input.end(), output.begin(), queue);
    queue.finish();

    const float plain_sums[] = { 1.0f, 3.0f, 6.0f, 10.0f, 15.0f };
    for(size_t i = 0; i < 5; i++){
        BOOST_CHECK_CLOSE(float(output[i]), plain_sums[i], 1e-4f);
    }

    // running sums of the squared input
    using ::boost::compute::_1;
    bc::inclusive_scan(
        bc::make_transform_iterator(input.begin(), pown(_1, 2)),
        bc::make_transform_iterator(input.end(), pown(_1, 2)),
        output.begin(), queue
    );
    queue.finish();

    const float squared_sums[] = { 1.0f, 5.0f, 14.0f, 30.0f, 55.0f };
    for(size_t i = 0; i < 5; i++){
        BOOST_CHECK_CLOSE(float(output[i]), squared_sums[i], 1e-4f);
    }
}
// Example code delimited by the "//! [inclusive_scan_int]" markers,
// followed by a check that the example yields the documented output.
BOOST_AUTO_TEST_CASE(inclusive_scan_doctest)
{
    //! [inclusive_scan_int]
    // input values, copied to the device
    int data[] = { 1, 2, 3, 4 };
    boost::compute::vector<int> input(data, data + 4, queue);

    // device storage for the four results
    boost::compute::vector<int> output(4, context);

    // compute the running sums
    boost::compute::inclusive_scan(input.begin(), input.end(),
                                   output.begin(), queue);

    // output = [ 1, 3, 6, 10 ]
    //! [inclusive_scan_int]

    CHECK_RANGE_EQUAL(int, 4, output, (1, 3, 6, 10));
}
// Example code delimited by the "//! [exclusive_scan_int]" markers,
// followed by a check that the example yields the documented output.
BOOST_AUTO_TEST_CASE(exclusive_scan_doctest)
{
    //! [exclusive_scan_int]
    // input values, copied to the device
    int data[] = { 1, 2, 3, 4 };
    boost::compute::vector<int> input(data, data + 4, queue);

    // device storage for the four results
    boost::compute::vector<int> output(4, context);

    // compute the running sums, each excluding its own element
    boost::compute::exclusive_scan(input.begin(), input.end(),
                                   output.begin(), queue);

    // output = [ 0, 1, 3, 6 ]
    //! [exclusive_scan_int]

    CHECK_RANGE_EQUAL(int, 4, output, (0, 1, 3, 6));
}
// inclusive_scan with multiplies<int> as the binary operation: the example
// between the "//!" markers, then size checks and an in-place repeat.
BOOST_AUTO_TEST_CASE(inclusive_scan_int_multiplies)
{
    //! [inclusive_scan_int_multiplies]
    // input values, copied to the device
    int data[] = { 1, 2, 1, 2, 3 };
    boost::compute::vector<int> input(data, data + 5, queue);

    // device storage for the five results
    boost::compute::vector<int> output(5, context);

    // running products instead of running sums
    boost::compute::inclusive_scan(input.begin(), input.end(), output.begin(),
                                   boost::compute::multiplies<int>(), queue);

    // output = [1, 2, 2, 4, 12]
    //! [inclusive_scan_int_multiplies]

    BOOST_CHECK_EQUAL(input.size(), size_t(5));
    BOOST_CHECK_EQUAL(output.size(), size_t(5));
    CHECK_RANGE_EQUAL(int, 5, output, (1, 2, 2, 4, 12));

    // in-place: input is unchanged before the scan and overwritten by it
    CHECK_RANGE_EQUAL(int, 5, input, (1, 2, 1, 2, 3));
    boost::compute::inclusive_scan(
        input.begin(), input.end(), input.begin(),
        boost::compute::multiplies<int>(), queue
    );
    CHECK_RANGE_EQUAL(int, 5, input, (1, 2, 2, 4, 12));
}
// exclusive_scan with an initial value of 10 and multiplies<int> as the
// binary operation: the example between the "//!" markers, then size checks
// and an in-place repeat.
BOOST_AUTO_TEST_CASE(exclusive_scan_int_multiplies)
{
    //! [exclusive_scan_int_multiplies]
    // input values, copied to the device
    int data[] = { 1, 2, 1, 2, 3 };
    boost::compute::vector<int> input(data, data + 5, queue);

    // device storage for the five results
    boost::compute::vector<int> output(5, context);

    // running products, seeded with the initial value 10
    boost::compute::exclusive_scan(input.begin(), input.end(), output.begin(),
                                   int(10), boost::compute::multiplies<int>(),
                                   queue);

    // output = [10, 10, 20, 20, 40]
    //! [exclusive_scan_int_multiplies]

    BOOST_CHECK_EQUAL(input.size(), size_t(5));
    BOOST_CHECK_EQUAL(output.size(), size_t(5));
    CHECK_RANGE_EQUAL(int, 5, output, (10, 10, 20, 20, 40));

    // in-place: input is unchanged before the scan and overwritten by it
    CHECK_RANGE_EQUAL(int, 5, input, (1, 2, 1, 2, 3));
    bc::exclusive_scan(
        input.begin(), input.end(), input.begin(),
        int(10), bc::multiplies<int>(), queue
    );
    CHECK_RANGE_EQUAL(int, 5, input, (10, 10, 20, 20, 40));
}
// In-place inclusive_scan with multiplies<int> over 1000 copies of 2,
// compared element by element against a reference computed on the host.
BOOST_AUTO_TEST_CASE(inclusive_scan_int_multiplies_long_vector)
{
    size_t size = 1000;

    bc::vector<int> device_vector(size, int(2), queue);
    BOOST_CHECK_EQUAL(device_vector.size(), size);

    bc::inclusive_scan(device_vector.begin(), device_vector.end(),
                       device_vector.begin(), bc::multiplies<int>(), queue);

    std::vector<int> host_vector(size, 2);
    BOOST_CHECK_EQUAL(host_vector.size(), size);
    bc::copy(device_vector.begin(), device_vector.end(),
             host_vector.begin(), queue);

    // The running product 2, 4, 8, ... leaves the range of int after 30
    // doublings, and signed overflow is undefined behaviour in C++. The
    // reference is therefore accumulated in unsigned arithmetic, which is
    // defined to wrap, and converted to int afterwards.
    // NOTE(review): this expects the device result to wrap the same way,
    // which the previous int-based reference also relied on implicitly.
    std::vector<bc::uint_> wrapped(size, bc::uint_(2));
    std::partial_sum(wrapped.begin(), wrapped.end(),
                     wrapped.begin(), std::multiplies<bc::uint_>());

    std::vector<int> test(size, 2);
    BOOST_CHECK_EQUAL(test.size(), size);
    for(size_t i = 0; i < size; i++){
        // out-of-range unsigned -> int conversion is implementation-defined
        // before C++20 (not undefined)
        test[i] = static_cast<int>(wrapped[i]);
    }

    BOOST_CHECK_EQUAL_COLLECTIONS(host_vector.begin(), host_vector.end(),
                                  test.begin(), test.end());
}
// In-place exclusive_scan with initial value 10 and multiplies<int> over
// 1000 copies of 2, compared element by element against a reference
// computed on the host.
BOOST_AUTO_TEST_CASE(exclusive_scan_int_multiplies_long_vector)
{
    size_t size = 1000;

    bc::vector<int> device_vector(size, int(2), queue);
    BOOST_CHECK_EQUAL(device_vector.size(), size);

    bc::exclusive_scan(device_vector.begin(), device_vector.end(),
                       device_vector.begin(), int(10), bc::multiplies<int>(),
                       queue);

    std::vector<int> host_vector(size, 2);
    BOOST_CHECK_EQUAL(host_vector.size(), size);
    bc::copy(device_vector.begin(), device_vector.end(),
             host_vector.begin(), queue);

    // The running product 10, 20, 40, ... leaves the range of int within the
    // first few dozen elements, and signed overflow is undefined behaviour
    // in C++. The reference is therefore accumulated in unsigned arithmetic,
    // which is defined to wrap, and converted to int afterwards.
    // NOTE(review): this expects the device result to wrap the same way,
    // which the previous int-based reference also relied on implicitly.
    std::vector<bc::uint_> wrapped(size, bc::uint_(2));
    // an inclusive product over [10, 2, 2, ...] equals the exclusive
    // product over [2, 2, 2, ...] seeded with 10
    wrapped[0] = 10;
    std::partial_sum(wrapped.begin(), wrapped.end(),
                     wrapped.begin(), std::multiplies<bc::uint_>());

    std::vector<int> test(size, 2);
    BOOST_CHECK_EQUAL(test.size(), size);
    for(size_t i = 0; i < size; i++){
        // out-of-range unsigned -> int conversion is implementation-defined
        // before C++20 (not undefined)
        test[i] = static_cast<int>(wrapped[i]);
    }

    BOOST_CHECK_EQUAL_COLLECTIONS(host_vector.begin(), host_vector.end(),
                                  test.begin(), test.end());
}
// inclusive_scan with a user-defined binary function (x * y * 2), checked
// both out-of-place and in-place.
BOOST_AUTO_TEST_CASE(inclusive_scan_int_custom_function)
{
    BOOST_COMPUTE_FUNCTION(int, multi, (int x, int y),
    {
        return x * y * 2;
    });

    int data[] = { 1, 2, 1, 2, 3 };

    bc::vector<int> vector(data, data + 5, queue);
    BOOST_CHECK_EQUAL(vector.size(), size_t(5));

    bc::vector<int> result(5, context);
    BOOST_CHECK_EQUAL(result.size(), size_t(5));

    // out-of-place: vector -> result
    bc::inclusive_scan(
        vector.begin(), vector.end(), result.begin(), multi, queue
    );
    CHECK_RANGE_EQUAL(int, 5, result, (1, 4, 8, 32, 192));

    // in-place: the input is unchanged before the scan and overwritten by it
    CHECK_RANGE_EQUAL(int, 5, vector, (1, 2, 1, 2, 3));
    bc::inclusive_scan(
        vector.begin(), vector.end(), vector.begin(), multi, queue
    );
    CHECK_RANGE_EQUAL(int, 5, vector, (1, 4, 8, 32, 192));
}
// exclusive_scan with initial value 1 and a user-defined binary function
// (x * y * 2), checked both out-of-place and in-place.
BOOST_AUTO_TEST_CASE(exclusive_scan_int_custom_function)
{
    BOOST_COMPUTE_FUNCTION(int, multi, (int x, int y),
    {
        return x * y * 2;
    });

    int data[] = { 1, 2, 1, 2, 3 };

    bc::vector<int> vector(data, data + 5, queue);
    BOOST_CHECK_EQUAL(vector.size(), size_t(5));

    bc::vector<int> result(5, context);
    BOOST_CHECK_EQUAL(result.size(), size_t(5));

    // out-of-place: vector -> result
    bc::exclusive_scan(
        vector.begin(), vector.end(), result.begin(), int(1), multi, queue
    );
    CHECK_RANGE_EQUAL(int, 5, result, (1, 2, 8, 16, 64));

    // in-place: the input is unchanged before the scan and overwritten by it
    CHECK_RANGE_EQUAL(int, 5, vector, (1, 2, 1, 2, 3));
    bc::exclusive_scan(
        vector.begin(), vector.end(), vector.begin(), int(1), multi, queue
    );
    CHECK_RANGE_EQUAL(int, 5, vector, (1, 2, 8, 16, 64));
}
// Closes the enclosing Boost.Test suite. The matching suite opener is not in
// this file; presumably it comes from "context_setup.hpp", which would also
// supply the `device`, `context` and `queue` used by the tests above
// (TODO confirm).
BOOST_AUTO_TEST_SUITE_END()