diff options
Diffstat (limited to 'src/boost/libs/compute/test/test_scan.cpp')
-rw-r--r-- | src/boost/libs/compute/test/test_scan.cpp | 490 |
1 files changed, 490 insertions, 0 deletions
diff --git a/src/boost/libs/compute/test/test_scan.cpp b/src/boost/libs/compute/test/test_scan.cpp new file mode 100644 index 00000000..1504ea06 --- /dev/null +++ b/src/boost/libs/compute/test/test_scan.cpp @@ -0,0 +1,490 @@ +//---------------------------------------------------------------------------// +// Copyright (c) 2013 Kyle Lutz <kyle.r.lutz@gmail.com> +// +// Distributed under the Boost Software License, Version 1.0 +// See accompanying file LICENSE_1_0.txt or copy at +// http://www.boost.org/LICENSE_1_0.txt +// +// See http://boostorg.github.com/compute for more information. +//---------------------------------------------------------------------------// + +// Undefining BOOST_COMPUTE_USE_OFFLINE_CACHE macro as we want to modify cached +// parameters for copy algorithm without any undesirable consequences (like +// saving modified values of those parameters). +#ifdef BOOST_COMPUTE_USE_OFFLINE_CACHE + #undef BOOST_COMPUTE_USE_OFFLINE_CACHE +#endif + +#define BOOST_TEST_MODULE TestScan +#include <boost/test/unit_test.hpp> + +#include <numeric> +#include <functional> +#include <vector> + +#include <boost/compute/functional.hpp> +#include <boost/compute/lambda.hpp> +#include <boost/compute/system.hpp> +#include <boost/compute/command_queue.hpp> +#include <boost/compute/algorithm/copy.hpp> +#include <boost/compute/algorithm/exclusive_scan.hpp> +#include <boost/compute/algorithm/inclusive_scan.hpp> +#include <boost/compute/container/vector.hpp> +#include <boost/compute/iterator/counting_iterator.hpp> +#include <boost/compute/iterator/transform_iterator.hpp> + +#include "check_macros.hpp" +#include "context_setup.hpp" + +namespace bc = boost::compute; + +BOOST_AUTO_TEST_CASE(inclusive_scan_int) +{ + using boost::compute::uint_; + using boost::compute::int_; + + int_ data[] = { 0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11 }; + bc::vector<int_> vector(data, data + 12, queue); + BOOST_CHECK_EQUAL(vector.size(), size_t(12)); + + bc::vector<int_> result(12, context); + BOOST_CHECK_EQUAL(result.size(), size_t(12)); + + // inclusive scan + bc::inclusive_scan(vector.begin(), vector.end(), result.begin(), queue); + CHECK_RANGE_EQUAL(int_, 12, result, (0, 1, 3, 6, 10, 15, 21, 28, 36, 45, 55, 66)); + + // in-place inclusive scan + CHECK_RANGE_EQUAL(int_, 12, vector, (0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11)); + bc::inclusive_scan(vector.begin(), vector.end(), vector.begin(), queue); + CHECK_RANGE_EQUAL(int_, 12, vector, (0, 1, 3, 6, 10, 15, 21, 28, 36, 45, 55, 66)); + + // scan_on_cpu + + bc::copy(data, data + 12, vector.begin(), queue); + + // make sure parallel scan_on_cpu is used, no serial_scan + std::string cache_key = + "__boost_scan_cpu_4"; + boost::shared_ptr<bc::detail::parameter_cache> parameters = + bc::detail::parameter_cache::get_global_cache(device); + + // save + uint_ map_copy_threshold = + parameters->get(cache_key, "serial_scan_threshold", 0); + // force parallel scan_on_cpu + parameters->set(cache_key, "serial_scan_threshold", 0); + + // inclusive scan + bc::inclusive_scan(vector.begin(), vector.end(), result.begin(), queue); + CHECK_RANGE_EQUAL(int_, 12, result, (0, 1, 3, 6, 10, 15, 21, 28, 36, 45, 55, 66)); + + // in-place inclusive scan + CHECK_RANGE_EQUAL(int_, 12, vector, (0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11)); + bc::inclusive_scan(vector.begin(), vector.end(), vector.begin(), queue); + CHECK_RANGE_EQUAL(int_, 12, vector, (0, 1, 3, 6, 10, 15, 21, 28, 36, 45, 55, 66)); + + // restore + parameters->set(cache_key, "serial_scan_threshold", map_copy_threshold); +} + +BOOST_AUTO_TEST_CASE(exclusive_scan_int) +{ + using boost::compute::uint_; + using boost::compute::int_; + + int_ data[] = { 0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11 }; + bc::vector<int_> vector(data, data + 12, queue); + BOOST_CHECK_EQUAL(vector.size(), size_t(12)); + + bc::vector<int_> result(size_t(12), int_(0), queue); + BOOST_CHECK_EQUAL(result.size(), size_t(12)); + + // exclusive scan + bc::exclusive_scan(vector.begin(), vector.end(), result.begin(), queue); + CHECK_RANGE_EQUAL(int_, 12, result, (0, 0, 1, 3, 6, 10, 15, 21, 28, 36, 45, 55)); + + // in-place exclusive scan + CHECK_RANGE_EQUAL(int_, 12, vector, (0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11)); + bc::exclusive_scan(vector.begin(), vector.end(), vector.begin(), queue); + CHECK_RANGE_EQUAL(int_, 12, vector, (0, 0, 1, 3, 6, 10, 15, 21, 28, 36, 45, 55)); + + // scan_on_cpu + bc::copy(data, data + 12, vector.begin(), queue); + + // make sure parallel scan_on_cpu is used, no serial_scan + std::string cache_key = + "__boost_scan_cpu_4"; + boost::shared_ptr<bc::detail::parameter_cache> parameters = + bc::detail::parameter_cache::get_global_cache(device); + + // save + uint_ map_copy_threshold = + parameters->get(cache_key, "serial_scan_threshold", 0); + // force parallel scan_on_cpu + parameters->set(cache_key, "serial_scan_threshold", 0); + + // exclusive scan + bc::exclusive_scan(vector.begin(), vector.end(), result.begin(), queue); + CHECK_RANGE_EQUAL(int_, 12, result, (0, 0, 1, 3, 6, 10, 15, 21, 28, 36, 45, 55)); + + // in-place exclusive scan + CHECK_RANGE_EQUAL(int_, 12, vector, (0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11)); + bc::exclusive_scan(vector.begin(), vector.end(), vector.begin(), queue); + CHECK_RANGE_EQUAL(int_, 12, vector, (0, 0, 1, 3, 6, 10, 15, 21, 28, 36, 45, 55)); + + // restore + parameters->set(cache_key, "serial_scan_threshold", map_copy_threshold); +} + +BOOST_AUTO_TEST_CASE(inclusive_scan_int2) +{ + using boost::compute::int_; + using boost::compute::uint_; + using boost::compute::int2_; + + int_ data[] = { 1, 2, + 3, 4, + 5, 6, + 7, 8, + 9, 0 }; + + boost::compute::vector<int2_> input(reinterpret_cast<int2_*>(data), + reinterpret_cast<int2_*>(data) + 5, + queue); + BOOST_CHECK_EQUAL(input.size(), size_t(5)); + + boost::compute::vector<int2_> output(5, context); + boost::compute::inclusive_scan(input.begin(), input.end(), output.begin(), + queue); + CHECK_RANGE_EQUAL( + int2_, 5, output, + (int2_(1, 2), int2_(4, 6), int2_(9, 12), int2_(16, 20), int2_(25, 20)) + ); + + // scan_on_cpu + + // make sure parallel scan_on_cpu is used, no serial_scan + std::string cache_key = + "__boost_scan_cpu_8"; + boost::shared_ptr<bc::detail::parameter_cache> parameters = + bc::detail::parameter_cache::get_global_cache(device); + + // save + uint_ map_copy_threshold = + parameters->get(cache_key, "serial_scan_threshold", 0); + // force parallel scan_on_cpu + parameters->set(cache_key, "serial_scan_threshold", 0); + + boost::compute::inclusive_scan(input.begin(), input.end(), output.begin(), + queue); + CHECK_RANGE_EQUAL( + int2_, 5, output, + (int2_(1, 2), int2_(4, 6), int2_(9, 12), int2_(16, 20), int2_(25, 20)) + ); + + // restore + parameters->set(cache_key, "serial_scan_threshold", map_copy_threshold); +} + +BOOST_AUTO_TEST_CASE(inclusive_scan_counting_iterator) +{ + using boost::compute::int_; + using boost::compute::uint_; + + bc::vector<int_> result(10, context); + bc::inclusive_scan(bc::make_counting_iterator(1), + bc::make_counting_iterator(11), + result.begin(), queue); + CHECK_RANGE_EQUAL(int_, 10, result, (1, 3, 6, 10, 15, 21, 28, 36, 45, 55)); + + // scan_on_cpu + + // make sure parallel scan_on_cpu is used, no serial_scan + std::string cache_key = + "__boost_scan_cpu_4"; + boost::shared_ptr<bc::detail::parameter_cache> parameters = + bc::detail::parameter_cache::get_global_cache(device); + + // save + uint_ map_copy_threshold = + parameters->get(cache_key, "serial_scan_threshold", 0); + // force parallel scan_on_cpu + parameters->set(cache_key, "serial_scan_threshold", 0); + + bc::inclusive_scan(bc::make_counting_iterator(1), + bc::make_counting_iterator(11), + result.begin(), queue); + CHECK_RANGE_EQUAL(int_, 10, result, (1, 3, 6, 10, 15, 21, 28, 36, 45, 55)); + + // restore + parameters->set(cache_key, "serial_scan_threshold", map_copy_threshold); +} + +BOOST_AUTO_TEST_CASE(exclusive_scan_counting_iterator) +{ + using boost::compute::int_; + using boost::compute::uint_; + + bc::vector<int_> result(10, context); + bc::exclusive_scan(bc::make_counting_iterator(1), + bc::make_counting_iterator(11), + result.begin(), queue); + CHECK_RANGE_EQUAL(int_, 10, result, (0, 1, 3, 6, 10, 15, 21, 28, 36, 45)); + + // scan_on_cpu + + // make sure parallel scan_on_cpu is used, no serial_scan + std::string cache_key = + "__boost_scan_cpu_4"; + boost::shared_ptr<bc::detail::parameter_cache> parameters = + bc::detail::parameter_cache::get_global_cache(device); + + // save + uint_ map_copy_threshold = + parameters->get(cache_key, "serial_scan_threshold", 0); + // force parallel scan_on_cpu + parameters->set(cache_key, "serial_scan_threshold", 0); + + bc::exclusive_scan(bc::make_counting_iterator(1), + bc::make_counting_iterator(11), + result.begin(), queue); + CHECK_RANGE_EQUAL(int_, 10, result, (0, 1, 3, 6, 10, 15, 21, 28, 36, 45)); + + // restore + parameters->set(cache_key, "serial_scan_threshold", map_copy_threshold); +} + +BOOST_AUTO_TEST_CASE(inclusive_scan_transform_iterator) +{ + float data[] = { 1.0f, 2.0f, 3.0f, 4.0f, 5.0f }; + bc::vector<float> input(data, data + 5, queue); + bc::vector<float> output(5, context); + + // normal inclusive scan of the input + bc::inclusive_scan(input.begin(), input.end(), output.begin(), queue); + queue.finish(); + BOOST_CHECK_CLOSE(float(output[0]), 1.0f, 1e-4f); + BOOST_CHECK_CLOSE(float(output[1]), 3.0f, 1e-4f); + BOOST_CHECK_CLOSE(float(output[2]), 6.0f, 1e-4f); + BOOST_CHECK_CLOSE(float(output[3]), 10.0f, 1e-4f); + BOOST_CHECK_CLOSE(float(output[4]), 15.0f, 1e-4f); + + // inclusive scan of squares of the input + using ::boost::compute::_1; + + bc::inclusive_scan(bc::make_transform_iterator(input.begin(), pown(_1, 2)), + bc::make_transform_iterator(input.end(), pown(_1, 2)), + output.begin(), queue); + queue.finish(); + BOOST_CHECK_CLOSE(float(output[0]), 1.0f, 1e-4f); + BOOST_CHECK_CLOSE(float(output[1]), 5.0f, 1e-4f); + BOOST_CHECK_CLOSE(float(output[2]), 14.0f, 1e-4f); + BOOST_CHECK_CLOSE(float(output[3]), 30.0f, 1e-4f); + BOOST_CHECK_CLOSE(float(output[4]), 55.0f, 1e-4f); +} + +BOOST_AUTO_TEST_CASE(inclusive_scan_doctest) +{ +//! [inclusive_scan_int] +// setup input +int data[] = { 1, 2, 3, 4 }; +boost::compute::vector<int> input(data, data + 4, queue); + +// setup output +boost::compute::vector<int> output(4, context); + +// scan values +boost::compute::inclusive_scan( + input.begin(), input.end(), output.begin(), queue +); + +// output = [ 1, 3, 6, 10 ] +//! [inclusive_scan_int] + + CHECK_RANGE_EQUAL(int, 4, output, (1, 3, 6, 10)); +} + +BOOST_AUTO_TEST_CASE(exclusive_scan_doctest) +{ +//! [exclusive_scan_int] +// setup input +int data[] = { 1, 2, 3, 4 }; +boost::compute::vector<int> input(data, data + 4, queue); + +// setup output +boost::compute::vector<int> output(4, context); + +// scan values +boost::compute::exclusive_scan( + input.begin(), input.end(), output.begin(), queue +); + +// output = [ 0, 1, 3, 6 ] +//! [exclusive_scan_int] + + CHECK_RANGE_EQUAL(int, 4, output, (0, 1, 3, 6)); +} + +BOOST_AUTO_TEST_CASE(inclusive_scan_int_multiplies) +{ +//! [inclusive_scan_int_multiplies] +// setup input +int data[] = { 1, 2, 1, 2, 3 }; +boost::compute::vector<int> input(data, data + 5, queue); + +// setup output +boost::compute::vector<int> output(5, context); + +// inclusive scan with multiplication +boost::compute::inclusive_scan( + input.begin(), input.end(), output.begin(), + boost::compute::multiplies<int>(), queue +); + +// output = [1, 2, 2, 4, 12] +//! [inclusive_scan_int_multiplies] + + BOOST_CHECK_EQUAL(input.size(), size_t(5)); + BOOST_CHECK_EQUAL(output.size(), size_t(5)); + + CHECK_RANGE_EQUAL(int, 5, output, (1, 2, 2, 4, 12)); + + // in-place inclusive scan + CHECK_RANGE_EQUAL(int, 5, input, (1, 2, 1, 2, 3)); + boost::compute::inclusive_scan(input.begin(), input.end(), input.begin(), + boost::compute::multiplies<int>(), queue); + CHECK_RANGE_EQUAL(int, 5, input, (1, 2, 2, 4, 12)); +} + +BOOST_AUTO_TEST_CASE(exclusive_scan_int_multiplies) +{ +//! [exclusive_scan_int_multiplies] +// setup input +int data[] = { 1, 2, 1, 2, 3 }; +boost::compute::vector<int> input(data, data + 5, queue); + +// setup output +boost::compute::vector<int> output(5, context); + +// exclusive_scan with multiplication +// initial value equals 10 +boost::compute::exclusive_scan( + input.begin(), input.end(), output.begin(), + int(10), boost::compute::multiplies<int>(), queue +); + +// output = [10, 10, 20, 20, 40] +//! [exclusive_scan_int_multiplies] + + BOOST_CHECK_EQUAL(input.size(), size_t(5)); + BOOST_CHECK_EQUAL(output.size(), size_t(5)); + + CHECK_RANGE_EQUAL(int, 5, output, (10, 10, 20, 20, 40)); + + // in-place exclusive scan + CHECK_RANGE_EQUAL(int, 5, input, (1, 2, 1, 2, 3)); + bc::exclusive_scan(input.begin(), input.end(), input.begin(), + int(10), bc::multiplies<int>(), queue); + CHECK_RANGE_EQUAL(int, 5, input, (10, 10, 20, 20, 40)); +} + +BOOST_AUTO_TEST_CASE(inclusive_scan_int_multiplies_long_vector) +{ + size_t size = 1000; + bc::vector<int> device_vector(size, int(2), queue); + BOOST_CHECK_EQUAL(device_vector.size(), size); + bc::inclusive_scan(device_vector.begin(), device_vector.end(), + device_vector.begin(), bc::multiplies<int>(), queue); + + std::vector<int> host_vector(size, 2); + BOOST_CHECK_EQUAL(host_vector.size(), size); + bc::copy(device_vector.begin(), device_vector.end(), + host_vector.begin(), queue); + + std::vector<int> test(size, 2); + BOOST_CHECK_EQUAL(test.size(), size); + std::partial_sum(test.begin(), test.end(), + test.begin(), std::multiplies<int>()); + + BOOST_CHECK_EQUAL_COLLECTIONS(host_vector.begin(), host_vector.end(), + test.begin(), test.end()); +} + +BOOST_AUTO_TEST_CASE(exclusive_scan_int_multiplies_long_vector) +{ + size_t size = 1000; + bc::vector<int> device_vector(size, int(2), queue); + BOOST_CHECK_EQUAL(device_vector.size(), size); + bc::exclusive_scan(device_vector.begin(), device_vector.end(), + device_vector.begin(), int(10), bc::multiplies<int>(), + queue); + + std::vector<int> host_vector(size, 2); + BOOST_CHECK_EQUAL(host_vector.size(), size); + bc::copy(device_vector.begin(), device_vector.end(), + host_vector.begin(), queue); + + std::vector<int> test(size, 2); + BOOST_CHECK_EQUAL(test.size(), size); + test[0] = 10; + std::partial_sum(test.begin(), test.end(), + test.begin(), std::multiplies<int>()); + + BOOST_CHECK_EQUAL_COLLECTIONS(host_vector.begin(), host_vector.end(), + test.begin(), test.end()); +} + +BOOST_AUTO_TEST_CASE(inclusive_scan_int_custom_function) +{ + BOOST_COMPUTE_FUNCTION(int, multi, (int x, int y), + { + return x * y * 2; + }); + + int data[] = { 1, 2, 1, 2, 3 }; + bc::vector<int> vector(data, data + 5, queue); + BOOST_CHECK_EQUAL(vector.size(), size_t(5)); + + bc::vector<int> result(5, context); + BOOST_CHECK_EQUAL(result.size(), size_t(5)); + + // inclusive scan + bc::inclusive_scan(vector.begin(), vector.end(), result.begin(), + multi, queue); + CHECK_RANGE_EQUAL(int, 5, result, (1, 4, 8, 32, 192)); + + // in-place inclusive scan + CHECK_RANGE_EQUAL(int, 5, vector, (1, 2, 1, 2, 3)); + bc::inclusive_scan(vector.begin(), vector.end(), vector.begin(), + multi, queue); + CHECK_RANGE_EQUAL(int, 5, vector, (1, 4, 8, 32, 192)); +} + +BOOST_AUTO_TEST_CASE(exclusive_scan_int_custom_function) +{ + BOOST_COMPUTE_FUNCTION(int, multi, (int x, int y), + { + return x * y * 2; + }); + + int data[] = { 1, 2, 1, 2, 3 }; + bc::vector<int> vector(data, data + 5, queue); + BOOST_CHECK_EQUAL(vector.size(), size_t(5)); + + bc::vector<int> result(5, context); + BOOST_CHECK_EQUAL(result.size(), size_t(5)); + + // exclusive_scan + bc::exclusive_scan(vector.begin(), vector.end(), result.begin(), + int(1), multi, queue); + CHECK_RANGE_EQUAL(int, 5, result, (1, 2, 8, 16, 64)); + + // in-place exclusive scan + CHECK_RANGE_EQUAL(int, 5, vector, (1, 2, 1, 2, 3)); + bc::exclusive_scan(vector.begin(), vector.end(), vector.begin(), + int(1), multi, queue); + CHECK_RANGE_EQUAL(int, 5, vector, (1, 2, 8, 16, 64)); +} + +BOOST_AUTO_TEST_SUITE_END() |