summaryrefslogtreecommitdiffstats
path: root/src/boost/libs/compute/test/test_scan.cpp
diff options
context:
space:
mode:
Diffstat (limited to 'src/boost/libs/compute/test/test_scan.cpp')
-rw-r--r--src/boost/libs/compute/test/test_scan.cpp490
1 files changed, 490 insertions, 0 deletions
diff --git a/src/boost/libs/compute/test/test_scan.cpp b/src/boost/libs/compute/test/test_scan.cpp
new file mode 100644
index 00000000..1504ea06
--- /dev/null
+++ b/src/boost/libs/compute/test/test_scan.cpp
@@ -0,0 +1,490 @@
+//---------------------------------------------------------------------------//
+// Copyright (c) 2013 Kyle Lutz <kyle.r.lutz@gmail.com>
+//
+// Distributed under the Boost Software License, Version 1.0
+// See accompanying file LICENSE_1_0.txt or copy at
+// http://www.boost.org/LICENSE_1_0.txt
+//
+// See http://boostorg.github.com/compute for more information.
+//---------------------------------------------------------------------------//
+
+// Undefine BOOST_COMPUTE_USE_OFFLINE_CACHE because these tests modify cached
+// parameters of the scan algorithm and we do not want undesirable side
+// effects (such as the modified parameter values being saved).
+#ifdef BOOST_COMPUTE_USE_OFFLINE_CACHE
+ #undef BOOST_COMPUTE_USE_OFFLINE_CACHE
+#endif
+
+#define BOOST_TEST_MODULE TestScan
+#include <boost/test/unit_test.hpp>
+
+#include <numeric>
+#include <functional>
+#include <vector>
+
+#include <boost/compute/functional.hpp>
+#include <boost/compute/lambda.hpp>
+#include <boost/compute/system.hpp>
+#include <boost/compute/command_queue.hpp>
+#include <boost/compute/algorithm/copy.hpp>
+#include <boost/compute/algorithm/exclusive_scan.hpp>
+#include <boost/compute/algorithm/inclusive_scan.hpp>
+#include <boost/compute/container/vector.hpp>
+#include <boost/compute/iterator/counting_iterator.hpp>
+#include <boost/compute/iterator/transform_iterator.hpp>
+
+#include "check_macros.hpp"
+#include "context_setup.hpp"
+
+namespace bc = boost::compute;
+
+// Inclusive scan (default operator) over twelve int_ values, both into a
+// separate buffer and in place. The checks run twice: once with the scan
+// parameters untouched and once with "serial_scan_threshold" set to 0.
+BOOST_AUTO_TEST_CASE(inclusive_scan_int)
+{
+    using bc::int_;
+    using bc::uint_;
+
+    int_ host_values[] = { 0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11 };
+    bc::vector<int_> vector(host_values, host_values + 12, queue);
+    BOOST_CHECK_EQUAL(vector.size(), size_t(12));
+
+    bc::vector<int_> result(12, context);
+    BOOST_CHECK_EQUAL(result.size(), size_t(12));
+
+    // pass 1: scan into the separate result buffer
+    bc::inclusive_scan(vector.begin(), vector.end(), result.begin(), queue);
+    CHECK_RANGE_EQUAL(int_, 12, result, (0, 1, 3, 6, 10, 15, 21, 28, 36, 45, 55, 66));
+
+    // pass 1: scan over the input itself (input is verified unchanged first)
+    CHECK_RANGE_EQUAL(int_, 12, vector, (0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11));
+    bc::inclusive_scan(vector.begin(), vector.end(), vector.begin(), queue);
+    CHECK_RANGE_EQUAL(int_, 12, vector, (0, 1, 3, 6, 10, 15, 21, 28, 36, 45, 55, 66));
+
+    // pass 2 (scan_on_cpu): reload the original input before repeating
+    bc::copy(host_values, host_values + 12, vector.begin(), queue);
+
+    // A threshold of 0 is meant to select the parallel scan_on_cpu code
+    // rather than serial_scan.
+    const std::string scan_key("__boost_scan_cpu_4");
+    boost::shared_ptr<bc::detail::parameter_cache> cache =
+        bc::detail::parameter_cache::get_global_cache(device);
+
+    // Remember the current threshold so it can be put back afterwards.
+    // NOTE(review): get() is given 0 as its last argument (presumably the
+    // fallback when nothing is cached); in that case the restore below
+    // stores 0 as well -- confirm this is intended.
+    const uint_ saved_threshold =
+        cache->get(scan_key, "serial_scan_threshold", 0);
+    cache->set(scan_key, "serial_scan_threshold", 0);
+
+    // pass 2: scan into the separate result buffer
+    bc::inclusive_scan(vector.begin(), vector.end(), result.begin(), queue);
+    CHECK_RANGE_EQUAL(int_, 12, result, (0, 1, 3, 6, 10, 15, 21, 28, 36, 45, 55, 66));
+
+    // pass 2: scan over the input itself
+    CHECK_RANGE_EQUAL(int_, 12, vector, (0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11));
+    bc::inclusive_scan(vector.begin(), vector.end(), vector.begin(), queue);
+    CHECK_RANGE_EQUAL(int_, 12, vector, (0, 1, 3, 6, 10, 15, 21, 28, 36, 45, 55, 66));
+
+    // put the remembered threshold back
+    cache->set(scan_key, "serial_scan_threshold", saved_threshold);
+}
+
+// Exclusive scan (default operator and initial value) over twelve int_
+// values, both into a separate buffer and in place. The checks run twice:
+// once with the scan parameters untouched and once with
+// "serial_scan_threshold" set to 0.
+BOOST_AUTO_TEST_CASE(exclusive_scan_int)
+{
+    using bc::int_;
+    using bc::uint_;
+
+    int_ host_values[] = { 0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11 };
+    bc::vector<int_> vector(host_values, host_values + 12, queue);
+    BOOST_CHECK_EQUAL(vector.size(), size_t(12));
+
+    // result buffer starts out filled with zeros
+    bc::vector<int_> result(size_t(12), int_(0), queue);
+    BOOST_CHECK_EQUAL(result.size(), size_t(12));
+
+    // pass 1: scan into the separate result buffer
+    bc::exclusive_scan(vector.begin(), vector.end(), result.begin(), queue);
+    CHECK_RANGE_EQUAL(int_, 12, result, (0, 0, 1, 3, 6, 10, 15, 21, 28, 36, 45, 55));
+
+    // pass 1: scan over the input itself (input is verified unchanged first)
+    CHECK_RANGE_EQUAL(int_, 12, vector, (0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11));
+    bc::exclusive_scan(vector.begin(), vector.end(), vector.begin(), queue);
+    CHECK_RANGE_EQUAL(int_, 12, vector, (0, 0, 1, 3, 6, 10, 15, 21, 28, 36, 45, 55));
+
+    // pass 2 (scan_on_cpu): reload the original input before repeating
+    bc::copy(host_values, host_values + 12, vector.begin(), queue);
+
+    // A threshold of 0 is meant to select the parallel scan_on_cpu code
+    // rather than serial_scan.
+    const std::string scan_key("__boost_scan_cpu_4");
+    boost::shared_ptr<bc::detail::parameter_cache> cache =
+        bc::detail::parameter_cache::get_global_cache(device);
+
+    // Remember the current threshold so it can be put back afterwards.
+    // NOTE(review): get() is given 0 as its last argument (presumably the
+    // fallback when nothing is cached); in that case the restore below
+    // stores 0 as well -- confirm this is intended.
+    const uint_ saved_threshold =
+        cache->get(scan_key, "serial_scan_threshold", 0);
+    cache->set(scan_key, "serial_scan_threshold", 0);
+
+    // pass 2: scan into the separate result buffer
+    bc::exclusive_scan(vector.begin(), vector.end(), result.begin(), queue);
+    CHECK_RANGE_EQUAL(int_, 12, result, (0, 0, 1, 3, 6, 10, 15, 21, 28, 36, 45, 55));
+
+    // pass 2: scan over the input itself
+    CHECK_RANGE_EQUAL(int_, 12, vector, (0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11));
+    bc::exclusive_scan(vector.begin(), vector.end(), vector.begin(), queue);
+    CHECK_RANGE_EQUAL(int_, 12, vector, (0, 0, 1, 3, 6, 10, 15, 21, 28, 36, 45, 55));
+
+    // put the remembered threshold back
+    cache->set(scan_key, "serial_scan_threshold", saved_threshold);
+}
+
+// Inclusive scan over five int2_ elements; each component is summed
+// independently. Checked once with the scan parameters untouched and once
+// with "serial_scan_threshold" set to 0.
+BOOST_AUTO_TEST_CASE(inclusive_scan_int2)
+{
+    using bc::int_;
+    using bc::uint_;
+    using bc::int2_;
+
+    // ten scalars laid out as five (x, y) pairs
+    int_ components[] = { 1, 2,
+                          3, 4,
+                          5, 6,
+                          7, 8,
+                          9, 0 };
+
+    // the scalar array is reinterpreted as int2_ elements for the upload
+    int2_ *first_pair = reinterpret_cast<int2_*>(components);
+    bc::vector<int2_> input(first_pair, first_pair + 5, queue);
+    BOOST_CHECK_EQUAL(input.size(), size_t(5));
+
+    bc::vector<int2_> output(5, context);
+    bc::inclusive_scan(input.begin(), input.end(), output.begin(), queue);
+    CHECK_RANGE_EQUAL(
+        int2_, 5, output,
+        (int2_(1, 2), int2_(4, 6), int2_(9, 12), int2_(16, 20), int2_(25, 20))
+    );
+
+    // second pass (scan_on_cpu): a threshold of 0 is meant to select the
+    // parallel scan_on_cpu code rather than serial_scan
+    const std::string scan_key("__boost_scan_cpu_8");
+    boost::shared_ptr<bc::detail::parameter_cache> cache =
+        bc::detail::parameter_cache::get_global_cache(device);
+
+    // Remember the current threshold so it can be put back afterwards.
+    // NOTE(review): get() is given 0 as its last argument (presumably the
+    // fallback when nothing is cached); in that case the restore below
+    // stores 0 as well -- confirm this is intended.
+    const uint_ saved_threshold =
+        cache->get(scan_key, "serial_scan_threshold", 0);
+    cache->set(scan_key, "serial_scan_threshold", 0);
+
+    bc::inclusive_scan(input.begin(), input.end(), output.begin(), queue);
+    CHECK_RANGE_EQUAL(
+        int2_, 5, output,
+        (int2_(1, 2), int2_(4, 6), int2_(9, 12), int2_(16, 20), int2_(25, 20))
+    );
+
+    // put the remembered threshold back
+    cache->set(scan_key, "serial_scan_threshold", saved_threshold);
+}
+
+// Inclusive scan whose input is the counting-iterator range [1, 11) instead
+// of a device vector. Checked once with the scan parameters untouched and
+// once with "serial_scan_threshold" set to 0.
+BOOST_AUTO_TEST_CASE(inclusive_scan_counting_iterator)
+{
+    using bc::int_;
+    using bc::uint_;
+
+    // the same iterator pair feeds both scans below
+    bc::counting_iterator<int> first = bc::make_counting_iterator(1);
+    bc::counting_iterator<int> last = bc::make_counting_iterator(11);
+
+    bc::vector<int_> result(10, context);
+    bc::inclusive_scan(first, last, result.begin(), queue);
+    CHECK_RANGE_EQUAL(int_, 10, result, (1, 3, 6, 10, 15, 21, 28, 36, 45, 55));
+
+    // second pass (scan_on_cpu): a threshold of 0 is meant to select the
+    // parallel scan_on_cpu code rather than serial_scan
+    const std::string scan_key("__boost_scan_cpu_4");
+    boost::shared_ptr<bc::detail::parameter_cache> cache =
+        bc::detail::parameter_cache::get_global_cache(device);
+
+    // Remember the current threshold so it can be put back afterwards.
+    // NOTE(review): get() is given 0 as its last argument (presumably the
+    // fallback when nothing is cached); in that case the restore below
+    // stores 0 as well -- confirm this is intended.
+    const uint_ saved_threshold =
+        cache->get(scan_key, "serial_scan_threshold", 0);
+    cache->set(scan_key, "serial_scan_threshold", 0);
+
+    bc::inclusive_scan(first, last, result.begin(), queue);
+    CHECK_RANGE_EQUAL(int_, 10, result, (1, 3, 6, 10, 15, 21, 28, 36, 45, 55));
+
+    // put the remembered threshold back
+    cache->set(scan_key, "serial_scan_threshold", saved_threshold);
+}
+
+// Exclusive scan whose input is the counting-iterator range [1, 11) instead
+// of a device vector. Checked once with the scan parameters untouched and
+// once with "serial_scan_threshold" set to 0.
+BOOST_AUTO_TEST_CASE(exclusive_scan_counting_iterator)
+{
+    using bc::int_;
+    using bc::uint_;
+
+    // the same iterator pair feeds both scans below
+    bc::counting_iterator<int> first = bc::make_counting_iterator(1);
+    bc::counting_iterator<int> last = bc::make_counting_iterator(11);
+
+    bc::vector<int_> result(10, context);
+    bc::exclusive_scan(first, last, result.begin(), queue);
+    CHECK_RANGE_EQUAL(int_, 10, result, (0, 1, 3, 6, 10, 15, 21, 28, 36, 45));
+
+    // second pass (scan_on_cpu): a threshold of 0 is meant to select the
+    // parallel scan_on_cpu code rather than serial_scan
+    const std::string scan_key("__boost_scan_cpu_4");
+    boost::shared_ptr<bc::detail::parameter_cache> cache =
+        bc::detail::parameter_cache::get_global_cache(device);
+
+    // Remember the current threshold so it can be put back afterwards.
+    // NOTE(review): get() is given 0 as its last argument (presumably the
+    // fallback when nothing is cached); in that case the restore below
+    // stores 0 as well -- confirm this is intended.
+    const uint_ saved_threshold =
+        cache->get(scan_key, "serial_scan_threshold", 0);
+    cache->set(scan_key, "serial_scan_threshold", 0);
+
+    bc::exclusive_scan(first, last, result.begin(), queue);
+    CHECK_RANGE_EQUAL(int_, 10, result, (0, 1, 3, 6, 10, 15, 21, 28, 36, 45));
+
+    // put the remembered threshold back
+    cache->set(scan_key, "serial_scan_threshold", saved_threshold);
+}
+
+// Inclusive scan of five floats, first directly and then through a
+// transform iterator that applies pown(_1, 2) to each element on the fly.
+BOOST_AUTO_TEST_CASE(inclusive_scan_transform_iterator)
+{
+    // lambda placeholder used by the transform-iterator scan further down
+    using ::boost::compute::_1;
+
+    float host_values[] = { 1.0f, 2.0f, 3.0f, 4.0f, 5.0f };
+    bc::vector<float> input(host_values, host_values + 5, queue);
+    bc::vector<float> output(5, context);
+
+    // plain running sum: 1, 3, 6, 10, 15
+    bc::inclusive_scan(input.begin(), input.end(), output.begin(), queue);
+    queue.finish();
+    BOOST_CHECK_CLOSE(float(output[0]), 1.0f, 1e-4f);
+    BOOST_CHECK_CLOSE(float(output[1]), 3.0f, 1e-4f);
+    BOOST_CHECK_CLOSE(float(output[2]), 6.0f, 1e-4f);
+    BOOST_CHECK_CLOSE(float(output[3]), 10.0f, 1e-4f);
+    BOOST_CHECK_CLOSE(float(output[4]), 15.0f, 1e-4f);
+
+    // running sum of the squared inputs: 1, 5, 14, 30, 55
+    bc::inclusive_scan(
+        bc::make_transform_iterator(input.begin(), pown(_1, 2)),
+        bc::make_transform_iterator(input.end(), pown(_1, 2)),
+        output.begin(),
+        queue
+    );
+    queue.finish();
+    BOOST_CHECK_CLOSE(float(output[0]), 1.0f, 1e-4f);
+    BOOST_CHECK_CLOSE(float(output[1]), 5.0f, 1e-4f);
+    BOOST_CHECK_CLOSE(float(output[2]), 14.0f, 1e-4f);
+    BOOST_CHECK_CLOSE(float(output[3]), 30.0f, 1e-4f);
+    BOOST_CHECK_CLOSE(float(output[4]), 55.0f, 1e-4f);
+}
+
+// Runs the inclusive_scan usage example and checks the result it advertises.
+// The lines between the two "//! [inclusive_scan_int]" markers look like a
+// documentation snippet region (presumably extracted into the library docs
+// -- confirm), which is why that region is kept free of test macros.
+BOOST_AUTO_TEST_CASE(inclusive_scan_doctest)
+{
+//! [inclusive_scan_int]
+// setup input
+int data[] = { 1, 2, 3, 4 };
+boost::compute::vector<int> input(data, data + 4, queue);
+
+// setup output
+boost::compute::vector<int> output(4, context);
+
+// scan values
+boost::compute::inclusive_scan(
+ input.begin(), input.end(), output.begin(), queue
+);
+
+// output = [ 1, 3, 6, 10 ]
+//! [inclusive_scan_int]
+
+ // verify the values stated in the snippet's "output = ..." comment
+ CHECK_RANGE_EQUAL(int, 4, output, (1, 3, 6, 10));
+}
+
+// Runs the exclusive_scan usage example and checks the result it advertises.
+// The lines between the two "//! [exclusive_scan_int]" markers look like a
+// documentation snippet region (presumably extracted into the library docs
+// -- confirm), which is why that region is kept free of test macros.
+BOOST_AUTO_TEST_CASE(exclusive_scan_doctest)
+{
+//! [exclusive_scan_int]
+// setup input
+int data[] = { 1, 2, 3, 4 };
+boost::compute::vector<int> input(data, data + 4, queue);
+
+// setup output
+boost::compute::vector<int> output(4, context);
+
+// scan values
+boost::compute::exclusive_scan(
+ input.begin(), input.end(), output.begin(), queue
+);
+
+// output = [ 0, 1, 3, 6 ]
+//! [exclusive_scan_int]
+
+ // verify the values stated in the snippet's "output = ..." comment
+ CHECK_RANGE_EQUAL(int, 4, output, (0, 1, 3, 6));
+}
+
+// Inclusive scan with multiplies<int> as the binary operator (running
+// product), first via the documentation example and then in place.
+// The lines between the "//! [inclusive_scan_int_multiplies]" markers look
+// like a documentation snippet region (presumably extracted into the
+// library docs -- confirm), so the test macros are placed after it.
+BOOST_AUTO_TEST_CASE(inclusive_scan_int_multiplies)
+{
+//! [inclusive_scan_int_multiplies]
+// setup input
+int data[] = { 1, 2, 1, 2, 3 };
+boost::compute::vector<int> input(data, data + 5, queue);
+
+// setup output
+boost::compute::vector<int> output(5, context);
+
+// inclusive scan with multiplication
+boost::compute::inclusive_scan(
+ input.begin(), input.end(), output.begin(),
+ boost::compute::multiplies<int>(), queue
+);
+
+// output = [1, 2, 2, 4, 12]
+//! [inclusive_scan_int_multiplies]
+
+ // sanity-check the container sizes set up inside the snippet
+ BOOST_CHECK_EQUAL(input.size(), size_t(5));
+ BOOST_CHECK_EQUAL(output.size(), size_t(5));
+
+ // running products: 1, 1*2, 2*1, 2*2, 4*3
+ CHECK_RANGE_EQUAL(int, 5, output, (1, 2, 2, 4, 12));
+
+ // in-place inclusive scan
+ // (the input is first confirmed to be untouched by the scan above)
+ CHECK_RANGE_EQUAL(int, 5, input, (1, 2, 1, 2, 3));
+ boost::compute::inclusive_scan(input.begin(), input.end(), input.begin(),
+ boost::compute::multiplies<int>(), queue);
+ CHECK_RANGE_EQUAL(int, 5, input, (1, 2, 2, 4, 12));
+}
+
+// Exclusive scan with an explicit initial value (10) and multiplies<int> as
+// the binary operator, first via the documentation example and then in place.
+// The lines between the "//! [exclusive_scan_int_multiplies]" markers look
+// like a documentation snippet region (presumably extracted into the
+// library docs -- confirm), so the test macros are placed after it.
+BOOST_AUTO_TEST_CASE(exclusive_scan_int_multiplies)
+{
+//! [exclusive_scan_int_multiplies]
+// setup input
+int data[] = { 1, 2, 1, 2, 3 };
+boost::compute::vector<int> input(data, data + 5, queue);
+
+// setup output
+boost::compute::vector<int> output(5, context);
+
+// exclusive_scan with multiplication
+// initial value equals 10
+boost::compute::exclusive_scan(
+ input.begin(), input.end(), output.begin(),
+ int(10), boost::compute::multiplies<int>(), queue
+);
+
+// output = [10, 10, 20, 20, 40]
+//! [exclusive_scan_int_multiplies]
+
+ // sanity-check the container sizes set up inside the snippet
+ BOOST_CHECK_EQUAL(input.size(), size_t(5));
+ BOOST_CHECK_EQUAL(output.size(), size_t(5));
+
+ // expected: 10, 10*1, 10*2, 20*1, 20*2 (the last input, 3, is not used)
+ CHECK_RANGE_EQUAL(int, 5, output, (10, 10, 20, 20, 40));
+
+ // in-place exclusive scan
+ // (the input is first confirmed to be untouched by the scan above)
+ CHECK_RANGE_EQUAL(int, 5, input, (1, 2, 1, 2, 3));
+ bc::exclusive_scan(input.begin(), input.end(), input.begin(),
+ int(10), bc::multiplies<int>(), queue);
+ CHECK_RANGE_EQUAL(int, 5, input, (10, 10, 20, 20, 40));
+}
+
+// In-place inclusive multiplies-scan over 1000 elements that are all 2,
+// compared element by element against a reference computed on the host.
+BOOST_AUTO_TEST_CASE(inclusive_scan_int_multiplies_long_vector)
+{
+    size_t size = 1000;
+    bc::vector<int> device_vector(size, int(2), queue);
+    BOOST_CHECK_EQUAL(device_vector.size(), size);
+    bc::inclusive_scan(device_vector.begin(), device_vector.end(),
+                       device_vector.begin(), bc::multiplies<int>(), queue);
+
+    // bring the device result back to the host for comparison
+    std::vector<int> host_vector(size, 2);
+    BOOST_CHECK_EQUAL(host_vector.size(), size);
+    bc::copy(device_vector.begin(), device_vector.end(),
+             host_vector.begin(), queue);
+
+    // The running product 2^k leaves the range of int long before the 1000th
+    // element, and signed overflow is undefined behaviour in C++. Build the
+    // reference in unsigned arithmetic, where wrap-around is well defined,
+    // and convert to int afterwards; this yields the wrapped values the
+    // comparison expects without invoking undefined behaviour on the host.
+    // NOTE(review): the device-side scan still multiplies int values past
+    // their range; the expectation assumes it wraps the same way -- confirm.
+    std::vector<unsigned int> wrapped(size, 2u);
+    std::partial_sum(wrapped.begin(), wrapped.end(),
+                     wrapped.begin(), std::multiplies<unsigned int>());
+    std::vector<int> test(wrapped.begin(), wrapped.end());
+    BOOST_CHECK_EQUAL(test.size(), size);
+
+    BOOST_CHECK_EQUAL_COLLECTIONS(host_vector.begin(), host_vector.end(),
+                                  test.begin(), test.end());
+}
+
+// In-place exclusive multiplies-scan (initial value 10) over 1000 elements
+// that are all 2, compared element by element against a host reference.
+BOOST_AUTO_TEST_CASE(exclusive_scan_int_multiplies_long_vector)
+{
+    size_t size = 1000;
+    bc::vector<int> device_vector(size, int(2), queue);
+    BOOST_CHECK_EQUAL(device_vector.size(), size);
+    bc::exclusive_scan(device_vector.begin(), device_vector.end(),
+                       device_vector.begin(), int(10), bc::multiplies<int>(),
+                       queue);
+
+    // bring the device result back to the host for comparison
+    std::vector<int> host_vector(size, 2);
+    BOOST_CHECK_EQUAL(host_vector.size(), size);
+    bc::copy(device_vector.begin(), device_vector.end(),
+             host_vector.begin(), queue);
+
+    // Reference: an inclusive product scan over {10, 2, 2, ...} equals the
+    // exclusive scan of all-2 input with initial value 10.
+    // The running product 10 * 2^k leaves the range of int long before the
+    // 1000th element, and signed overflow is undefined behaviour in C++.
+    // Build the reference in unsigned arithmetic, where wrap-around is well
+    // defined, and convert to int afterwards.
+    // NOTE(review): the device-side scan still multiplies int values past
+    // their range; the expectation assumes it wraps the same way -- confirm.
+    std::vector<unsigned int> wrapped(size, 2u);
+    wrapped[0] = 10u;
+    std::partial_sum(wrapped.begin(), wrapped.end(),
+                     wrapped.begin(), std::multiplies<unsigned int>());
+    std::vector<int> test(wrapped.begin(), wrapped.end());
+    BOOST_CHECK_EQUAL(test.size(), size);
+
+    BOOST_CHECK_EQUAL_COLLECTIONS(host_vector.begin(), host_vector.end(),
+                                  test.begin(), test.end());
+}
+
+// Inclusive scan driven by a user-defined binary function,
+// multi(x, y) = x * y * 2, both into a separate buffer and in place.
+BOOST_AUTO_TEST_CASE(inclusive_scan_int_custom_function)
+{
+    BOOST_COMPUTE_FUNCTION(int, multi, (int x, int y),
+    {
+        return x * y * 2;
+    });
+
+    int host_values[] = { 1, 2, 1, 2, 3 };
+    bc::vector<int> vector(host_values, host_values + 5, queue);
+    BOOST_CHECK_EQUAL(vector.size(), size_t(5));
+
+    bc::vector<int> result(5, context);
+    BOOST_CHECK_EQUAL(result.size(), size_t(5));
+
+    // separate output buffer; expected: 1, 1*2*2, 4*1*2, 8*2*2, 32*3*2
+    bc::inclusive_scan(
+        vector.begin(), vector.end(), result.begin(), multi, queue
+    );
+    CHECK_RANGE_EQUAL(int, 5, result, (1, 4, 8, 32, 192));
+
+    // output written over the input (input is verified unchanged first)
+    CHECK_RANGE_EQUAL(int, 5, vector, (1, 2, 1, 2, 3));
+    bc::inclusive_scan(
+        vector.begin(), vector.end(), vector.begin(), multi, queue
+    );
+    CHECK_RANGE_EQUAL(int, 5, vector, (1, 4, 8, 32, 192));
+}
+
+// Exclusive scan (initial value 1) driven by a user-defined binary function,
+// multi(x, y) = x * y * 2, both into a separate buffer and in place.
+BOOST_AUTO_TEST_CASE(exclusive_scan_int_custom_function)
+{
+    BOOST_COMPUTE_FUNCTION(int, multi, (int x, int y),
+    {
+        return x * y * 2;
+    });
+
+    int host_values[] = { 1, 2, 1, 2, 3 };
+    bc::vector<int> vector(host_values, host_values + 5, queue);
+    BOOST_CHECK_EQUAL(vector.size(), size_t(5));
+
+    bc::vector<int> result(5, context);
+    BOOST_CHECK_EQUAL(result.size(), size_t(5));
+
+    // separate output buffer; expected: 1, 1*1*2, 2*2*2, 8*1*2, 16*2*2
+    bc::exclusive_scan(
+        vector.begin(), vector.end(), result.begin(), int(1), multi, queue
+    );
+    CHECK_RANGE_EQUAL(int, 5, result, (1, 2, 8, 16, 64));
+
+    // output written over the input (input is verified unchanged first)
+    CHECK_RANGE_EQUAL(int, 5, vector, (1, 2, 1, 2, 3));
+    bc::exclusive_scan(
+        vector.begin(), vector.end(), vector.begin(), int(1), multi, queue
+    );
+    CHECK_RANGE_EQUAL(int, 5, vector, (1, 2, 8, 16, 64));
+}
+
+// Closes the enclosing test suite. No matching suite-opening macro is visible
+// in this file; presumably it is opened by "context_setup.hpp" -- confirm.
+BOOST_AUTO_TEST_SUITE_END()