123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374 |
- //---------------------------------------------------------------------------//
- // Copyright (c) 2016 Jakub Szuppe <j.szuppe@gmail.com>
- //
- // Distributed under the Boost Software License, Version 1.0
- // See accompanying file LICENSE_1_0.txt or copy at
- // http://www.boost.org/LICENSE_1_0.txt
- //
- // See http://boostorg.github.com/compute for more information.
- //---------------------------------------------------------------------------//
- #define BOOST_TEST_MODULE TestMergeSortOnGPU
- #include <boost/test/unit_test.hpp>
- #include <iostream>
- #include <boost/compute/system.hpp>
- #include <boost/compute/algorithm/is_sorted.hpp>
- #include <boost/compute/algorithm/detail/merge_sort_on_gpu.hpp>
- #include <boost/compute/container/vector.hpp>
- #include "quirks.hpp"
- #include "check_macros.hpp"
- #include "context_setup.hpp"
- namespace bc = boost::compute;
- BOOST_AUTO_TEST_CASE(sort_small_vector_char)
- {
- if(is_apple_cpu_device(device)) {
- std::cerr
- << "skipping all merge_sort_on_gpu tests due to Apple platform"
- << " behavior when local memory is used on a CPU device"
- << std::endl;
- return;
- }
- using boost::compute::char_;
- ::boost::compute::greater<char_> greater;
- ::boost::compute::less<char_> less;
- char_ data[] = { 'c', 'a', '0', '7', 'B', 'F', '\0', '$' };
- boost::compute::vector<char_> vector(data, data + 8, queue);
- BOOST_CHECK_EQUAL(vector.size(), size_t(8));
- BOOST_CHECK(boost::compute::is_sorted(vector.begin(), vector.end(), queue) == false);
- // <
- boost::compute::detail::merge_sort_on_gpu(
- vector.begin(), vector.end(), less, queue
- );
- BOOST_CHECK(
- boost::compute::is_sorted(vector.begin(), vector.end(), less, queue)
- );
- CHECK_RANGE_EQUAL(char_, 8, vector, ('\0', '$', '0', '7', 'B', 'F', 'a', 'c'));
- // >
- boost::compute::detail::merge_sort_on_gpu(
- vector.begin(), vector.end(), greater, queue
- );
- BOOST_CHECK(
- boost::compute::is_sorted(vector.begin(), vector.end(), greater, queue)
- );
- CHECK_RANGE_EQUAL(char_, 8, vector, ('c', 'a', 'F', 'B', '7', '0', '$', '\0'));
- }
- BOOST_AUTO_TEST_CASE(sort_mid_vector_int)
- {
- if(is_apple_cpu_device(device)) {
- return;
- }
- using boost::compute::int_;
- ::boost::compute::greater<int_> greater;
- ::boost::compute::less<int_> less;
- const int_ size = 748;
- std::vector<int_> data(size);
- for(int_ i = 0; i < size; i++){
- data[i] = i%2 ? i : -i;
- }
- boost::compute::vector<int_> vector(data.begin(), data.end(), queue);
- BOOST_CHECK_EQUAL(vector.size(), size);
- BOOST_CHECK(!boost::compute::is_sorted(vector.begin(), vector.end(), queue));
- // <
- boost::compute::detail::merge_sort_on_gpu(
- vector.begin(), vector.end(), less, queue
- );
- BOOST_CHECK(
- boost::compute::is_sorted(vector.begin(), vector.end(), less, queue)
- );
- // >
- boost::compute::detail::merge_sort_on_gpu(
- vector.begin(), vector.end(), greater, queue
- );
- BOOST_CHECK(
- boost::compute::is_sorted(vector.begin(), vector.end(), greater, queue)
- );
- }
- BOOST_AUTO_TEST_CASE(sort_mid_vector_ulong)
- {
- if(is_apple_cpu_device(device)) {
- return;
- }
- using boost::compute::ulong_;
- ::boost::compute::greater<ulong_> greater;
- ::boost::compute::less<ulong_> less;
- const ulong_ size = 260;
- std::vector<ulong_> data(size);
- for(ulong_ i = 0; i < size; i++){
- data[i] = i%2 ? i : i * i;
- }
- boost::compute::vector<ulong_> vector(data.begin(), data.end(), queue);
- BOOST_CHECK_EQUAL(vector.size(), size);
- BOOST_CHECK(!boost::compute::is_sorted(vector.begin(), vector.end(), queue));
- // <
- boost::compute::detail::merge_sort_on_gpu(
- vector.begin(), vector.end(), less, queue
- );
- BOOST_CHECK(
- boost::compute::is_sorted(vector.begin(), vector.end(), less, queue)
- );
- // >
- boost::compute::detail::merge_sort_on_gpu(
- vector.begin(), vector.end(), greater, queue
- );
- BOOST_CHECK(
- boost::compute::is_sorted(vector.begin(), vector.end(), greater, queue)
- );
- }
- BOOST_AUTO_TEST_CASE(sort_mid_vector_float)
- {
- if(is_apple_cpu_device(device)) {
- return;
- }
- using boost::compute::float_;
- ::boost::compute::greater<float_> greater;
- ::boost::compute::less<float_> less;
- const int size = 513;
- std::vector<float_> data(size);
- for(int i = 0; i < size; i++){
- data[i] = float_(i%2 ? i : -i);
- }
- boost::compute::vector<float_> vector(data.begin(), data.end(), queue);
- BOOST_CHECK_EQUAL(vector.size(), size);
- BOOST_CHECK(!boost::compute::is_sorted(vector.begin(), vector.end(), queue));
- // <
- boost::compute::detail::merge_sort_on_gpu(
- vector.begin(), vector.end(), less, queue
- );
- BOOST_CHECK(
- boost::compute::is_sorted(vector.begin(), vector.end(), less, queue)
- );
- // >
- boost::compute::detail::merge_sort_on_gpu(
- vector.begin(), vector.end(), greater, queue
- );
- queue.finish();
- BOOST_CHECK(
- boost::compute::is_sorted(vector.begin(), vector.end(), greater, queue)
- );
- }
- BOOST_AUTO_TEST_CASE(sort_mid_vector_double)
- {
- if(is_apple_cpu_device(device)) {
- return;
- }
- if(!device.supports_extension("cl_khr_fp64")){
- std::cout << "skipping test: device does not support double" << std::endl;
- return;
- }
- using boost::compute::double_;
- ::boost::compute::greater<double_> greater;
- ::boost::compute::less<double_> less;
- const int size = 1023;
- std::vector<double_> data(size);
- for(int i = 0; i < size; i++){
- data[i] = double_(i%2 ? i : -i);
- }
- boost::compute::vector<double_> vector(data.begin(), data.end(), queue);
- BOOST_CHECK_EQUAL(vector.size(), size);
- BOOST_CHECK(!boost::compute::is_sorted(vector.begin(), vector.end(), queue));
- // <
- boost::compute::detail::merge_sort_on_gpu(
- vector.begin(), vector.end(), less, queue
- );
- BOOST_CHECK(
- boost::compute::is_sorted(vector.begin(), vector.end(), less, queue)
- );
- // >
- boost::compute::detail::merge_sort_on_gpu(
- vector.begin(), vector.end(), greater, queue
- );
- queue.finish();
- BOOST_CHECK(
- boost::compute::is_sorted(vector.begin(), vector.end(), greater, queue)
- );
- }
- BOOST_AUTO_TEST_CASE(sort_mid_vector_int_custom_comparison_func)
- {
- if(is_apple_cpu_device(device)) {
- return;
- }
- using boost::compute::int_;
- ::boost::compute::greater<int_> greater;
- ::boost::compute::less<int_> less;
- const int_ size = 1024;
- std::vector<int_> data(size);
- for(int_ i = 0; i < size; i++){
- data[i] = i%2 ? size - i : i - size;
- }
- BOOST_COMPUTE_FUNCTION(bool, abs_sort, (int_ a, int_ b),
- {
- return abs(a) < abs(b);
- });
- boost::compute::vector<int_> vector(data.begin(), data.end(), queue);
- BOOST_CHECK_EQUAL(vector.size(), size);
- BOOST_CHECK(
- !boost::compute::is_sorted(vector.begin(), vector.end(), abs_sort, queue)
- );
- boost::compute::detail::merge_sort_on_gpu(
- vector.begin(), vector.end(), abs_sort, queue
- );
- BOOST_CHECK(
- boost::compute::is_sorted(vector.begin(), vector.end(), abs_sort, queue)
- );
- }
- BOOST_AUTO_TEST_CASE(sort_mid_vector_int2)
- {
- if(is_apple_cpu_device(device)) {
- return;
- }
- using boost::compute::int2_;
- using boost::compute::int_;
- ::boost::compute::greater<int2_> greater;
- ::boost::compute::less<int2_> less;
- const int_ size = 1024;
- std::vector<int2_> data(size);
- for(int_ i = 0; i < size; i++){
- data[i] = i%2 ? int2_(i, i) : int2_(i - size, i - size);
- }
- BOOST_COMPUTE_FUNCTION(bool, abs_sort, (int2_ a, int2_ b),
- {
- return abs(a.x + a.y) < abs(b.x + b.y);
- });
- boost::compute::vector<int2_> vector(data.begin(), data.end(), queue);
- BOOST_CHECK_EQUAL(vector.size(), size);
- BOOST_CHECK(
- !boost::compute::is_sorted(vector.begin(), vector.end(), abs_sort, queue)
- );
- boost::compute::detail::merge_sort_on_gpu(
- vector.begin(), vector.end(), abs_sort, queue
- );
- BOOST_CHECK(
- boost::compute::is_sorted(vector.begin(), vector.end(), abs_sort, queue)
- );
- }
- BOOST_AUTO_TEST_CASE(sort_mid_vector_long8)
- {
- if(is_apple_cpu_device(device)) {
- return;
- }
- using boost::compute::long8_;
- using boost::compute::long_;
- ::boost::compute::greater<long8_> greater;
- ::boost::compute::less<long8_> less;
- const long_ size = 256;
- std::vector<long8_> data(size);
- for(long_ i = 0; i < size; i++){
- data[i] = i%2 ? long8_(i) : long8_(i * i);
- }
- BOOST_COMPUTE_FUNCTION(bool, comp, (long8_ a, long8_ b),
- {
- return a.s0 < b.s3;
- });
- boost::compute::vector<long8_> vector(data.begin(), data.end(), queue);
- BOOST_CHECK_EQUAL(vector.size(), size);
- BOOST_CHECK(
- !boost::compute::is_sorted(vector.begin(), vector.end(), comp, queue)
- );
- boost::compute::detail::merge_sort_on_gpu(
- vector.begin(), vector.end(), comp, queue
- );
- BOOST_CHECK(
- boost::compute::is_sorted(vector.begin(), vector.end(), comp, queue)
- );
- }
- BOOST_AUTO_TEST_CASE(stable_sort_vector_int2)
- {
- if(is_apple_cpu_device(device)) {
- return;
- }
- using boost::compute::int2_;
- int2_ data[] = {
- int2_(8, 3), int2_(5, 1),
- int2_(2, 1), int2_(6, 1),
- int2_(8, 1), int2_(7, 1),
- int2_(4, 1), int2_(8, 2)
- };
- BOOST_COMPUTE_FUNCTION(bool, comp, (int2_ a, int2_ b),
- {
- return a.x < b.x;
- });
- boost::compute::vector<int2_> vector(data, data + 8, queue);
- BOOST_CHECK_EQUAL(vector.size(), 8);
- BOOST_CHECK(
- !boost::compute::is_sorted(vector.begin(), vector.end(), comp, queue)
- );
- //
- boost::compute::detail::merge_sort_on_gpu(
- vector.begin(), vector.end(), comp, true /*stable*/, queue
- );
- BOOST_CHECK(
- boost::compute::is_sorted(vector.begin(), vector.end(), comp, queue)
- );
- CHECK_RANGE_EQUAL(
- int2_, 8, vector,
- (
- int2_(2, 1), int2_(4, 1),
- int2_(5, 1), int2_(6, 1),
- int2_(7, 1), int2_(8, 3),
- int2_(8, 1), int2_(8, 2)
- )
- );
- }
- BOOST_AUTO_TEST_SUITE_END()
|