test_merge_sort_gpu.cpp 10 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374
  1. //---------------------------------------------------------------------------//
  2. // Copyright (c) 2016 Jakub Szuppe <j.szuppe@gmail.com>
  3. //
  4. // Distributed under the Boost Software License, Version 1.0
  5. // See accompanying file LICENSE_1_0.txt or copy at
  6. // http://www.boost.org/LICENSE_1_0.txt
  7. //
  8. // See http://boostorg.github.com/compute for more information.
  9. //---------------------------------------------------------------------------//
  10. #define BOOST_TEST_MODULE TestMergeSortOnGPU
  11. #include <boost/test/unit_test.hpp>
  12. #include <iostream>
  13. #include <boost/compute/system.hpp>
  14. #include <boost/compute/algorithm/is_sorted.hpp>
  15. #include <boost/compute/algorithm/detail/merge_sort_on_gpu.hpp>
  16. #include <boost/compute/container/vector.hpp>
  17. #include "quirks.hpp"
  18. #include "check_macros.hpp"
  19. #include "context_setup.hpp"
  20. namespace bc = boost::compute;
  21. BOOST_AUTO_TEST_CASE(sort_small_vector_char)
  22. {
  23. if(is_apple_cpu_device(device)) {
  24. std::cerr
  25. << "skipping all merge_sort_on_gpu tests due to Apple platform"
  26. << " behavior when local memory is used on a CPU device"
  27. << std::endl;
  28. return;
  29. }
  30. using boost::compute::char_;
  31. ::boost::compute::greater<char_> greater;
  32. ::boost::compute::less<char_> less;
  33. char_ data[] = { 'c', 'a', '0', '7', 'B', 'F', '\0', '$' };
  34. boost::compute::vector<char_> vector(data, data + 8, queue);
  35. BOOST_CHECK_EQUAL(vector.size(), size_t(8));
  36. BOOST_CHECK(boost::compute::is_sorted(vector.begin(), vector.end(), queue) == false);
  37. // <
  38. boost::compute::detail::merge_sort_on_gpu(
  39. vector.begin(), vector.end(), less, queue
  40. );
  41. BOOST_CHECK(
  42. boost::compute::is_sorted(vector.begin(), vector.end(), less, queue)
  43. );
  44. CHECK_RANGE_EQUAL(char_, 8, vector, ('\0', '$', '0', '7', 'B', 'F', 'a', 'c'));
  45. // >
  46. boost::compute::detail::merge_sort_on_gpu(
  47. vector.begin(), vector.end(), greater, queue
  48. );
  49. BOOST_CHECK(
  50. boost::compute::is_sorted(vector.begin(), vector.end(), greater, queue)
  51. );
  52. CHECK_RANGE_EQUAL(char_, 8, vector, ('c', 'a', 'F', 'B', '7', '0', '$', '\0'));
  53. }
  54. BOOST_AUTO_TEST_CASE(sort_mid_vector_int)
  55. {
  56. if(is_apple_cpu_device(device)) {
  57. return;
  58. }
  59. using boost::compute::int_;
  60. ::boost::compute::greater<int_> greater;
  61. ::boost::compute::less<int_> less;
  62. const int_ size = 748;
  63. std::vector<int_> data(size);
  64. for(int_ i = 0; i < size; i++){
  65. data[i] = i%2 ? i : -i;
  66. }
  67. boost::compute::vector<int_> vector(data.begin(), data.end(), queue);
  68. BOOST_CHECK_EQUAL(vector.size(), size);
  69. BOOST_CHECK(!boost::compute::is_sorted(vector.begin(), vector.end(), queue));
  70. // <
  71. boost::compute::detail::merge_sort_on_gpu(
  72. vector.begin(), vector.end(), less, queue
  73. );
  74. BOOST_CHECK(
  75. boost::compute::is_sorted(vector.begin(), vector.end(), less, queue)
  76. );
  77. // >
  78. boost::compute::detail::merge_sort_on_gpu(
  79. vector.begin(), vector.end(), greater, queue
  80. );
  81. BOOST_CHECK(
  82. boost::compute::is_sorted(vector.begin(), vector.end(), greater, queue)
  83. );
  84. }
  85. BOOST_AUTO_TEST_CASE(sort_mid_vector_ulong)
  86. {
  87. if(is_apple_cpu_device(device)) {
  88. return;
  89. }
  90. using boost::compute::ulong_;
  91. ::boost::compute::greater<ulong_> greater;
  92. ::boost::compute::less<ulong_> less;
  93. const ulong_ size = 260;
  94. std::vector<ulong_> data(size);
  95. for(ulong_ i = 0; i < size; i++){
  96. data[i] = i%2 ? i : i * i;
  97. }
  98. boost::compute::vector<ulong_> vector(data.begin(), data.end(), queue);
  99. BOOST_CHECK_EQUAL(vector.size(), size);
  100. BOOST_CHECK(!boost::compute::is_sorted(vector.begin(), vector.end(), queue));
  101. // <
  102. boost::compute::detail::merge_sort_on_gpu(
  103. vector.begin(), vector.end(), less, queue
  104. );
  105. BOOST_CHECK(
  106. boost::compute::is_sorted(vector.begin(), vector.end(), less, queue)
  107. );
  108. // >
  109. boost::compute::detail::merge_sort_on_gpu(
  110. vector.begin(), vector.end(), greater, queue
  111. );
  112. BOOST_CHECK(
  113. boost::compute::is_sorted(vector.begin(), vector.end(), greater, queue)
  114. );
  115. }
  116. BOOST_AUTO_TEST_CASE(sort_mid_vector_float)
  117. {
  118. if(is_apple_cpu_device(device)) {
  119. return;
  120. }
  121. using boost::compute::float_;
  122. ::boost::compute::greater<float_> greater;
  123. ::boost::compute::less<float_> less;
  124. const int size = 513;
  125. std::vector<float_> data(size);
  126. for(int i = 0; i < size; i++){
  127. data[i] = float_(i%2 ? i : -i);
  128. }
  129. boost::compute::vector<float_> vector(data.begin(), data.end(), queue);
  130. BOOST_CHECK_EQUAL(vector.size(), size);
  131. BOOST_CHECK(!boost::compute::is_sorted(vector.begin(), vector.end(), queue));
  132. // <
  133. boost::compute::detail::merge_sort_on_gpu(
  134. vector.begin(), vector.end(), less, queue
  135. );
  136. BOOST_CHECK(
  137. boost::compute::is_sorted(vector.begin(), vector.end(), less, queue)
  138. );
  139. // >
  140. boost::compute::detail::merge_sort_on_gpu(
  141. vector.begin(), vector.end(), greater, queue
  142. );
  143. queue.finish();
  144. BOOST_CHECK(
  145. boost::compute::is_sorted(vector.begin(), vector.end(), greater, queue)
  146. );
  147. }
  148. BOOST_AUTO_TEST_CASE(sort_mid_vector_double)
  149. {
  150. if(is_apple_cpu_device(device)) {
  151. return;
  152. }
  153. if(!device.supports_extension("cl_khr_fp64")){
  154. std::cout << "skipping test: device does not support double" << std::endl;
  155. return;
  156. }
  157. using boost::compute::double_;
  158. ::boost::compute::greater<double_> greater;
  159. ::boost::compute::less<double_> less;
  160. const int size = 1023;
  161. std::vector<double_> data(size);
  162. for(int i = 0; i < size; i++){
  163. data[i] = double_(i%2 ? i : -i);
  164. }
  165. boost::compute::vector<double_> vector(data.begin(), data.end(), queue);
  166. BOOST_CHECK_EQUAL(vector.size(), size);
  167. BOOST_CHECK(!boost::compute::is_sorted(vector.begin(), vector.end(), queue));
  168. // <
  169. boost::compute::detail::merge_sort_on_gpu(
  170. vector.begin(), vector.end(), less, queue
  171. );
  172. BOOST_CHECK(
  173. boost::compute::is_sorted(vector.begin(), vector.end(), less, queue)
  174. );
  175. // >
  176. boost::compute::detail::merge_sort_on_gpu(
  177. vector.begin(), vector.end(), greater, queue
  178. );
  179. queue.finish();
  180. BOOST_CHECK(
  181. boost::compute::is_sorted(vector.begin(), vector.end(), greater, queue)
  182. );
  183. }
  184. BOOST_AUTO_TEST_CASE(sort_mid_vector_int_custom_comparison_func)
  185. {
  186. if(is_apple_cpu_device(device)) {
  187. return;
  188. }
  189. using boost::compute::int_;
  190. ::boost::compute::greater<int_> greater;
  191. ::boost::compute::less<int_> less;
  192. const int_ size = 1024;
  193. std::vector<int_> data(size);
  194. for(int_ i = 0; i < size; i++){
  195. data[i] = i%2 ? size - i : i - size;
  196. }
  197. BOOST_COMPUTE_FUNCTION(bool, abs_sort, (int_ a, int_ b),
  198. {
  199. return abs(a) < abs(b);
  200. });
  201. boost::compute::vector<int_> vector(data.begin(), data.end(), queue);
  202. BOOST_CHECK_EQUAL(vector.size(), size);
  203. BOOST_CHECK(
  204. !boost::compute::is_sorted(vector.begin(), vector.end(), abs_sort, queue)
  205. );
  206. boost::compute::detail::merge_sort_on_gpu(
  207. vector.begin(), vector.end(), abs_sort, queue
  208. );
  209. BOOST_CHECK(
  210. boost::compute::is_sorted(vector.begin(), vector.end(), abs_sort, queue)
  211. );
  212. }
  213. BOOST_AUTO_TEST_CASE(sort_mid_vector_int2)
  214. {
  215. if(is_apple_cpu_device(device)) {
  216. return;
  217. }
  218. using boost::compute::int2_;
  219. using boost::compute::int_;
  220. ::boost::compute::greater<int2_> greater;
  221. ::boost::compute::less<int2_> less;
  222. const int_ size = 1024;
  223. std::vector<int2_> data(size);
  224. for(int_ i = 0; i < size; i++){
  225. data[i] = i%2 ? int2_(i, i) : int2_(i - size, i - size);
  226. }
  227. BOOST_COMPUTE_FUNCTION(bool, abs_sort, (int2_ a, int2_ b),
  228. {
  229. return abs(a.x + a.y) < abs(b.x + b.y);
  230. });
  231. boost::compute::vector<int2_> vector(data.begin(), data.end(), queue);
  232. BOOST_CHECK_EQUAL(vector.size(), size);
  233. BOOST_CHECK(
  234. !boost::compute::is_sorted(vector.begin(), vector.end(), abs_sort, queue)
  235. );
  236. boost::compute::detail::merge_sort_on_gpu(
  237. vector.begin(), vector.end(), abs_sort, queue
  238. );
  239. BOOST_CHECK(
  240. boost::compute::is_sorted(vector.begin(), vector.end(), abs_sort, queue)
  241. );
  242. }
  243. BOOST_AUTO_TEST_CASE(sort_mid_vector_long8)
  244. {
  245. if(is_apple_cpu_device(device)) {
  246. return;
  247. }
  248. using boost::compute::long8_;
  249. using boost::compute::long_;
  250. ::boost::compute::greater<long8_> greater;
  251. ::boost::compute::less<long8_> less;
  252. const long_ size = 256;
  253. std::vector<long8_> data(size);
  254. for(long_ i = 0; i < size; i++){
  255. data[i] = i%2 ? long8_(i) : long8_(i * i);
  256. }
  257. BOOST_COMPUTE_FUNCTION(bool, comp, (long8_ a, long8_ b),
  258. {
  259. return a.s0 < b.s3;
  260. });
  261. boost::compute::vector<long8_> vector(data.begin(), data.end(), queue);
  262. BOOST_CHECK_EQUAL(vector.size(), size);
  263. BOOST_CHECK(
  264. !boost::compute::is_sorted(vector.begin(), vector.end(), comp, queue)
  265. );
  266. boost::compute::detail::merge_sort_on_gpu(
  267. vector.begin(), vector.end(), comp, queue
  268. );
  269. BOOST_CHECK(
  270. boost::compute::is_sorted(vector.begin(), vector.end(), comp, queue)
  271. );
  272. }
  273. BOOST_AUTO_TEST_CASE(stable_sort_vector_int2)
  274. {
  275. if(is_apple_cpu_device(device)) {
  276. return;
  277. }
  278. using boost::compute::int2_;
  279. int2_ data[] = {
  280. int2_(8, 3), int2_(5, 1),
  281. int2_(2, 1), int2_(6, 1),
  282. int2_(8, 1), int2_(7, 1),
  283. int2_(4, 1), int2_(8, 2)
  284. };
  285. BOOST_COMPUTE_FUNCTION(bool, comp, (int2_ a, int2_ b),
  286. {
  287. return a.x < b.x;
  288. });
  289. boost::compute::vector<int2_> vector(data, data + 8, queue);
  290. BOOST_CHECK_EQUAL(vector.size(), 8);
  291. BOOST_CHECK(
  292. !boost::compute::is_sorted(vector.begin(), vector.end(), comp, queue)
  293. );
  294. //
  295. boost::compute::detail::merge_sort_on_gpu(
  296. vector.begin(), vector.end(), comp, true /*stable*/, queue
  297. );
  298. BOOST_CHECK(
  299. boost::compute::is_sorted(vector.begin(), vector.end(), comp, queue)
  300. );
  301. CHECK_RANGE_EQUAL(
  302. int2_, 8, vector,
  303. (
  304. int2_(2, 1), int2_(4, 1),
  305. int2_(5, 1), int2_(6, 1),
  306. int2_(7, 1), int2_(8, 3),
  307. int2_(8, 1), int2_(8, 2)
  308. )
  309. );
  310. }
  311. BOOST_AUTO_TEST_SUITE_END()