//---------------------------------------------------------------------------// // Copyright (c) 2013-2014 Kyle Lutz // // Distributed under the Boost Software License, Version 1.0 // See accompanying file LICENSE_1_0.txt or copy at // http://www.boost.org/LICENSE_1_0.txt // // See http://boostorg.github.com/compute for more information. //---------------------------------------------------------------------------// #include #include #include #include #include #include #include #include "perf.hpp" int main(int argc, char *argv[]) { perf_parse_args(argc, argv); std::cout << "size: " << PERF_N << std::endl; thrust::host_vector v1(std::floor(PERF_N / 2.0)); thrust::host_vector v2(std::ceil(PERF_N / 2.0)); std::generate(v1.begin(), v1.end(), rand); std::generate(v2.begin(), v2.end(), rand); std::sort(v1.begin(), v1.end()); std::sort(v2.begin(), v2.end()); // transfer data to the device thrust::device_vector gpu_v1 = v1; thrust::device_vector gpu_v2 = v2; thrust::device_vector gpu_v3(PERF_N); perf_timer t; for(size_t trial = 0; trial < PERF_TRIALS; trial++){ t.start(); thrust::merge( gpu_v1.begin(), gpu_v1.end(), gpu_v2.begin(), gpu_v2.end(), gpu_v3.begin() ); cudaDeviceSynchronize(); t.stop(); } std::cout << "time: " << t.min_time() / 1e6 << " ms" << std::endl; thrust::host_vector check_v3 = gpu_v3; thrust::host_vector v3(PERF_N); std::merge(v1.begin(), v1.end(), v2.begin(), v2.end(), v3.begin()); bool ok = std::equal(check_v3.begin(), check_v3.end(), v3.begin()); if(!ok){ std::cerr << "ERROR: merged ranges different" << std::endl; return -1; } return 0; }