#include #include #include template __global__ void max_element_kernel(ExecutionPolicy exec, Iterator first, Iterator last, Iterator2 result) { *result = thrust::max_element(exec, first, last); } template __global__ void max_element_kernel(ExecutionPolicy exec, Iterator first, Iterator last, BinaryPredicate pred, Iterator2 result) { *result = thrust::max_element(exec, first, last, pred); } template void TestMaxElementDevice(ExecutionPolicy exec) { size_t n = 1000; thrust::host_vector h_data = unittest::random_samples(n); thrust::device_vector d_data = h_data; typedef typename thrust::device_vector::iterator iter_type; thrust::device_vector d_result(1); typename thrust::host_vector::iterator h_max = thrust::max_element(h_data.begin(), h_data.end()); max_element_kernel<<<1,1>>>(exec, d_data.begin(), d_data.end(), d_result.begin()); { cudaError_t const err = cudaDeviceSynchronize(); ASSERT_EQUAL(cudaSuccess, err); } ASSERT_EQUAL(h_max - h_data.begin(), (iter_type)d_result[0] - d_data.begin()); typename thrust::host_vector::iterator h_min = thrust::max_element(h_data.begin(), h_data.end(), thrust::greater()); max_element_kernel<<<1,1>>>(exec, d_data.begin(), d_data.end(), thrust::greater(), d_result.begin()); { cudaError_t const err = cudaDeviceSynchronize(); ASSERT_EQUAL(cudaSuccess, err); } ASSERT_EQUAL(h_min - h_data.begin(), (iter_type)d_result[0] - d_data.begin()); } void TestMaxElementDeviceSeq() { TestMaxElementDevice(thrust::seq); } DECLARE_UNITTEST(TestMaxElementDeviceSeq); void TestMaxElementDeviceDevice() { TestMaxElementDevice(thrust::device); } DECLARE_UNITTEST(TestMaxElementDeviceDevice); void TestMaxElementDeviceNoSync() { TestMaxElementDevice(thrust::cuda::par_nosync); } DECLARE_UNITTEST(TestMaxElementDeviceNoSync); template void TestMaxElementCudaStreams(ExecutionPolicy policy) { typedef thrust::device_vector Vector; typedef Vector::value_type T; Vector data(6); data[0] = 3; data[1] = 5; data[2] = 1; data[3] = 2; data[4] = 5; data[5] = 1; cudaStream_t s; cudaStreamCreate(&s); auto streampolicy = policy.on(s); ASSERT_EQUAL( *thrust::max_element(streampolicy, data.begin(), data.end()), 5); ASSERT_EQUAL( thrust::max_element(streampolicy, data.begin(), data.end()) - data.begin(), 1); ASSERT_EQUAL( *thrust::max_element(streampolicy, data.begin(), data.end(), thrust::greater()), 1); ASSERT_EQUAL( thrust::max_element(streampolicy, data.begin(), data.end(), thrust::greater()) - data.begin(), 2); cudaStreamDestroy(s); } void TestMaxElementCudaStreamsSync(){ TestMaxElementCudaStreams(thrust::cuda::par); } DECLARE_UNITTEST(TestMaxElementCudaStreamsSync); void TestMaxElementCudaStreamsNoSync(){ TestMaxElementCudaStreams(thrust::cuda::par_nosync); } DECLARE_UNITTEST(TestMaxElementCudaStreamsNoSync); void TestMaxElementDevicePointer() { typedef thrust::device_vector Vector; typedef Vector::value_type T; Vector data(6); data[0] = 3; data[1] = 5; data[2] = 1; data[3] = 2; data[4] = 5; data[5] = 1; T* raw_ptr = thrust::raw_pointer_cast(data.data()); size_t n = data.size(); ASSERT_EQUAL( thrust::max_element(thrust::device, raw_ptr, raw_ptr+n) - raw_ptr, 1); ASSERT_EQUAL( thrust::max_element(thrust::device, raw_ptr, raw_ptr+n, thrust::greater()) - raw_ptr, 2); } DECLARE_UNITTEST(TestMaxElementDevicePointer);