#include #include #include template __global__ void transform_reduce_kernel(ExecutionPolicy exec, Iterator1 first, Iterator1 last, Function1 f1, T init, Function2 f2, Iterator2 result) { *result = thrust::transform_reduce(exec, first, last, f1, init, f2); } template void TestTransformReduceDevice(ExecutionPolicy exec) { typedef thrust::device_vector Vector; typedef typename Vector::value_type T; Vector data(3); data[0] = 1; data[1] = -2; data[2] = 3; T init = 10; thrust::device_vector result(1); transform_reduce_kernel<<<1,1>>>(exec, data.begin(), data.end(), thrust::negate(), init, thrust::plus(), result.begin()); cudaError_t const err = cudaDeviceSynchronize(); ASSERT_EQUAL(cudaSuccess, err); ASSERT_EQUAL(8, (T)result[0]); } void TestTransformReduceDeviceSeq() { TestTransformReduceDevice(thrust::seq); } DECLARE_UNITTEST(TestTransformReduceDeviceSeq); void TestTransformReduceDeviceDevice() { TestTransformReduceDevice(thrust::device); } DECLARE_UNITTEST(TestTransformReduceDeviceDevice); void TestTransformReduceCudaStreams() { typedef thrust::device_vector Vector; typedef Vector::value_type T; Vector data(3); data[0] = 1; data[1] = -2; data[2] = 3; T init = 10; cudaStream_t s; cudaStreamCreate(&s); T result = thrust::transform_reduce(thrust::cuda::par.on(s), data.begin(), data.end(), thrust::negate(), init, thrust::plus()); cudaStreamSynchronize(s); ASSERT_EQUAL(8, result); cudaStreamDestroy(s); } DECLARE_UNITTEST(TestTransformReduceCudaStreams);