#include #include #include #include #include #include #include template void print_sparse_vector(const IndexVector& A_index, const ValueVector& A_value) { assert(A_index.size() == A_value.size()); for(size_t i = 0; i < A_index.size(); i++) std::cout << "(" << A_index[i] << "," << A_value[i] << ") "; std::cout << std::endl; } template void sum_sparse_vectors(const IndexVector1& A_index, const ValueVector1& A_value, const IndexVector2& B_index, const ValueVector2& B_value, IndexVector3& C_index, ValueVector3& C_value) { typedef typename IndexVector3::value_type IndexType; typedef typename ValueVector3::value_type ValueType; assert(A_index.size() == A_value.size()); assert(B_index.size() == B_value.size()); size_t A_size = A_index.size(); size_t B_size = B_index.size(); // allocate storage for the combined contents of sparse vectors A and B IndexVector3 temp_index(A_size + B_size); ValueVector3 temp_value(A_size + B_size); // merge A and B by index thrust::merge_by_key(A_index.begin(), A_index.end(), B_index.begin(), B_index.end(), A_value.begin(), B_value.begin(), temp_index.begin(), temp_value.begin()); // compute number of unique indices size_t C_size = thrust::inner_product(temp_index.begin(), temp_index.end() - 1, temp_index.begin() + 1, size_t(0), thrust::plus(), thrust::not_equal_to()) + 1; // allocate space for output C_index.resize(C_size); C_value.resize(C_size); // sum values with the same index thrust::reduce_by_key(temp_index.begin(), temp_index.end(), temp_value.begin(), C_index.begin(), C_value.begin(), thrust::equal_to(), thrust::plus()); } int main(void) { // initialize sparse vector A with 4 elements thrust::device_vector A_index(4); thrust::device_vector A_value(4); A_index[0] = 2; A_value[0] = 10; A_index[1] = 3; A_value[1] = 60; A_index[2] = 5; A_value[2] = 20; A_index[3] = 8; A_value[3] = 40; // initialize sparse vector B with 6 elements thrust::device_vector B_index(6); thrust::device_vector B_value(6); B_index[0] = 1; B_value[0] = 50; B_index[1] = 2; B_value[1] = 30; B_index[2] = 4; B_value[2] = 80; B_index[3] = 5; B_value[3] = 30; B_index[4] = 7; B_value[4] = 90; B_index[5] = 8; B_value[5] = 10; // compute sparse vector C = A + B thrust::device_vector C_index; thrust::device_vector C_value; sum_sparse_vectors(A_index, A_value, B_index, B_value, C_index, C_value); std::cout << "Computing C = A + B for sparse vectors A and B" << std::endl; std::cout << "A "; print_sparse_vector(A_index, A_value); std::cout << "B "; print_sparse_vector(B_index, B_value); std::cout << "C "; print_sparse_vector(C_index, C_value); }