//------------------------------------------------------------------------------ // GB_AxB_saxpy4_jit: C+=A*B saxpy4 method, via the JIT //------------------------------------------------------------------------------ // SuiteSparse:GraphBLAS, Timothy A. Davis, (c) 2017-2023, All Rights Reserved. // SPDX-License-Identifier: Apache-2.0 //------------------------------------------------------------------------------ #include "GB.h" #include "GB_stringify.h" typedef GB_JIT_KERNEL_AXB_SAXPY4_PROTO ((*GB_jit_dl_function)) ; GrB_Info GB_AxB_saxpy4_jit // C+=A*B, saxpy4 method, via the JIT ( // input/output: GrB_Matrix C, // input: const GrB_Matrix A, const GrB_Matrix B, const GrB_Semiring semiring, const bool flipxy, const int ntasks, const int nthreads, const int nfine_tasks_per_vector, const bool use_coarse_tasks, const bool use_atomics, const int64_t *A_slice, const int64_t *H_slice, GB_void *restrict Wcx, int8_t *restrict Wf ) { //-------------------------------------------------------------------------- // encodify the problem //-------------------------------------------------------------------------- GB_jit_encoding encoding ; char *suffix ; ASSERT (!C->iso) ; ASSERT (GB_IS_FULL (C)) ; uint64_t hash = GB_encodify_mxm (&encoding, &suffix, GB_JIT_KERNEL_AXB_SAXPY4, false, false, GxB_FULL, C->type, NULL, true, false, semiring, flipxy, A, B) ; //-------------------------------------------------------------------------- // get the kernel function pointer, loading or compiling it if needed //-------------------------------------------------------------------------- void *dl_function ; GrB_Info info = GB_jitifyer_load (&dl_function, GB_jit_mxm_family, "AxB_saxpy4", hash, &encoding, suffix, semiring, NULL, NULL, C->type, A->type, B->type) ; if (info != GrB_SUCCESS) return (info) ; //-------------------------------------------------------------------------- // call the jit kernel and return result //-------------------------------------------------------------------------- GB_jit_dl_function GB_jit_kernel = (GB_jit_dl_function) dl_function ; return (GB_jit_kernel (C, A, B, ntasks, nthreads, nfine_tasks_per_vector, use_coarse_tasks, use_atomics, A_slice, H_slice, Wcx, Wf)) ; }