//#ifdef DOUBLE_PRECISION //#define FPTYPE double //#else //#define FPTYPE float //#endif __kernel void gemmN(const __global int* A, const __global int* B, ulong N, __global int* C) { // Thread identifiers const int globalRow = get_global_id(0); // Row ID of C (0..N) const int globalCol = get_global_id(1); // Col ID of C (0..N) // Compute a single element (loop over K) int acc = 0.0f; for (int k=0; k