From cf4555d1f44aea9c82b60211b5650b6b77a1226c Mon Sep 17 00:00:00 2001
From: Cedric Nugteren
Date: Sun, 3 Dec 2017 16:40:36 +0100
Subject: Added GEMM (direct and in-direct) to the pre-processor testing; modified the loops in kernel accordingly

---
 src/kernels/level3/xgemm_direct_part1.opencl | 90 ++++++++++++++--------------
 1 file changed, 45 insertions(+), 45 deletions(-)

(limited to 'src/kernels/level3/xgemm_direct_part1.opencl')

diff --git a/src/kernels/level3/xgemm_direct_part1.opencl b/src/kernels/level3/xgemm_direct_part1.opencl
index 7d185224..e2f9c6a8 100644
--- a/src/kernels/level3/xgemm_direct_part1.opencl
+++ b/src/kernels/level3/xgemm_direct_part1.opencl
@@ -95,10 +95,10 @@ R"(
 // Initializes the accumulation registers to zero
 INLINE_FUNC void InitAccRegistersDirect(real cpm[NWID][MWID]) {
 #pragma unroll
- for (int mi=0; mi