From 60312e5878fd45225158dd8545a01366f937a871 Mon Sep 17 00:00:00 2001 From: Cedric Nugteren Date: Sun, 3 Dec 2017 12:00:37 +0100 Subject: Reformatted transpose kernels for the pre-processor; extended the number of tests --- src/kernels/level3/transpose_fast.opencl | 78 ++++++++++++++++---------------- src/kernels/level3/transpose_pad.opencl | 48 ++++++++++---------- test/correctness/misc/preprocessor.cpp | 25 ++++++++-- 3 files changed, 85 insertions(+), 66 deletions(-) diff --git a/src/kernels/level3/transpose_fast.opencl b/src/kernels/level3/transpose_fast.opencl index 37b25d99..8fa7405c 100644 --- a/src/kernels/level3/transpose_fast.opencl +++ b/src/kernels/level3/transpose_fast.opencl @@ -57,29 +57,31 @@ void TransposeMatrixFast(const int ld, // Loops over the work per thread #pragma unroll - for (int w_one=0; w_one