summary refs log tree commit diff
path: root/test/correctness
diff options
context:
space:
mode:
author Cedric Nugteren <web@cedricnugteren.nl> 2017-12-03 12:00:37 +0100
committer Cedric Nugteren <web@cedricnugteren.nl> 2017-12-03 12:00:37 +0100
commit 60312e5878fd45225158dd8545a01366f937a871 (patch)
tree 0755588371b125df6f5c3a9e4be04a0ca53bdd63 /test/correctness
parent 92842024b0e9fb2df8e8e43c4499d0d2d13fefc0 (diff)
Reformatted transpose kernels for the pre-processor; extended the number of tests
Diffstat (limited to 'test/correctness')
-rw-r--r-- test/correctness/misc/preprocessor.cpp 25
1 file changed, 21 insertions, 4 deletions
diff --git a/test/correctness/misc/preprocessor.cpp b/test/correctness/misc/preprocessor.cpp
index cea91116..d352ce37 100644
--- a/test/correctness/misc/preprocessor.cpp
+++ b/test/correctness/misc/preprocessor.cpp
@@ -133,6 +133,7 @@ size_t RunPreprocessor(int argc, char *argv[], const bool silent, const Precisio
"#define WPT2 2\n"
"#define WPT3 2\n"
"#define UNROLL1 4\n"
+ "#define VW2 2\n"
#include "../src/kernels/level2/xgemv.opencl"
#include "../src/kernels/level2/xgemv_fast.opencl"
;
@@ -148,13 +149,29 @@ size_t RunPreprocessor(int argc, char *argv[], const bool silent, const Precisio
// CopyPad
const auto copy_pad_sources =
- "#define PAD_WPTX 2\n"
- "#define PAD_WPTY 2\n"
-#include "../src/kernels/level3/level3.opencl"
-#include "../src/kernels/level3/copy_pad.opencl"
+ "#define PAD_WPTX 2\n"
+ "#define PAD_WPTY 2\n"
+ #include "../src/kernels/level3/level3.opencl"
+ #include "../src/kernels/level3/copy_pad.opencl"
;
if (TestKernel(device, context, "CopyPadMatrix", copy_pad_sources, precision)) { passed++; } else { errors++; }
+ // TransposeFast
+ const auto transpose_fast_sources =
+ "#define TRA_WPT 2\n"
+ #include "../src/kernels/level3/level3.opencl"
+ #include "../src/kernels/level3/transpose_fast.opencl"
+ ;
+ if (TestKernel(device, context, "TransposeMatrixFast", transpose_fast_sources, precision)) { passed++; } else { errors++; }
+
+ // TransposePad
+ const auto transpose_pad_sources =
+ "#define PADTRA_WPT 2\n"
+ #include "../src/kernels/level3/level3.opencl"
+ #include "../src/kernels/level3/transpose_pad.opencl"
+ ;
+ if (TestKernel(device, context, "TransposePadMatrix", transpose_pad_sources, precision)) { passed++; } else { errors++; }
+
// Prints and returns the statistics