summary | refs | log | tree | commit | diff
path: root/src/kernels/level1/xdot.opencl
diff options
context:
space:
mode:
author Cedric Nugteren <web@cedricnugteren.nl> 2017-12-03 16:40:36 +0100
committer Cedric Nugteren <web@cedricnugteren.nl> 2017-12-03 16:40:36 +0100
commit cf4555d1f44aea9c82b60211b5650b6b77a1226c (patch)
tree 459676fcf89b85aaab7b014d935d1f5b3ab984fc /src/kernels/level1/xdot.opencl
parent 0a1a3de58a410f61f3b990537541a633826ea640 (diff)
Added GEMM (direct and indirect) to the pre-processor testing; modified the loops in the kernel accordingly
Diffstat (limited to 'src/kernels/level1/xdot.opencl')
-rw-r--r-- src/kernels/level1/xdot.opencl 2
1 files changed, 0 insertions, 2 deletions
diff --git a/src/kernels/level1/xdot.opencl b/src/kernels/level1/xdot.opencl
index 02f04ea7..1a703d96 100644
--- a/src/kernels/level1/xdot.opencl
+++ b/src/kernels/level1/xdot.opencl
@@ -55,7 +55,6 @@ void Xdot(const int n,
barrier(CLK_LOCAL_MEM_FENCE);
// Performs reduction in local memory
- #pragma unroll
for (int s=WGS1/2; s>0; s=s>>1) {
if (lid < s) {
Add(lm[lid], lm[lid], lm[lid + s]);
@@ -84,7 +83,6 @@ void XdotEpilogue(const __global real* restrict input,
barrier(CLK_LOCAL_MEM_FENCE);
// Performs reduction in local memory
- #pragma unroll
for (int s=WGS2/2; s>0; s=s>>1) {
if (lid < s) {
Add(lm[lid], lm[lid], lm[lid + s]);