diff options
Diffstat (limited to 'src/kernels/level2')
-rw-r--r-- | src/kernels/level2/xgemv.opencl | 2 | ||||
-rw-r--r-- | src/kernels/level2/xgemv_fast.opencl | 4 | ||||
-rw-r--r-- | src/kernels/level2/xger.opencl | 2 | ||||
-rw-r--r-- | src/kernels/level2/xher.opencl | 2 | ||||
-rw-r--r-- | src/kernels/level2/xher2.opencl | 2 | ||||
-rw-r--r-- | src/kernels/level2/xtrsv.opencl | 4 |
6 files changed, 8 insertions, 8 deletions
diff --git a/src/kernels/level2/xgemv.opencl b/src/kernels/level2/xgemv.opencl index 16711aa4..15912a60 100644 --- a/src/kernels/level2/xgemv.opencl +++ b/src/kernels/level2/xgemv.opencl @@ -212,7 +212,7 @@ INLINE_FUNC real LoadMatrixA(const __global real* restrict agm, const int x, con // Full version of the kernel #if RELAX_WORKGROUP_SIZE == 1 __kernel -#elif +#else __kernel __attribute__((reqd_work_group_size(WGS1, 1, 1))) #endif void Xgemv(const int m, const int n, diff --git a/src/kernels/level2/xgemv_fast.opencl b/src/kernels/level2/xgemv_fast.opencl index 853d3d28..46087af7 100644 --- a/src/kernels/level2/xgemv_fast.opencl +++ b/src/kernels/level2/xgemv_fast.opencl @@ -90,7 +90,7 @@ INLINE_FUNC realVF LoadMatrixAVF(const __global realVF* restrict agm, const int // --> 'do_conjugate' is 0 #if RELAX_WORKGROUP_SIZE == 1 __kernel -#elif +#else __kernel __attribute__((reqd_work_group_size(WGS2, 1, 1))) #endif void XgemvFast(const int m, const int n, @@ -197,7 +197,7 @@ void XgemvFast(const int m, const int n, // --> 'do_conjugate' is 0 #if RELAX_WORKGROUP_SIZE == 1 __kernel -#elif +#else __kernel __attribute__((reqd_work_group_size(WGS3, 1, 1))) #endif void XgemvFastRot(const int m, const int n, diff --git a/src/kernels/level2/xger.opencl b/src/kernels/level2/xger.opencl index 3620c66a..b1fe8447 100644 --- a/src/kernels/level2/xger.opencl +++ b/src/kernels/level2/xger.opencl @@ -20,7 +20,7 @@ R"( // Regular version of the rank-1 matrix update kernel (GER, GERU, GERC) #if RELAX_WORKGROUP_SIZE == 1 __kernel -#elif +#else __kernel __attribute__((reqd_work_group_size(WGS1, WGS2, 1))) #endif void Xger(const int max1, const int max2, diff --git a/src/kernels/level2/xher.opencl b/src/kernels/level2/xher.opencl index 9e460cd4..eac8c10a 100644 --- a/src/kernels/level2/xher.opencl +++ b/src/kernels/level2/xher.opencl @@ -20,7 +20,7 @@ R"( // Symmetric version of the rank-1 matrix update kernel (HER, HPR, SYR, SPR) #if RELAX_WORKGROUP_SIZE == 1 __kernel -#elif +#else __kernel __attribute__((reqd_work_group_size(WGS1, WGS2, 1))) #endif void Xher(const int n, diff --git a/src/kernels/level2/xher2.opencl b/src/kernels/level2/xher2.opencl index c3e85c15..9e7f3c6c 100644 --- a/src/kernels/level2/xher2.opencl +++ b/src/kernels/level2/xher2.opencl @@ -20,7 +20,7 @@ R"( // Symmetric version of the rank-2 matrix update kernel (HER2, HPR2, SYR2, SPR2) #if RELAX_WORKGROUP_SIZE == 1 __kernel -#elif +#else __kernel __attribute__((reqd_work_group_size(WGS1, WGS2, 1))) #endif void Xher2(const int n, diff --git a/src/kernels/level2/xtrsv.opencl b/src/kernels/level2/xtrsv.opencl index e3b5418c..7677377e 100644 --- a/src/kernels/level2/xtrsv.opencl +++ b/src/kernels/level2/xtrsv.opencl @@ -41,7 +41,7 @@ void FillVector(const int n, const int inc, const int offset, #if RELAX_WORKGROUP_SIZE == 1 __kernel -#elif +#else __kernel __attribute__((reqd_work_group_size(TRSV_BLOCK_SIZE, 1, 1))) #endif void trsv_forward(int n, @@ -93,7 +93,7 @@ void trsv_forward(int n, #if RELAX_WORKGROUP_SIZE == 1 __kernel -#elif +#else __kernel __attribute__((reqd_work_group_size(TRSV_BLOCK_SIZE, 1, 1))) #endif void trsv_backward(int n, |