diff options
author | D. Van Assche <dimitri.vanassche@macq.eu> | 2016-08-18 17:33:13 +0200 |
---|---|---|
committer | D. Van Assche <dimitri.vanassche@macq.eu> | 2016-08-18 17:33:13 +0200 |
commit | 57f1aa76857cf0566e05b43b9b2a98a3a6139c8b (patch) | |
tree | 4ed277095302ea0870b764dde32936dad56bb410 /src/kernels/level3/xgemm_part2.opencl | |
parent | 7c13bacf129291e3e295ecb6e833788477085fa0 (diff) |
Adapt OpenCL files for OpenCL 1.1
In OpenCL 1.1, __kernel has to come before __attribute__, at least with
the Vivante compiler.
Diffstat (limited to 'src/kernels/level3/xgemm_part2.opencl')
-rw-r--r-- | src/kernels/level3/xgemm_part2.opencl | 12 |
1 files changed, 6 insertions, 6 deletions
diff --git a/src/kernels/level3/xgemm_part2.opencl b/src/kernels/level3/xgemm_part2.opencl index 42c1127c..60e38c06 100644 --- a/src/kernels/level3/xgemm_part2.opencl +++ b/src/kernels/level3/xgemm_part2.opencl @@ -268,8 +268,8 @@ inline void XgemmBody(const int kSizeM, const int kSizeN, const int kSizeK, #if defined(ROUTINE_SYRK) || defined(ROUTINE_HERK) || defined(ROUTINE_SYR2K) || defined(ROUTINE_HER2K) // Main entry point of the kernel. This is the upper-triangular version. -__attribute__((reqd_work_group_size(MDIMC, NDIMC, 1))) -__kernel void XgemmUpper(const int kSizeN, const int kSizeK, +__kernel __attribute__((reqd_work_group_size(MDIMC, NDIMC, 1))) +void XgemmUpper(const int kSizeN, const int kSizeK, const __constant real* restrict arg_alpha, const __constant real* restrict arg_beta, const __global realM* restrict agm, @@ -308,8 +308,8 @@ __kernel void XgemmUpper(const int kSizeN, const int kSizeK, } // Main entry point of the kernel. This is the lower-triangular version. -__attribute__((reqd_work_group_size(MDIMC, NDIMC, 1))) -__kernel void XgemmLower(const int kSizeN, const int kSizeK, +__kernel __attribute__((reqd_work_group_size(MDIMC, NDIMC, 1))) +void XgemmLower(const int kSizeN, const int kSizeK, const __constant real* restrict arg_alpha, const __constant real* restrict arg_beta, const __global realM* restrict agm, @@ -352,8 +352,8 @@ __kernel void XgemmLower(const int kSizeN, const int kSizeK, #else // Main entry point of the kernel. This is the regular full version. -__attribute__((reqd_work_group_size(MDIMC, NDIMC, 1))) -__kernel void Xgemm(const int kSizeM, const int kSizeN, const int kSizeK, +__kernel __attribute__((reqd_work_group_size(MDIMC, NDIMC, 1))) +void Xgemm(const int kSizeM, const int kSizeN, const int kSizeK, const __constant real* restrict arg_alpha, const __constant real* restrict arg_beta, const __global realM* restrict agm, |