From d754586b49c6af64e049b625060ef7be08fa5525 Mon Sep 17 00:00:00 2001
From: Cedric Nugteren
Date: Fri, 10 Mar 2017 20:49:59 +0100
Subject: Added proper testing of the alpha parameter; finalized the batched AXPY implementation

---
 src/kernels/level1/xaxpy.opencl | 6 +++---
 1 file changed, 3 insertions(+), 3 deletions(-)

(limited to 'src/kernels')

diff --git a/src/kernels/level1/xaxpy.opencl b/src/kernels/level1/xaxpy.opencl
index 3f5ab2b5..f44bbce0 100644
--- a/src/kernels/level1/xaxpy.opencl
+++ b/src/kernels/level1/xaxpy.opencl
@@ -57,9 +57,9 @@ void XaxpyFast(const int n, const real_arg arg_alpha,
 
 // Full version of the kernel with offsets and strided accesses: batched version
 __kernel __attribute__((reqd_work_group_size(WGS, 1, 1)))
-void XaxpyBatched(const int n, const __global real_arg* arg_alphas,
-                  const __global real* restrict xgm, const __global int* restrict x_offsets, const int x_inc,
-                  __global real* ygm, const __global int* restrict y_offsets, const int y_inc) {
+void XaxpyBatched(const int n, const __constant real_arg* arg_alphas,
+                  const __global real* restrict xgm, const __constant int* x_offsets, const int x_inc,
+                  __global real* ygm, const __constant int* y_offsets, const int y_inc) {
   const int batch = get_group_id(1);
   const real alpha = GetRealArg(arg_alphas[batch]);
 
-- 
cgit v1.2.3