From 9f02fb542ca659bf58d1efefdb334ea386ef10e8 Mon Sep 17 00:00:00 2001 From: Cedric Nugteren Date: Sat, 9 Dec 2017 20:44:21 +0100 Subject: Completed kernel modifications for pre-processor of all other kernels --- src/kernels/level2/xher.opencl | 24 +++++++++++++----------- 1 file changed, 13 insertions(+), 11 deletions(-) (limited to 'src/kernels/level2/xher.opencl') diff --git a/src/kernels/level2/xher.opencl b/src/kernels/level2/xher.opencl index b0772218..8a57bdfc 100644 --- a/src/kernels/level2/xher.opencl +++ b/src/kernels/level2/xher.opencl @@ -27,32 +27,34 @@ void Xher(const int n, const real alpha = GetRealArg(arg_alpha); // Register storage for X and XT + #pragma promote_to_registers real xvalues[WPT]; + #pragma promote_to_registers real xtvalues[WPT]; // Loads the X-vector #pragma unroll - for (int w=0; w id2)) || (!is_upper && (id2 > id1))) { @@ -61,7 +63,7 @@ void Xher(const int n, // Loads A, performs the operation, and stores the result into A else { - MatrixUpdate(id1, id2, n, n, agm, a_offset, a_ld, alpha, xvalues[w2], xtvalues[w1], is_upper); + MatrixUpdate(id1, id2, n, n, agm, a_offset, a_ld, alpha, xvalues[_w2], xtvalues[_w1], is_upper); } } } -- cgit v1.2.3