From 489c5d76cfe95a97542dfeaa6d8b19cd9100919a Mon Sep 17 00:00:00 2001
From: Cedric Nugteren
Date: Wed, 18 May 2016 21:32:56 +0200
Subject: Merged in latest changes from 0.7.1 release

---
 src/kernels/level3/xgemm_part2.opencl | 138 +++++++++++++++++-----------------
 1 file changed, 71 insertions(+), 67 deletions(-)

(limited to 'src/kernels/level3/xgemm_part2.opencl')

diff --git a/src/kernels/level3/xgemm_part2.opencl b/src/kernels/level3/xgemm_part2.opencl
index a8c8ebf5..56ccdb96 100644
--- a/src/kernels/level3/xgemm_part2.opencl
+++ b/src/kernels/level3/xgemm_part2.opencl
@@ -69,42 +69,43 @@ inline void MultiplyAccumulate(realM cpm[NWI][MWI/VWM], realM apm[MWI/VWM], real
 for (int ni=0; ni
[... the rest of this hunk and any following hunks were lost in extraction (text between a '<' and a later '>' was dropped); the fragment below is the tail of a removed line ...]
 get_group_id(0)*MWG) {
+ if (GetGroupID1()*NWG > GetGroupID0()*MWG) {
 return;
 }
-- 
cgit v1.2.3