From 01d254c0b09549bb7921d1c777d1d53042c5d466 Mon Sep 17 00:00:00 2001 From: Cedric Nugteren Date: Sun, 27 May 2018 18:38:47 +0200 Subject: Added a check to return 'NotImplemented' error code in case of systems with < 16 LWGS for TSRV and TRSM --- src/routines/levelx/xinvert.cpp | 5 +++++ 1 file changed, 5 insertions(+) (limited to 'src/routines/levelx') diff --git a/src/routines/levelx/xinvert.cpp b/src/routines/levelx/xinvert.cpp index d851e0b9..65a28d73 100644 --- a/src/routines/levelx/xinvert.cpp +++ b/src/routines/levelx/xinvert.cpp @@ -49,6 +49,11 @@ void Xinvert::InvertMatrixDiagonalBlocks(const Layout layout, const Triangle throw BLASError(StatusCode::kInvalidDimension); } + // Some parts of this kernel are not tunable and thus require some minimal OpenCL properties + if (device_.MaxWorkGroupSize() < 16) { // minimum of total local work size of 16 + throw RuntimeErrorCode(StatusCode::kNotImplemented); + } + // Helper variables const auto internal_block_size = static_cast(db_["INTERNAL_BLOCK_SIZE"]); assert(internal_block_size == 16); -- cgit v1.2.3