diff options
author | Cedric Nugteren <web@cedricnugteren.nl> | 2018-05-31 20:09:49 +0200 |
---|---|---|
committer | Cedric Nugteren <web@cedricnugteren.nl> | 2018-05-31 20:09:49 +0200 |
commit | e609220393654e5400b0acd0d362367f5fe28ab8 (patch) | |
tree | abb4ed1edf5f483e4ecc89b68614b87c922e4af9 /src/routines | |
parent | ff4d5558a6d945592cc51760628a77237cd30f67 (diff) |
Some potential fixes for error -54 when launching TRSV and TRSM kernels
Diffstat (limited to 'src/routines')
-rw-r--r-- | src/routines/levelx/xinvert.cpp | 3 |
1 file changed, 2 insertions, 1 deletion
```diff
diff --git a/src/routines/levelx/xinvert.cpp b/src/routines/levelx/xinvert.cpp
index 65a28d73..09ef3ec1 100644
--- a/src/routines/levelx/xinvert.cpp
+++ b/src/routines/levelx/xinvert.cpp
@@ -113,7 +113,8 @@ void Xinvert<T>::InvertMatrixDiagonalBlocks(const Layout layout, const Triangle
     const auto npages = CeilDiv(n, current_size*2);
     const auto local0 = (current_size <= 32) ? current_size/4 : 16;
     const auto local = std::vector<size_t>{local0, 4};
-    const auto global = std::vector<size_t>{(current_size/local[1]), npages*(current_size/16)*local[1]};
+    const auto global = std::vector<size_t>{Ceil(current_size/local[1], local[0]),
+                                            Ceil(npages*(current_size/16)*local[1], local[1])};
 
     // Part 1
     auto kernel1 = Kernel(program_, "TripleMatMul" + ToString(current_size) + "Part1" + name_postfix);
```