summary refs log tree commit diff
path: root/src/routines/level2/xtrsv.cpp
diff options
context:
space:
mode:
author Cedric Nugteren <web@cedricnugteren.nl> 2018-05-31 22:37:06 +0200
committer Cedric Nugteren <web@cedricnugteren.nl> 2018-05-31 22:37:06 +0200
commit 5702bff5ad579466397f6537dc8925ebd64e3ba3 (patch)
tree b375ab600530fda9ac42aa0ab908b1f8fcd7042a /src/routines/level2/xtrsv.cpp
parent e609220393654e5400b0acd0d362367f5fe28ab8 (diff)
Added error-checking for half-empty local work group sizes; fixed a minor TRSV global worksize issue
Diffstat (limited to 'src/routines/level2/xtrsv.cpp')
-rw-r--r-- src/routines/level2/xtrsv.cpp 2
1 files changed, 1 insertions, 1 deletions
diff --git a/src/routines/level2/xtrsv.cpp b/src/routines/level2/xtrsv.cpp
index 5d2ddf54..76401753 100644
--- a/src/routines/level2/xtrsv.cpp
+++ b/src/routines/level2/xtrsv.cpp
@@ -68,7 +68,7 @@ void Xtrsv<T>::Substitution(const Layout layout, const Triangle triangle,
// Launches the kernel
const auto local = std::vector<size_t>{db_["TRSV_BLOCK_SIZE"]};
- const auto global = std::vector<size_t>{1};
+ const auto global = std::vector<size_t>{Ceil(n, db_["TRSV_BLOCK_SIZE"])};
auto event = Event();
RunKernel(kernel, queue_, device_, global, local, event.pointer());
event.WaitForCompletion();