diff options
author | mcian <mcian86@gmail.com> | 2017-07-31 14:02:12 +0200 |
---|---|---|
committer | GitHub <noreply@github.com> | 2017-07-31 14:02:12 +0200 |
commit | dc499065424af5dbf29a85bc6cbf4db9cd565cfd (patch) | |
tree | 3a7f9e86d30a1c700ae264caf46f0187c1e13177 /src/routines/level3 | |
parent | f2477f663672fd37301d6e2ce4646519f71d5cce (diff) | |
parent | 1155c068e982b1af19230c4c2d2e6dcb1d495414 (diff) |
Merge pull request #1 from CNugteren/master
fork up to date
Diffstat (limited to 'src/routines/level3')
-rw-r--r-- | src/routines/level3/xgemm.cpp | 8 |
1 file changed, 4 insertions, 4 deletions
```diff
diff --git a/src/routines/level3/xgemm.cpp b/src/routines/level3/xgemm.cpp
index 30e5999c..f4611aba 100644
--- a/src/routines/level3/xgemm.cpp
+++ b/src/routines/level3/xgemm.cpp
@@ -280,11 +280,11 @@ void Xgemm<T>::GemmDirect(const size_t m, const size_t n, const size_t k,
   kernel.SetArgument(16, static_cast<int>(b_conjugate));
 
   // Computes the global and local thread sizes
-  const auto m_ceiled = Ceil(m, db_["WGD"]);
-  const auto n_ceiled = Ceil(n, db_["WGD"]);
+  //const auto m_ceiled = Ceil(m, db_["WGD"]);
+  //const auto n_ceiled = Ceil(n, db_["WGD"]);
   const auto global = std::vector<size_t>{
-    (m_ceiled * db_["MDIMCD"]) / db_["WGD"],
-    (n_ceiled * db_["NDIMCD"]) / db_["WGD"]
+    CeilDiv(m * db_["MDIMCD"], db_["WGD"]),
+    CeilDiv(n * db_["NDIMCD"], db_["WGD"])
   };
   const auto local = std::vector<size_t>{db_["MDIMCD"], db_["NDIMCD"]};
 
```