From 99afdcd9080e4b2e8b26d4bd7324a92714c71e89 Mon Sep 17 00:00:00 2001
From: mcian
Date: Mon, 31 Jul 2017 14:06:23 +0200
Subject: Restore direct GEMM to previous version

---
 src/routines/level3/xgemm.cpp | 10 ++++++----
 1 file changed, 6 insertions(+), 4 deletions(-)

(limited to 'src/routines/level3')

diff --git a/src/routines/level3/xgemm.cpp b/src/routines/level3/xgemm.cpp
index f4611aba..136eec43 100644
--- a/src/routines/level3/xgemm.cpp
+++ b/src/routines/level3/xgemm.cpp
@@ -280,11 +280,13 @@ void Xgemm<T>::GemmDirect(const size_t m, const size_t n, const size_t k,
   kernel.SetArgument(16, static_cast<int>(b_conjugate));
 
   // Computes the global and local thread sizes
-  //const auto m_ceiled = Ceil(m, db_["WGD"]);
-  //const auto n_ceiled = Ceil(n, db_["WGD"]);
+  const auto m_ceiled = Ceil(m, db_["WGD"]);
+  const auto n_ceiled = Ceil(n, db_["WGD"]);
   const auto global = std::vector<size_t>{
-    CeilDiv(m * db_["MDIMCD"], db_["WGD"]),
-    CeilDiv(n * db_["NDIMCD"], db_["WGD"])
+    // CeilDiv(m * db_["MDIMCD"], db_["WGD"]),
+    // CeilDiv(n * db_["NDIMCD"], db_["WGD"])
+    (m_ceiled * db_["MDIMCD"]) / db_["WGD"],
+    (n_ceiled * db_["NDIMCD"]) / db_["WGD"]
   };
   const auto local = std::vector<size_t>{db_["MDIMCD"], db_["NDIMCD"]};
 
-- 
cgit v1.2.3