summary | refs | log | tree | commit | diff
path: root/src/routines
diff options
context:
space:
mode:
author: Cedric Nugteren <web@cedricnugteren.nl>, 2016-09-25 14:48:34 +0200
committer: Cedric Nugteren <web@cedricnugteren.nl>, 2016-09-25 14:48:34 +0200
commit: 73d135c2cef9763b47d410b125eb8bb89ece8432 (patch)
tree: bc7aa23b620f717b04a348444f2a50164fa2f169 /src/routines
parent: 669f43aed65ccd4aae9c4a478e994660f3e2a592 (diff)
Added a first version of a tuner for the GEMM direct kernel; collapsed MWGD, NWGD and KWGD into one WGD parameter
Diffstat (limited to 'src/routines')
-rw-r--r-- src/routines/level3/xgemm.cpp | 8
1 files changed, 4 insertions, 4 deletions
diff --git a/src/routines/level3/xgemm.cpp b/src/routines/level3/xgemm.cpp
index 2fb9f1fd..e050e844 100644
--- a/src/routines/level3/xgemm.cpp
+++ b/src/routines/level3/xgemm.cpp
@@ -300,11 +300,11 @@ StatusCode Xgemm<T>::GemmDirect(const size_t m, const size_t n, const size_t k,
kernel.SetArgument(18, static_cast<int>(b_conjugate));
// Computes the global and local thread sizes
- const auto m_ceiled = Ceil(m, db_["MWGD"]);
- const auto n_ceiled = Ceil(n, db_["NWGD"]);
+ const auto m_ceiled = Ceil(m, db_["WGD"]);
+ const auto n_ceiled = Ceil(n, db_["WGD"]);
const auto global = std::vector<size_t>{
- (m_ceiled * db_["MDIMCD"]) / db_["MWGD"],
- (n_ceiled * db_["NDIMCD"]) / db_["NWGD"]
+ (m_ceiled * db_["MDIMCD"]) / db_["WGD"],
+ (n_ceiled * db_["NDIMCD"]) / db_["WGD"]
};
const auto local = std::vector<size_t>{db_["MDIMCD"], db_["NDIMCD"]};