summaryrefslogtreecommitdiff
path: root/src/routines/levelx/xgemmstridedbatched.cpp
diff options
context:
space:
mode:
Diffstat (limited to 'src/routines/levelx/xgemmstridedbatched.cpp')
-rw-r--r--src/routines/levelx/xgemmstridedbatched.cpp6
1 files changed, 4 insertions, 2 deletions
diff --git a/src/routines/levelx/xgemmstridedbatched.cpp b/src/routines/levelx/xgemmstridedbatched.cpp
index 48383cbd..8408f75a 100644
--- a/src/routines/levelx/xgemmstridedbatched.cpp
+++ b/src/routines/levelx/xgemmstridedbatched.cpp
@@ -66,7 +66,8 @@ void XgemmStridedBatched<T>::DoGemmStridedBatched(const Layout layout, const Tra
size_t a_one, a_two, b_one, b_two, c_one, c_two;
Xgemm<T>::ProcessArguments(layout, a_transpose, b_transpose, m, n, k,
a_one, a_two, b_one, b_two, c_one, c_two,
- a_do_transpose, b_do_transpose, c_do_transpose, a_conjugate, b_conjugate);
+ a_do_transpose, b_do_transpose, c_do_transpose, a_conjugate, b_conjugate,
+ db_["GEMMK"]);
// Tests the matrices for validity
for (auto batch = size_t{0}; batch < batch_count; ++batch) {
@@ -122,7 +123,8 @@ void XgemmStridedBatched<T>::BatchedGemmIndirect(const size_t m, const size_t n,
// whether the matrices need to be rotated or not for the kernel.
size_t a_one_i, a_two_i, b_one_i, b_two_i, c_one_i, c_two_i;
Xgemm<T>::CalculateInternalDimensions(m, n, k, db_["MWG"], db_["NWG"], db_["KWG"],
- a_one_i, a_two_i, b_one_i, b_two_i, c_one_i, c_two_i);
+ a_one_i, a_two_i, b_one_i, b_two_i, c_one_i, c_two_i,
+ db_["GEMMK"]);
// Determines whether or not temporary matrices are needed
auto a_no_temp = a_one == a_one_i && a_two == a_two_i && a_ld == a_one && !a_do_transpose && !a_conjugate;