diff options
author | Cedric Nugteren <web@cedricnugteren.nl> | 2016-06-16 18:07:46 +0200 |
---|---|---|
committer | Cedric Nugteren <web@cedricnugteren.nl> | 2016-06-16 18:07:46 +0200 |
commit | 52ccaf5b25e14c9ce032315e5e96b1f27886d481 (patch) | |
tree | 087288b7aebf2a06ffc4e7dcbcd4353f7a3be6a7 /src/routines/level3/xgemm.cc | |
parent | 39b7dbc5e37829abfbcfb77852b9138b31540b42 (diff) |
Added XOMATCOPY routines to perform out-of-place matrix scaling, copying, and/or transposing
Diffstat (limited to 'src/routines/level3/xgemm.cc')
-rw-r--r-- | src/routines/level3/xgemm.cc | 12 |
1 file changed, 8 insertions, 4 deletions
```diff
diff --git a/src/routines/level3/xgemm.cc b/src/routines/level3/xgemm.cc
index 6fa6a811..42d5f19e 100644
--- a/src/routines/level3/xgemm.cc
+++ b/src/routines/level3/xgemm.cc
@@ -145,7 +145,8 @@ StatusCode Xgemm<T>::DoGemm(const Layout layout,
       status = PadCopyTransposeMatrix(eventProcessA.pointer(), emptyEventList,
                                       a_one, a_two, a_ld, a_offset, a_buffer,
                                       m_ceiled, k_ceiled, m_ceiled, 0, a_temp,
-                                      program, true, a_do_transpose, a_conjugate);
+                                      ConstantOne<T>(), program,
+                                      true, a_do_transpose, a_conjugate);
       if (ErrorIn(status)) { return status; }
       eventWaitList.push_back(eventProcessA);
     }
@@ -156,7 +157,8 @@ StatusCode Xgemm<T>::DoGemm(const Layout layout,
       status = PadCopyTransposeMatrix(eventProcessB.pointer(), emptyEventList,
                                       b_one, b_two, b_ld, b_offset, b_buffer,
                                       n_ceiled, k_ceiled, n_ceiled, 0, b_temp,
-                                      program, true, b_do_transpose, b_conjugate);
+                                      ConstantOne<T>(), program,
+                                      true, b_do_transpose, b_conjugate);
       if (ErrorIn(status)) { return status; }
       eventWaitList.push_back(eventProcessB);
     }
@@ -167,7 +169,8 @@ StatusCode Xgemm<T>::DoGemm(const Layout layout,
       status = PadCopyTransposeMatrix(eventProcessC.pointer(), emptyEventList,
                                       c_one, c_two, c_ld, c_offset, c_buffer,
                                       m_ceiled, n_ceiled, m_ceiled, 0, c_temp,
-                                      program, true, c_do_transpose, false);
+                                      ConstantOne<T>(), program,
+                                      true, c_do_transpose, false);
       if (ErrorIn(status)) { return status; }
       eventWaitList.push_back(eventProcessC);
     }
@@ -205,7 +208,8 @@ StatusCode Xgemm<T>::DoGemm(const Layout layout,
       status = PadCopyTransposeMatrix(event_, eventWaitList,
                                       m_ceiled, n_ceiled, m_ceiled, 0, c_temp,
                                       c_one, c_two, c_ld, c_offset, c_buffer,
-                                      program, false, c_do_transpose, false);
+                                      ConstantOne<T>(), program,
+                                      false, c_do_transpose, false);
       if (ErrorIn(status)) { return status; }
     }
 
```