diff options
author | Tarmo Räntilä <trantila@iki.fi> | 2019-12-09 22:13:52 +0200 |
---|---|---|
committer | Tarmo Räntilä <trantila@iki.fi> | 2019-12-09 22:13:52 +0200 |
commit | bf50c4e53e1815d4b376f35b5be5c747cd857414 (patch) | |
tree | 8a69853eda4cb591739e08b023f06fab05a05fd9 /src/routines/levelx/xgemmbatched.cpp | |
parent | 6ac74008b6c676ab6834f1c758670c938a0529c3 (diff) |
Reduce TestMatrix calls for xgemmbatched.
Replace the looped test by a single one with the maximal found offset.
Diffstat (limited to 'src/routines/levelx/xgemmbatched.cpp')
-rw-r--r-- | src/routines/levelx/xgemmbatched.cpp | 8 |
1 file changed, 3 insertions, 5 deletions
diff --git a/src/routines/levelx/xgemmbatched.cpp b/src/routines/levelx/xgemmbatched.cpp
index b12b8734..0d7ae5ab 100644
--- a/src/routines/levelx/xgemmbatched.cpp
+++ b/src/routines/levelx/xgemmbatched.cpp
@@ -79,11 +79,9 @@ void XgemmBatched<T>::DoGemmBatched(const Layout layout, const Transpose a_trans
                 gemm_kernel_id);
 
   // Tests the matrices for validity
-  for (auto batch = size_t{0}; batch < batch_count; ++batch) {
-    TestMatrixA(a_one, a_two, a_buffer, a_offsets[batch], a_ld, false); // don't test for invalid LD
-    TestMatrixB(b_one, b_two, b_buffer, b_offsets[batch], b_ld, false); // don't test for invalid LD
-    TestMatrixC(c_one, c_two, c_buffer, c_offsets[batch], c_ld);
-  }
+  TestBatchedMatrixA(a_one, a_two, a_buffer, a_offsets, a_ld, false); // don't test for invalid LD
+  TestBatchedMatrixB(b_one, b_two, b_buffer, b_offsets, b_ld, false); // don't test for invalid LD
+  TestBatchedMatrixC(c_one, c_two, c_buffer, c_offsets, c_ld);
 
   // Upload the scalar arguments to the device
   auto alphas_device = Buffer<T>(context_, BufferAccess::kReadWrite, batch_count);