summary | refs | log | tree | commit | diff
path: root/test/routines/level3/xtrmm.hpp
diff options
context:
space:
mode:
author Cedric Nugteren <web@cedricnugteren.nl> 2021-03-15 20:15:02 +0100
committer GitHub <noreply@github.com> 2021-03-15 20:15:02 +0100
commit ef5176dd968dbf9da7c94506fc0d5f8bd463b293 (patch)
tree c2ec91cfcc73fe29de643afc07a68ede3bd39c36 /test/routines/level3/xtrmm.hpp
parent ce44c3adb57fc8d464a41d3db8103dc3fe0e86c4 (diff)
parent aec45ea63755a7a9414d7c6a81d570200e948806 (diff)
Merge pull request #416 from JishinMaster/master
set the correct flop count for xgemm
Diffstat (limited to 'test/routines/level3/xtrmm.hpp')
-rw-r--r-- test/routines/level3/xtrmm.hpp 8
1 files changed, 7 insertions, 1 deletions
diff --git a/test/routines/level3/xtrmm.hpp b/test/routines/level3/xtrmm.hpp
index 51377a16..f39db5cd 100644
--- a/test/routines/level3/xtrmm.hpp
+++ b/test/routines/level3/xtrmm.hpp
@@ -162,7 +162,13 @@ class TestXtrmm {
// Describes how to compute performance metrics
static size_t GetFlops(const Arguments<T> &args) {
auto k = (args.side == Side::kLeft) ? args.m : args.n;
- return args.m * args.n * k;
+ if((args.precision == Precision::kComplexSingle) || (args.precision == Precision::kComplexDouble)) {
+ // complex flops
+ return 4 * args.m * args.n * k;
+ } else {
+ // scalar flops
+ return args.m * args.n * k;
+ }
}
static size_t GetBytes(const Arguments<T> &args) {
auto k = (args.side == Side::kLeft) ? args.m : args.n;