summary | refs | log | tree | commit | diff
path: root/test/performance/routines
diff options
context:
space:
mode:
author: CNugteren <web@cedricnugteren.nl> 2015-06-23 08:09:46 +0200
committer: CNugteren <web@cedricnugteren.nl> 2015-06-23 08:09:46 +0200
commit: 0a3831e6d1eb437a9ef9ac7570f9a554b2c35edb (patch)
tree: 3ea732cd3efa3cfb23c6e58cb5512a1f7110f748 /test/performance/routines
parent: 20eb3506d63e21725974e16ae392cf0dd4bf4df5 (diff)
Updated bandwidth computation for GEMM and SYMM
Diffstat (limited to 'test/performance/routines')
-rw-r--r-- test/performance/routines/xgemm.cc 2
-rw-r--r-- test/performance/routines/xsymm.cc 2
2 files changed, 2 insertions, 2 deletions
diff --git a/test/performance/routines/xgemm.cc b/test/performance/routines/xgemm.cc
index adff85c8..97e19b44 100644
--- a/test/performance/routines/xgemm.cc
+++ b/test/performance/routines/xgemm.cc
@@ -72,7 +72,7 @@ void PerformanceXgemm(const Arguments<T> &args,
// Prints the performance of both libraries
const auto flops = 2 * args.m * args.n * args.k;
- const auto bytes = (args.m*args.k + args.k*args.n + args.m*args.n) * sizeof(T);
+ const auto bytes = (args.m*args.k + args.k*args.n + 2*args.m*args.n) * sizeof(T);
const auto output_ints = std::vector<size_t>{args.m, args.n, args.k,
static_cast<size_t>(args.layout),
static_cast<size_t>(args.a_transpose),
diff --git a/test/performance/routines/xsymm.cc b/test/performance/routines/xsymm.cc
index 3c9feb05..0b1d75a5 100644
--- a/test/performance/routines/xsymm.cc
+++ b/test/performance/routines/xsymm.cc
@@ -72,7 +72,7 @@ void PerformanceXsymm(const Arguments<T> &args,
// Prints the performance of both libraries
const auto flops = 2 * args.m * args.n * args.m;
- const auto bytes = (args.m*args.m + args.m*args.n + args.m*args.n) * sizeof(T);
+ const auto bytes = (args.m*args.m + args.m*args.n + 2*args.m*args.n) * sizeof(T);
const auto output_ints = std::vector<size_t>{args.m, args.n,
static_cast<size_t>(args.layout),
static_cast<size_t>(args.triangle),