summary | refs | log | tree | commit | diff
path: root/test/performance
diff options
context:
space:
mode:
author: Cedric Nugteren <web@cedricnugteren.nl> 2017-03-05 16:44:16 +0100
committer: Cedric Nugteren <web@cedricnugteren.nl> 2017-03-05 16:44:16 +0100
commit: 6aba0bbae71702c4eebd88d0fe17739b509185c1 (patch)
tree: 1b46ef9ebc4c4b0cf4aa7dc4b20fc640440d25b9 /test/performance
parent: b114ea49a9228ee7a8bf1b00c092324c0ce972c3 (diff)
Minor fixes to the client w.r.t. the addition of the batch count
Diffstat (limited to 'test/performance')
-rw-r--r-- test/performance/client.cpp 10
1 files changed, 5 insertions, 5 deletions
diff --git a/test/performance/client.cpp b/test/performance/client.cpp
index b1d5b718..2b4cdb9b 100644
--- a/test/performance/client.cpp
+++ b/test/performance/client.cpp
@@ -91,12 +91,12 @@ Arguments<U> Client<T,U>::ParseArguments(int argc, char *argv[], const size_t le
if (o == kArgAsumOffset) { args.asum_offset = GetArgument(command_line_args, help, kArgAsumOffset, size_t{0}); }
if (o == kArgImaxOffset) { args.imax_offset = GetArgument(command_line_args, help, kArgImaxOffset, size_t{0}); }
+ // Batch arguments
+ if (o == kArgBatchCount) { args.batch_count = GetArgument(command_line_args, help, kArgBatchCount, size_t{1}); }
+
// Scalar values
if (o == kArgAlpha) { args.alpha = GetArgument(command_line_args, help, kArgAlpha, GetScalar<U>()); }
if (o == kArgBeta) { args.beta = GetArgument(command_line_args, help, kArgBeta, GetScalar<U>()); }
-
- // Batch arguments
- if (o == kArgBatchCount) { args.batch_count = GetArgument(command_line_args, help, kArgBatchCount, size_t{1}); }
}
// These are the options common to all routines
@@ -373,8 +373,8 @@ void Client<T,U>::PrintTableRow(const Arguments<U>& args,
for (const auto& timing : timings) {
// Computes the GFLOPS and GB/s metrics
- auto flops = get_flops_(args);
- auto bytes = get_bytes_(args);
+ auto flops = get_flops_(args) * args.batch_count;
+ auto bytes = get_bytes_(args) * args.batch_count;
auto gflops = (timing.second != 0.0) ? (flops*1e-6)/timing.second : 0;
auto gbs = (timing.second != 0.0) ? (bytes*1e-6)/timing.second : 0;