summary | refs | log | tree | commit | diff
path: root/test/routines/levelx
diff options
context:
space:
mode:
author: Cedric Nugteren <web@cedricnugteren.nl> 2018-05-09 19:59:31 +0200
committer: Cedric Nugteren <web@cedricnugteren.nl> 2018-05-09 19:59:31 +0200
commit: b60828036122c5fe6e0305963ddc1ada6a2effff (patch)
tree: 58d6b6e6572cc7fe9442d9949a0ac61ba3d8a0bc /test/routines/levelx
parent: a4119531eedd5220c9f02c8e1a8a5c3376367049 (diff)
Fixed the performance client for convgemm and added GFLOPS measurements
Diffstat (limited to 'test/routines/levelx')
-rw-r--r-- test/routines/levelx/xconvgemm.hpp 4
1 file changed, 3 insertions, 1 deletion
diff --git a/test/routines/levelx/xconvgemm.hpp b/test/routines/levelx/xconvgemm.hpp
index 6ca5965b..7233f7b6 100644
--- a/test/routines/levelx/xconvgemm.hpp
+++ b/test/routines/levelx/xconvgemm.hpp
@@ -151,7 +151,9 @@ public:
// Describes how to compute performance metrics
static size_t GetFlops(const Arguments<T> &args) {
- return args.batch_count; // TODO
+ const auto patch_size = args.kernel_h * args.kernel_w * args.channels;
+ const auto num_patches = OutputHeight(args) * OutputWidth(args);
+ return args.batch_count * 2 * num_patches * args.num_kernels * patch_size;
}
static size_t GetBytes(const Arguments<T> &args) {
return (GetSizeA(args) + GetSizeB(args) + GetSizeC(args)) * sizeof(T);