From b4c8e1d9a5804358d6ae350111c85405c3183807 Mon Sep 17 00:00:00 2001
From: Cedric Nugteren <web@cedricnugteren.nl>
Date: Sun, 31 Dec 2017 16:02:46 +0100
Subject: Made plotting script more flexible: extra argument to set the
 comparison library

---
 scripts/benchmark/benchmark.py     | 44 +++++++++++++++-----
 scripts/benchmark/benchmark_all.py |  7 ++--
 scripts/benchmark/settings.py      | 85 +++++++++++++++++---------------------
 3 files changed, 76 insertions(+), 60 deletions(-)

(limited to 'scripts/benchmark')

diff --git a/scripts/benchmark/benchmark.py b/scripts/benchmark/benchmark.py
index 3239d385..d0a9d80f 100644
--- a/scripts/benchmark/benchmark.py
+++ b/scripts/benchmark/benchmark.py
@@ -27,8 +27,12 @@ EXPERIMENTS = {
     "summary": settings.SUMMARY,
 }
 
+COMPARISONS = ["clBLAS", "CPU-BLAS", "cuBLAS"]
+COMPARISON_ARGS = ["-clblas", "-cblas", "-cublas"]
+COMPARISON_IDS = [2, 3, 4]
 
-def run_benchmark(name, arguments_list, precision, num_runs, platform, device):
+
+def run_benchmark(name, arguments_list, precision, num_runs, platform, device, comparisons):
     binary = "./clblast_client_x" + name
 
     # Loops over sub-benchmarks per benchmark
@@ -36,10 +40,16 @@ def run_benchmark(name, arguments_list, precision, num_runs, platform, device):
     for arguments in arguments_list:
 
         # Sets the arguments
-        constant_arguments = ["-warm_up", "-q", "-no_abbrv", "-cblas 0", "-cublas 0"]
+        constant_arguments = ["-warm_up", "-q", "-no_abbrv"]
         common_arguments = ["-precision %d" % precision, "-runs %d" % num_runs]
         opencl_arguments = ["-platform %d" % platform, "-device %d" % device]
-        all_arguments = opencl_arguments + common_arguments + constant_arguments
+        comparison_arguments = []
+        for name, arg in zip(COMPARISONS, COMPARISON_ARGS):
+            if name in comparisons:
+                comparison_arguments.append(arg + " 1")
+            else:
+                comparison_arguments.append(arg + " 0")
+        all_arguments = opencl_arguments + common_arguments + constant_arguments + comparison_arguments
         for name, value in arguments.items():
             all_arguments.append("-" + name + " " + str(value))
 
@@ -54,9 +64,11 @@ def run_benchmark(name, arguments_list, precision, num_runs, platform, device):
             result_extra = utils.parse_results(benchmark_output)
             for index in range(len(min(result, result_extra))):
                 result[index]["GBs_1_FP32"] = result_extra[index]["GBs_1"]
-                result[index]["GBs_2"] = result_extra[index]["GBs_2"]
                 result[index]["GFLOPS_1_FP32"] = result_extra[index]["GFLOPS_1"]
-                result[index]["GFLOPS_2"] = result_extra[index]["GFLOPS_2"]
+                for id in COMPARISON_IDS:
+                    if "GBs_%d" % id in result_extra[index].keys():
+                        result[index]["GBs_%d" % id] = result_extra[index]["GBs_%d" % id]
+                        result[index]["GFLOPS_%d" % id] = result_extra[index]["GFLOPS_%d" % id]
 
         results.extend(result)
     return results
@@ -65,6 +77,7 @@ def run_benchmark(name, arguments_list, precision, num_runs, platform, device):
 def parse_arguments(argv):
     parser = argparse.ArgumentParser(description="Runs a full benchmark for a specific routine on a specific device")
     parser.add_argument("-b", "--benchmark", required=True, help="The benchmark to perform (choose from %s)" % sorted(EXPERIMENTS.keys()))
+    parser.add_argument("-c", "--comparisons", default=[], nargs='+', help="The library(s) to compare against (choose from %s)" % COMPARISONS)
     parser.add_argument("-p", "--platform", required=True, type=int, help="The ID of the OpenCL platform to test on")
     parser.add_argument("-d", "--device", required=True, type=int, help="The ID of the OpenCL device to test on")
     parser.add_argument("-n", "--num_runs", type=int, default=None, help="Overrides the default number of benchmark repeats for averaging")
@@ -78,7 +91,7 @@ def parse_arguments(argv):
     return vars(cl_args)
 
 
-def benchmark_single(benchmark, platform, device, num_runs, precision, load_from_disk,
+def benchmark_single(benchmark, comparisons, platform, device, num_runs, precision, load_from_disk,
                      plot_title, tight_plot, output_folder, verbose):
 
     # Sanity check
@@ -91,6 +104,14 @@ def benchmark_single(benchmark, platform, device, num_runs, precision, load_from
     if benchmark.upper() != "SUMMARY":
         plot_title = benchmark_name if plot_title is "" else benchmark_name + ": " + plot_title
 
+    # Retrieves the comparison settings
+    library_ids = [1]
+    for comparison in comparisons:
+        if comparison not in COMPARISONS:
+            print("[benchmark] Invalid comparison library '%s', choose from %s" % (comparison, COMPARISONS))
+            return
+        library_ids.append(COMPARISON_IDS[COMPARISONS.index(comparison)])
+
     # Retrieves the benchmark settings
     if benchmark not in EXPERIMENTS.keys():
         print("[benchmark] Invalid benchmark '%s', choose from %s" % (benchmark, EXPERIMENTS.keys()))
@@ -109,13 +130,13 @@ def benchmark_single(benchmark, platform, device, num_runs, precision, load_from
         # Runs all the individual benchmarks
         print("[benchmark] Running on platform %d, device %d" % (platform, device))
         print("[benchmark] Running %d benchmarks for settings '%s'" % (len(benchmarks), benchmark))
-        results = {"label_names": experiment["label_names"], "num_rows": experiment["num_rows"],
+        results = {"label_names": ["CLBlast"] + comparisons, "num_rows": experiment["num_rows"],
                    "num_cols": experiment["num_cols"], "benchmarks": []}
         for bench in benchmarks:
             num_runs_benchmark = bench["num_runs"] if num_runs is None else num_runs
             print("[benchmark] Running benchmark '%s:%s'" % (bench["name"], bench["title"]))
             result = run_benchmark(bench["name"], bench["arguments"], precision, num_runs_benchmark,
-                                   platform, device)
+                                   platform, device, comparisons)
             results["benchmarks"].append(result)
 
         # Stores the results to disk
@@ -128,14 +149,17 @@ def benchmark_single(benchmark, platform, device, num_runs, precision, load_from
     pdf_file_name = os.path.join(output_folder, benchmark_name.lower() + "_plot" + file_name_suffix + ".pdf")
     titles = [utils.precision_to_letter(precision) + b["name"].upper() + " " + b["title"] for b in benchmarks]
     x_keys = [b["x_keys"] for b in benchmarks]
-    y_keys = [b["y_keys"] for b in benchmarks]
+    y_keys = [["%s_%d" % (b["y_key"], i) for i in library_ids] for b in benchmarks]
     x_labels = [b["x_label"] for b in benchmarks]
     y_labels = [b["y_label"] for b in benchmarks]
     label_names = results["label_names"]
 
     # For half-precision: also adds single-precision results for comparison
     if precision == 16:
-        label_names = ["CLBlast FP16", "clBLAS FP32", "CLBlast FP32"]
+        label_names[0] += " FP16"
+        for index in range(1, len(label_names)):
+            label_names[index] += " FP32"
+        label_names.append("CLBlast FP32")
         y_keys = [y_key + [y_key[0] + "_FP32"] for y_key in y_keys]
 
     # Plots the graphs
diff --git a/scripts/benchmark/benchmark_all.py b/scripts/benchmark/benchmark_all.py
index 9bf09190..2a7f6c9a 100644
--- a/scripts/benchmark/benchmark_all.py
+++ b/scripts/benchmark/benchmark_all.py
@@ -10,7 +10,7 @@ import argparse
 import os
 import sys
 
-from benchmark import benchmark_single
+from benchmark import benchmark_single, COMPARISONS
 
 
 BENCHMARKS = ["axpy", "gemv", "gemm", "summary", "axpybatched", "gemmbatched"]
@@ -18,6 +18,7 @@ BENCHMARKS = ["axpy", "gemv", "gemm", "summary", "axpybatched", "gemmbatched"]
 
 def parse_arguments(argv):
     parser = argparse.ArgumentParser(description="Runs all (main) benchmarks in one go for a given device")
+    parser.add_argument("-c", "--comparisons", default=[], nargs='+', help="The library(s) to compare against (choose from %s)" % COMPARISONS)
     parser.add_argument("-p", "--platform", required=True, type=int, help="The ID of the OpenCL platform to test on")
     parser.add_argument("-d", "--device", required=True, type=int, help="The ID of the OpenCL device to test on")
     parser.add_argument("-x", "--precision", type=int, default=32, help="The precision to test for (choose from 16, 32, 64, 3232, 6464")
@@ -29,12 +30,12 @@ def parse_arguments(argv):
     return vars(cl_args)
 
 
-def benchmark_all(platform, device, precision, load_from_disk,
+def benchmark_all(comparisons, platform, device, precision, load_from_disk,
                   plot_title, output_folder, verbose):
     for bench in BENCHMARKS:
         from_disk = load_from_disk
         for tight_plot in [True, False]:  # two plots for a single benchmark
-            benchmark_single(bench, platform, device, None, precision, from_disk,
+            benchmark_single(bench, comparisons, platform, device, None, precision, from_disk,
                              plot_title, tight_plot, output_folder, verbose)
             from_disk = True  # for the next plot of the same data
 
diff --git a/scripts/benchmark/settings.py b/scripts/benchmark/settings.py
index dae1854f..d0d17178 100644
--- a/scripts/benchmark/settings.py
+++ b/scripts/benchmark/settings.py
@@ -10,42 +10,41 @@ import utils
 
 
 AXPY = {
-    "label_names": ["CLBlast", "clBLAS"],
     "num_rows": 2, "num_cols": 3,
     "benchmarks": [
         {
             "name": "axpy", "num_runs": 40,
             "title": "multiples of 256K",
             "x_label": "sizes (n)", "x_keys": ["n"],
-            "y_label": "GB/s (higher is better)", "y_keys": ["GBs_1", "GBs_2"],
+            "y_label": "GB/s (higher is better)", "y_key": "GBs",
             "arguments": [{"n": utils.k(256), "incx": 1, "incy": 1, "step": utils.k(256), "num_steps": 16}],
         },
         {
             "name": "axpy", "num_runs": 40,
             "title": "multiples of 256K+1",
             "x_label": "sizes (n)", "x_keys": ["n"],
-            "y_label": "GB/s (higher is better)", "y_keys": ["GBs_1", "GBs_2"],
+            "y_label": "GB/s (higher is better)", "y_key": "GBs",
             "arguments": [{"n": utils.k(256) + 1, "incx": 1, "incy": 1, "step": utils.k(256) + 1, "num_steps": 16}],
         },
         {
             "name": "axpy", "num_runs": 40,
             "title": "around 1M",
             "x_label": "sizes (n)", "x_keys": ["n"],
-            "y_label": "GB/s (higher is better)", "y_keys": ["GBs_1", "GBs_2"],
+            "y_label": "GB/s (higher is better)", "y_key": "GBs",
             "arguments": [{"n": utils.m(1), "incx": 1, "incy": 1, "step": 1, "num_steps": 16}],
         },
         {
             "name": "axpy", "num_runs": 20,
             "title": "around 16M",
             "x_label": "sizes (n)", "x_keys": ["n"],
-            "y_label": "GB/s (higher is better)", "y_keys": ["GBs_1", "GBs_2"],
+            "y_label": "GB/s (higher is better)", "y_key": "GBs",
             "arguments": [{"n": utils.m(16), "incx": 1, "incy": 1, "step": 1, "num_steps": 16}],
         },
         {
             "name": "axpy", "num_runs": 20,
             "title": "strides n=8M",
             "x_label": "increments for x,y", "x_keys": ["incx", "incy"],
-            "y_label": "GB/s (higher is better)", "y_keys": ["GBs_1", "GBs_2"],
+            "y_label": "GB/s (higher is better)", "y_key": "GBs",
             "arguments": [{"n": utils.m(8), "incx": inc_x, "incy": inc_y, "step": 0, "num_steps": 1}
                           for inc_x in [1, 2, 4] for inc_y in [1, 2, 4]],
         },
@@ -53,7 +52,7 @@ AXPY = {
             "name": "axpy", "num_runs": 40,
             "title": "powers of 2",
             "x_label": "sizes (n)", "x_keys": ["n"],
-            "y_label": "GB/s (higher is better)", "y_keys": ["GBs_1", "GBs_2"],
+            "y_label": "GB/s (higher is better)", "y_key": "GBs",
             "arguments": [{"n": n, "incx": 1, "incy": 1, "step": 0, "num_steps": 1}
                           for n in utils.powers_of_2(utils.k(32), utils.m(64))],
         }
@@ -61,14 +60,13 @@ AXPY = {
 }
 
 AXPYBATCHED = {
-    "label_names": ["CLBlast", "clBLAS (non batched)"],
     "num_rows": 1, "num_cols": 3,
     "benchmarks": [
         {
             "name": "axpybatched", "num_runs": 30,
             "title": "8 AXPYs",
             "x_label": "sizes (n)", "x_keys": ["n"],
-            "y_label": "GB/s (higher is better)", "y_keys": ["GBs_1", "GBs_2"],
+            "y_label": "GB/s (higher is better)", "y_key": "GBs",
             "arguments": [{"batch_num": 8, "n": n, "incx": 1, "incy": 1, "step": 0, "num_steps": 1}
                           for n in utils.powers_of_2(utils.k(8), utils.m(4))],
         },
@@ -76,7 +74,7 @@ AXPYBATCHED = {
             "name": "axpybatched", "num_runs": 20,
             "title": "64 AXPYs",
             "x_label": "sizes (n)", "x_keys": ["n"],
-            "y_label": "GB/s (higher is better)", "y_keys": ["GBs_1", "GBs_2"],
+            "y_label": "GB/s (higher is better)", "y_key": "GBs",
             "arguments": [{"batch_num": 64, "n": n, "incx": 1, "incy": 1, "step": 0, "num_steps": 1}
                           for n in utils.powers_of_2(utils.k(8), utils.m(4))],
         },
@@ -84,7 +82,7 @@ AXPYBATCHED = {
             "name": "axpybatched", "num_runs": 40,
             "title": "n=512K",
             "x_label": "batch size", "x_keys": ["batch_num"],
-            "y_label": "GB/s (higher is better)", "y_keys": ["GBs_1", "GBs_2"],
+            "y_label": "GB/s (higher is better)", "y_key": "GBs",
             "arguments": [{"batch_num": b, "n": utils.k(512), "incx": 1, "incy": 1, "step": 1, "num_steps": 1}
                           for b in utils.powers_of_2(1, 512)],
         }
@@ -92,49 +90,48 @@ AXPYBATCHED = {
 }
 
 GEMV = {
-    "label_names": ["CLBlast", "clBLAS"],
     "num_rows": 2, "num_cols": 3,
     "benchmarks": [
         {
             "name": "gemv", "num_runs": 40,
             "title": "multiples of 256",
             "x_label": "sizes (n=m)", "x_keys": ["n"],
-            "y_label": "GB/s (higher is better)", "y_keys": ["GBs_1", "GBs_2"],
+            "y_label": "GB/s (higher is better)", "y_key": "GBs",
             "arguments": [{"n": 256, "m": 256, "incx": 1, "incy": 1, "layout": 102, "step": 256, "num_steps": 20}],
         },
         {
             "name": "gemv", "num_runs": 40,
             "title": "multiples of 257",
             "x_label": "sizes (n=m)", "x_keys": ["n"],
-            "y_label": "GB/s (higher is better)", "y_keys": ["GBs_1", "GBs_2"],
+            "y_label": "GB/s (higher is better)", "y_key": "GBs",
             "arguments": [{"n": 257, "m": 257, "incx": 1, "incy": 1, "layout": 102, "step": 257, "num_steps": 20}],
         },
         {
             "name": "gemv", "num_runs": 20,
             "title": "around 4K",
             "x_label": "sizes (n=m)", "x_keys": ["n"],
-            "y_label": "GB/s (higher is better)", "y_keys": ["GBs_1", "GBs_2"],
+            "y_label": "GB/s (higher is better)", "y_key": "GBs",
             "arguments": [{"n": 4096, "m": 4096, "incx": 1, "incy": 1, "layout": 102, "step": 1, "num_steps": 16}],
         },
         {
             "name": "gemv", "num_runs": 40,
             "title": "multiples of 256 rotated",
             "x_label": "sizes (n=m)", "x_keys": ["n"],
-            "y_label": "GB/s (higher is better)", "y_keys": ["GBs_1", "GBs_2"],
+            "y_label": "GB/s (higher is better)", "y_key": "GBs",
             "arguments": [{"n": 256, "m": 256, "incx": 1, "incy": 1, "layout": 101, "step": 256, "num_steps": 20}],
         },
         {
             "name": "gemv", "num_runs": 40,
             "title": "multiples of 257 rotated",
             "x_label": "sizes (n=m)", "x_keys": ["n"],
-            "y_label": "GB/s (higher is better)", "y_keys": ["GBs_1", "GBs_2"],
+            "y_label": "GB/s (higher is better)", "y_key": "GBs",
             "arguments": [{"n": 257, "m": 257, "incx": 1, "incy": 1, "layout": 101, "step": 257, "num_steps": 20}],
         },
         {
             "name": "gemv", "num_runs": 20,
             "title": "strides n=m=4K",
             "x_label": "increments/strides for x,y", "x_keys": ["incx", "incy"],
-            "y_label": "GB/s (higher is better)", "y_keys": ["GBs_1", "GBs_2"],
+            "y_label": "GB/s (higher is better)", "y_key": "GBs",
             "arguments": [{"n": 4096, "m": 4096, "incx": inc_x, "incy": inc_y, "layout": 102, "step": 0, "num_steps": 1}
                           for inc_x in [1, 2, 4] for inc_y in [1, 2, 4]],
         }
@@ -142,14 +139,13 @@ GEMV = {
 }
 
 GEMM = {
-    "label_names": ["CLBlast", "clBLAS"],
     "num_rows": 2, "num_cols": 3,
     "benchmarks": [
         {
             "name": "gemm", "num_runs": 20,
             "title": "multiples of 128",
             "x_label": "sizes (m=n=k)", "x_keys": ["m"],
-            "y_label": "GFLOPS (higher is better)", "y_keys": ["GFLOPS_1", "GFLOPS_2"],
+            "y_label": "GFLOPS (higher is better)", "y_key": "GFLOPS",
             "arguments": [{"m": 128, "n": 128, "k": 128, "layout": 102,
                            "transA": 111, "transB": 111, "step": 128, "num_steps": 20}],
         },
@@ -157,7 +153,7 @@ GEMM = {
             "name": "gemm", "num_runs": 20,
             "title": "multiples of 129",
             "x_label": "sizes (m=n=k)", "x_keys": ["m"],
-            "y_label": "GFLOPS (higher is better)", "y_keys": ["GFLOPS_1", "GFLOPS_2"],
+            "y_label": "GFLOPS (higher is better)", "y_key": "GFLOPS",
             "arguments": [{"m": 129, "n": 129, "k": 129, "layout": 102,
                            "transA": 111, "transB": 111, "step": 129, "num_steps": 20}],
         },
@@ -165,7 +161,7 @@ GEMM = {
             "name": "gemm", "num_runs": 20,
             "title": "around 512",
             "x_label": "sizes (m=n=k)", "x_keys": ["m"],
-            "y_label": "GFLOPS (higher is better)", "y_keys": ["GFLOPS_1", "GFLOPS_2"],
+            "y_label": "GFLOPS (higher is better)", "y_key": "GFLOPS",
             "arguments": [{"m": 512, "n": 512, "k": 512, "layout": 102,
                            "transA": 111, "transB": 111, "step": 1, "num_steps": 16}],
         },
@@ -173,7 +169,7 @@ GEMM = {
             "name": "gemm", "num_runs": 10,
             "title": "around 2048",
             "x_label": "sizes (m=n=k)", "x_keys": ["m"],
-            "y_label": "GFLOPS (higher is better)", "y_keys": ["GFLOPS_1", "GFLOPS_2"],
+            "y_label": "GFLOPS (higher is better)", "y_key": "GFLOPS",
             "arguments": [{"m": 2048, "n": 2048, "k": 2048, "layout": 102,
                            "transA": 111, "transB": 111, "step": 1, "num_steps": 16}],
         },
@@ -181,7 +177,7 @@ GEMM = {
             "name": "gemm", "num_runs": 10,
             "title": "layouts/transpose",
             "x_label": "layout, transA, transB", "x_keys": ["layout", "transA", "transB"],
-            "y_label": "GFLOPS (higher is better)", "y_keys": ["GFLOPS_1", "GFLOPS_2"],
+            "y_label": "GFLOPS (higher is better)", "y_key": "GFLOPS",
             "arguments": [{"m": 1024, "n": 1024, "k": 1024, "layout": layout,
                            "transA": transA, "transB": transB, "step": 0, "num_steps": 1}
                           for layout in [101, 102] for transA in [111, 112] for transB in [111, 112]],
@@ -190,7 +186,7 @@ GEMM = {
             "name": "gemm", "num_runs": 10,
             "title": "powers of 2",
             "x_label": "sizes (m=n=k)", "x_keys": ["m"],
-            "y_label": "GFLOPS (higher is better)", "y_keys": ["GFLOPS_1", "GFLOPS_2"],
+            "y_label": "GFLOPS (higher is better)", "y_key": "GFLOPS",
             "arguments": [{"m": n, "n": n, "k": n, "layout": 102,
                            "transA": 111, "transB": 111, "step": 0, "num_steps": 1}
                           for n in utils.powers_of_2(8, utils.k(4))],
@@ -199,14 +195,13 @@ GEMM = {
 }
 
 GEMM_SMALL = {
-    "label_names": ["CLBlast", "clBLAS"],
     "num_rows": 2, "num_cols": 1,
     "benchmarks": [
         {
             "name": "gemm", "num_runs": 10,
             "title": "small matrices in steps of 16",
             "x_label": "sizes (m=n=k)", "x_keys": ["m"],
-            "y_label": "GFLOPS (higher is better)", "y_keys": ["GFLOPS_1", "GFLOPS_2"],
+            "y_label": "GFLOPS (higher is better)", "y_key": "GFLOPS",
             "arguments": [{"m": 128, "n": 128, "k": 128, "layout": 102,
                            "transA": 111, "transB": 111, "step": 16, "num_steps": 57}],
         },
@@ -214,7 +209,7 @@ GEMM_SMALL = {
             "name": "gemm", "num_runs": 10,
             "title": "small matrices in steps of 1",
             "x_label": "sizes (m=n=k)", "x_keys": ["m"],
-            "y_label": "GFLOPS (higher is better)", "y_keys": ["GFLOPS_1", "GFLOPS_2"],
+            "y_label": "GFLOPS (higher is better)", "y_key": "GFLOPS",
             "arguments": [{"m": 128, "n": 128, "k": 128, "layout": 102,
                            "transA": 111, "transB": 111, "step": 1, "num_steps": 385}],
         },
@@ -223,14 +218,13 @@ GEMM_SMALL = {
 }
 
 GEMMBATCHED = {
-    "label_names": ["CLBlast", "clBLAS (non batched)"],
     "num_rows": 1, "num_cols": 3,
     "benchmarks": [
         {
             "name": "gemmbatched", "num_runs": 40,
             "title": "8 GEMMs",
             "x_label": "sizes (m=n=k)", "x_keys": ["m"],
-            "y_label": "GFLOPS (higher is better)", "y_keys": ["GFLOPS_1", "GFLOPS_2"],
+            "y_label": "GFLOPS (higher is better)", "y_key": "GFLOPS",
             "arguments": [{"batch_num": 8, "m": 32, "n": 32, "k": 32, "layout": 102,
                            "transA": 111, "transB": 111, "step": 32, "num_steps": 20}],
         },
@@ -238,7 +232,7 @@ GEMMBATCHED = {
             "name": "gemmbatched", "num_runs": 20,
             "title": "64 GEMMs",
             "x_label": "sizes (m=n=k)", "x_keys": ["m"],
-            "y_label": "GFLOPS (higher is better)", "y_keys": ["GFLOPS_1", "GFLOPS_2"],
+            "y_label": "GFLOPS (higher is better)", "y_key": "GFLOPS",
             "arguments": [{"batch_num": 64, "m": 32, "n": 32, "k": 32, "layout": 102,
                            "transA": 111, "transB": 111, "step": 32, "num_steps": 20}],
         },
@@ -246,7 +240,7 @@ GEMMBATCHED = {
             "name": "gemmbatched", "num_runs": 30,
             "title": "m=n=k=128",
             "x_label": "batch size", "x_keys": ["batch_num"],
-            "y_label": "GFLOPS (higher is better)", "y_keys": ["GFLOPS_1", "GFLOPS_2"],
+            "y_label": "GFLOPS (higher is better)", "y_key": "GFLOPS",
             "arguments": [{"batch_num": b, "m": 128, "n": 128, "k": 128, "layout": 102,
                            "transA": 111, "transB": 111} for b in utils.powers_of_2(1, utils.k(16))],
         }
@@ -254,14 +248,13 @@ GEMMBATCHED = {
 }
 
 SYMM = {
-    "label_names": ["CLBlast", "clBLAS"],
     "num_rows": 2, "num_cols": 3,
     "benchmarks": [
         {
             "name": "symm", "num_runs": 10,
             "title": "multiples of 128",
             "x_label": "sizes (m=n)", "x_keys": ["m"],
-            "y_label": "GFLOPS (higher is better)", "y_keys": ["GFLOPS_1", "GFLOPS_2"],
+            "y_label": "GFLOPS (higher is better)", "y_key": "GFLOPS",
             "arguments": [{"m": 128, "n": 128, "layout": 102,
                            "side": 141, "triangle": 121, "step": 128, "num_steps": 20}],
         },
@@ -269,7 +262,7 @@ SYMM = {
             "name": "symm", "num_runs": 10,
             "title": "multiples of 129",
             "x_label": "sizes (m=n)", "x_keys": ["m"],
-            "y_label": "GFLOPS (higher is better)", "y_keys": ["GFLOPS_1", "GFLOPS_2"],
+            "y_label": "GFLOPS (higher is better)", "y_key": "GFLOPS",
             "arguments": [{"m": 129, "n": 129, "layout": 102,
                            "side": 141, "triangle": 121, "step": 129, "num_steps": 20}],
         },
@@ -277,7 +270,7 @@ SYMM = {
             "name": "symm", "num_runs": 10,
             "title": "around 512",
             "x_label": "sizes (m=n)", "x_keys": ["m"],
-            "y_label": "GFLOPS (higher is better)", "y_keys": ["GFLOPS_1", "GFLOPS_2"],
+            "y_label": "GFLOPS (higher is better)", "y_key": "GFLOPS",
             "arguments": [{"m": 512, "n": 512, "layout": 102,
                            "side": 141, "triangle": 121, "step": 1, "num_steps": 16}],
         },
@@ -285,7 +278,7 @@ SYMM = {
             "name": "symm", "num_runs": 10,
             "title": "around 2048",
             "x_label": "sizes (m=n)", "x_keys": ["m"],
-            "y_label": "GFLOPS (higher is better)", "y_keys": ["GFLOPS_1", "GFLOPS_2"],
+            "y_label": "GFLOPS (higher is better)", "y_key": "GFLOPS",
             "arguments": [{"m": 2048, "n": 2048, "layout": 102,
                            "side": 141, "triangle": 121, "step": 1, "num_steps": 16}],
         },
@@ -293,7 +286,7 @@ SYMM = {
             "name": "symm", "num_runs": 10,
             "title": "layouts/sides/triangles",
             "x_label": "layout, side, triangle", "x_keys": ["layout", "side", "triangle"],
-            "y_label": "GFLOPS (higher is better)", "y_keys": ["GFLOPS_1", "GFLOPS_2"],
+            "y_label": "GFLOPS (higher is better)", "y_key": "GFLOPS",
             "arguments": [{"m": 1024, "n": 1024, "layout": layout,
                            "side": side, "triangle": triangle, "step": 0, "num_steps": 1}
                           for layout in [101, 102] for side in [141, 142] for triangle in [121, 122]],
@@ -302,7 +295,7 @@ SYMM = {
             "name": "symm", "num_runs": 10,
             "title": "powers of 2",
             "x_label": "sizes (m=n)", "x_keys": ["m"],
-            "y_label": "GFLOPS (higher is better)", "y_keys": ["GFLOPS_1", "GFLOPS_2"],
+            "y_label": "GFLOPS (higher is better)", "y_key": "GFLOPS",
             "arguments": [{"m": n, "n": n, "layout": 102,
                            "side": 141, "triangle": 121, "step": 0, "num_steps": 1}
                           for n in utils.powers_of_2(8, utils.k(4))],
@@ -311,14 +304,13 @@ SYMM = {
 }
 
 SYRK = {
-    "label_names": ["CLBlast", "clBLAS"],
     "num_rows": 2, "num_cols": 3,
     "benchmarks": [
         {
             "name": "syrk", "num_runs": 10,
             "title": "multiples of 128",
             "x_label": "sizes (n=k)", "x_keys": ["n"],
-            "y_label": "GFLOPS (higher is better)", "y_keys": ["GFLOPS_1", "GFLOPS_2"],
+            "y_label": "GFLOPS (higher is better)", "y_key": "GFLOPS",
             "arguments": [{"n": 128, "k": 128, "layout": 102,
                            "side": 141, "triangle": 121, "step": 128, "num_steps": 20}],
         },
@@ -326,7 +318,7 @@ SYRK = {
             "name": "syrk", "num_runs": 10,
             "title": "multiples of 129",
             "x_label": "sizes (n=k)", "x_keys": ["n"],
-            "y_label": "GFLOPS (higher is better)", "y_keys": ["GFLOPS_1", "GFLOPS_2"],
+            "y_label": "GFLOPS (higher is better)", "y_key": "GFLOPS",
             "arguments": [{"n": 129, "k": 129, "layout": 102,
                            "side": 141, "triangle": 121, "step": 129, "num_steps": 20}],
         },
@@ -334,7 +326,7 @@ SYRK = {
             "name": "syrk", "num_runs": 10,
             "title": "around 512",
             "x_label": "sizes (n=k)", "x_keys": ["n"],
-            "y_label": "GFLOPS (higher is better)", "y_keys": ["GFLOPS_1", "GFLOPS_2"],
+            "y_label": "GFLOPS (higher is better)", "y_key": "GFLOPS",
             "arguments": [{"n": 512, "k": 512, "layout": 102,
                            "side": 141, "triangle": 121, "step": 1, "num_steps": 16}],
         },
@@ -342,7 +334,7 @@ SYRK = {
             "name": "syrk", "num_runs": 10,
             "title": "around 2048",
             "x_label": "sizes (n=k)", "x_keys": ["n"],
-            "y_label": "GFLOPS (higher is better)", "y_keys": ["GFLOPS_1", "GFLOPS_2"],
+            "y_label": "GFLOPS (higher is better)", "y_key": "GFLOPS",
             "arguments": [{"n": 2048, "k": 2048, "layout": 102,
                            "side": 141, "triangle": 121, "step": 1, "num_steps": 16}],
         },
@@ -350,7 +342,7 @@ SYRK = {
             "name": "syrk", "num_runs": 10,
             "title": "layouts/sides/triangles",
             "x_label": "layout, triangle, transA", "x_keys": ["layout", "triangle", "transA"],
-            "y_label": "GFLOPS (higher is better)", "y_keys": ["GFLOPS_1", "GFLOPS_2"],
+            "y_label": "GFLOPS (higher is better)", "y_key": "GFLOPS",
             "arguments": [{"n": 1024, "k": 1024, "layout": layout,
                            "triangle": triangle, "transA": transA, "step": 0, "num_steps": 1}
                           for layout in [101, 102] for triangle in [121, 122] for transA in [111, 112]],
@@ -359,7 +351,7 @@ SYRK = {
             "name": "syrk", "num_runs": 10,
             "title": "powers of 2",
             "x_label": "sizes (n=k)", "x_keys": ["n"],
-            "y_label": "GFLOPS (higher is better)", "y_keys": ["GFLOPS_1", "GFLOPS_2"],
+            "y_label": "GFLOPS (higher is better)", "y_key": "GFLOPS",
             "arguments": [{"n": n, "k": n, "layout": 102,
                            "side": 141, "triangle": 121, "step": 0, "num_steps": 1}
                           for n in utils.powers_of_2(8, utils.k(4))],
@@ -368,7 +360,6 @@ SYRK = {
 }
 
 SUMMARY = {
-    "label_names": ["CLBlast", "clBLAS"],
     "num_rows": 3, "num_cols": 2,
     "benchmarks": [
         AXPY["benchmarks"][0],
-- 
cgit v1.2.3