summaryrefslogtreecommitdiff
path: root/scripts/benchmark/settings.py
diff options
context:
space:
mode:
Diffstat (limited to 'scripts/benchmark/settings.py')
-rw-r--r--scripts/benchmark/settings.py85
1 files changed, 38 insertions, 47 deletions
diff --git a/scripts/benchmark/settings.py b/scripts/benchmark/settings.py
index dae1854f..d0d17178 100644
--- a/scripts/benchmark/settings.py
+++ b/scripts/benchmark/settings.py
@@ -10,42 +10,41 @@ import utils
AXPY = {
- "label_names": ["CLBlast", "clBLAS"],
"num_rows": 2, "num_cols": 3,
"benchmarks": [
{
"name": "axpy", "num_runs": 40,
"title": "multiples of 256K",
"x_label": "sizes (n)", "x_keys": ["n"],
- "y_label": "GB/s (higher is better)", "y_keys": ["GBs_1", "GBs_2"],
+ "y_label": "GB/s (higher is better)", "y_key": "GBs",
"arguments": [{"n": utils.k(256), "incx": 1, "incy": 1, "step": utils.k(256), "num_steps": 16}],
},
{
"name": "axpy", "num_runs": 40,
"title": "multiples of 256K+1",
"x_label": "sizes (n)", "x_keys": ["n"],
- "y_label": "GB/s (higher is better)", "y_keys": ["GBs_1", "GBs_2"],
+ "y_label": "GB/s (higher is better)", "y_key": "GBs",
"arguments": [{"n": utils.k(256) + 1, "incx": 1, "incy": 1, "step": utils.k(256) + 1, "num_steps": 16}],
},
{
"name": "axpy", "num_runs": 40,
"title": "around 1M",
"x_label": "sizes (n)", "x_keys": ["n"],
- "y_label": "GB/s (higher is better)", "y_keys": ["GBs_1", "GBs_2"],
+ "y_label": "GB/s (higher is better)", "y_key": "GBs",
"arguments": [{"n": utils.m(1), "incx": 1, "incy": 1, "step": 1, "num_steps": 16}],
},
{
"name": "axpy", "num_runs": 20,
"title": "around 16M",
"x_label": "sizes (n)", "x_keys": ["n"],
- "y_label": "GB/s (higher is better)", "y_keys": ["GBs_1", "GBs_2"],
+ "y_label": "GB/s (higher is better)", "y_key": "GBs",
"arguments": [{"n": utils.m(16), "incx": 1, "incy": 1, "step": 1, "num_steps": 16}],
},
{
"name": "axpy", "num_runs": 20,
"title": "strides n=8M",
"x_label": "increments for x,y", "x_keys": ["incx", "incy"],
- "y_label": "GB/s (higher is better)", "y_keys": ["GBs_1", "GBs_2"],
+ "y_label": "GB/s (higher is better)", "y_key": "GBs",
"arguments": [{"n": utils.m(8), "incx": inc_x, "incy": inc_y, "step": 0, "num_steps": 1}
for inc_x in [1, 2, 4] for inc_y in [1, 2, 4]],
},
@@ -53,7 +52,7 @@ AXPY = {
"name": "axpy", "num_runs": 40,
"title": "powers of 2",
"x_label": "sizes (n)", "x_keys": ["n"],
- "y_label": "GB/s (higher is better)", "y_keys": ["GBs_1", "GBs_2"],
+ "y_label": "GB/s (higher is better)", "y_key": "GBs",
"arguments": [{"n": n, "incx": 1, "incy": 1, "step": 0, "num_steps": 1}
for n in utils.powers_of_2(utils.k(32), utils.m(64))],
}
@@ -61,14 +60,13 @@ AXPY = {
}
AXPYBATCHED = {
- "label_names": ["CLBlast", "clBLAS (non batched)"],
"num_rows": 1, "num_cols": 3,
"benchmarks": [
{
"name": "axpybatched", "num_runs": 30,
"title": "8 AXPYs",
"x_label": "sizes (n)", "x_keys": ["n"],
- "y_label": "GB/s (higher is better)", "y_keys": ["GBs_1", "GBs_2"],
+ "y_label": "GB/s (higher is better)", "y_key": "GBs",
"arguments": [{"batch_num": 8, "n": n, "incx": 1, "incy": 1, "step": 0, "num_steps": 1}
for n in utils.powers_of_2(utils.k(8), utils.m(4))],
},
@@ -76,7 +74,7 @@ AXPYBATCHED = {
"name": "axpybatched", "num_runs": 20,
"title": "64 AXPYs",
"x_label": "sizes (n)", "x_keys": ["n"],
- "y_label": "GB/s (higher is better)", "y_keys": ["GBs_1", "GBs_2"],
+ "y_label": "GB/s (higher is better)", "y_key": "GBs",
"arguments": [{"batch_num": 64, "n": n, "incx": 1, "incy": 1, "step": 0, "num_steps": 1}
for n in utils.powers_of_2(utils.k(8), utils.m(4))],
},
@@ -84,7 +82,7 @@ AXPYBATCHED = {
"name": "axpybatched", "num_runs": 40,
"title": "n=512K",
"x_label": "batch size", "x_keys": ["batch_num"],
- "y_label": "GB/s (higher is better)", "y_keys": ["GBs_1", "GBs_2"],
+ "y_label": "GB/s (higher is better)", "y_key": "GBs",
"arguments": [{"batch_num": b, "n": utils.k(512), "incx": 1, "incy": 1, "step": 1, "num_steps": 1}
for b in utils.powers_of_2(1, 512)],
}
@@ -92,49 +90,48 @@ AXPYBATCHED = {
}
GEMV = {
- "label_names": ["CLBlast", "clBLAS"],
"num_rows": 2, "num_cols": 3,
"benchmarks": [
{
"name": "gemv", "num_runs": 40,
"title": "multiples of 256",
"x_label": "sizes (n=m)", "x_keys": ["n"],
- "y_label": "GB/s (higher is better)", "y_keys": ["GBs_1", "GBs_2"],
+ "y_label": "GB/s (higher is better)", "y_key": "GBs",
"arguments": [{"n": 256, "m": 256, "incx": 1, "incy": 1, "layout": 102, "step": 256, "num_steps": 20}],
},
{
"name": "gemv", "num_runs": 40,
"title": "multiples of 257",
"x_label": "sizes (n=m)", "x_keys": ["n"],
- "y_label": "GB/s (higher is better)", "y_keys": ["GBs_1", "GBs_2"],
+ "y_label": "GB/s (higher is better)", "y_key": "GBs",
"arguments": [{"n": 257, "m": 257, "incx": 1, "incy": 1, "layout": 102, "step": 257, "num_steps": 20}],
},
{
"name": "gemv", "num_runs": 20,
"title": "around 4K",
"x_label": "sizes (n=m)", "x_keys": ["n"],
- "y_label": "GB/s (higher is better)", "y_keys": ["GBs_1", "GBs_2"],
+ "y_label": "GB/s (higher is better)", "y_key": "GBs",
"arguments": [{"n": 4096, "m": 4096, "incx": 1, "incy": 1, "layout": 102, "step": 1, "num_steps": 16}],
},
{
"name": "gemv", "num_runs": 40,
"title": "multiples of 256 rotated",
"x_label": "sizes (n=m)", "x_keys": ["n"],
- "y_label": "GB/s (higher is better)", "y_keys": ["GBs_1", "GBs_2"],
+ "y_label": "GB/s (higher is better)", "y_key": "GBs",
"arguments": [{"n": 256, "m": 256, "incx": 1, "incy": 1, "layout": 101, "step": 256, "num_steps": 20}],
},
{
"name": "gemv", "num_runs": 40,
"title": "multiples of 257 rotated",
"x_label": "sizes (n=m)", "x_keys": ["n"],
- "y_label": "GB/s (higher is better)", "y_keys": ["GBs_1", "GBs_2"],
+ "y_label": "GB/s (higher is better)", "y_key": "GBs",
"arguments": [{"n": 257, "m": 257, "incx": 1, "incy": 1, "layout": 101, "step": 257, "num_steps": 20}],
},
{
"name": "gemv", "num_runs": 20,
"title": "strides n=m=4K",
"x_label": "increments/strides for x,y", "x_keys": ["incx", "incy"],
- "y_label": "GB/s (higher is better)", "y_keys": ["GBs_1", "GBs_2"],
+ "y_label": "GB/s (higher is better)", "y_key": "GBs",
"arguments": [{"n": 4096, "m": 4096, "incx": inc_x, "incy": inc_y, "layout": 102, "step": 0, "num_steps": 1}
for inc_x in [1, 2, 4] for inc_y in [1, 2, 4]],
}
@@ -142,14 +139,13 @@ GEMV = {
}
GEMM = {
- "label_names": ["CLBlast", "clBLAS"],
"num_rows": 2, "num_cols": 3,
"benchmarks": [
{
"name": "gemm", "num_runs": 20,
"title": "multiples of 128",
"x_label": "sizes (m=n=k)", "x_keys": ["m"],
- "y_label": "GFLOPS (higher is better)", "y_keys": ["GFLOPS_1", "GFLOPS_2"],
+ "y_label": "GFLOPS (higher is better)", "y_key": "GFLOPS",
"arguments": [{"m": 128, "n": 128, "k": 128, "layout": 102,
"transA": 111, "transB": 111, "step": 128, "num_steps": 20}],
},
@@ -157,7 +153,7 @@ GEMM = {
"name": "gemm", "num_runs": 20,
"title": "multiples of 129",
"x_label": "sizes (m=n=k)", "x_keys": ["m"],
- "y_label": "GFLOPS (higher is better)", "y_keys": ["GFLOPS_1", "GFLOPS_2"],
+ "y_label": "GFLOPS (higher is better)", "y_key": "GFLOPS",
"arguments": [{"m": 129, "n": 129, "k": 129, "layout": 102,
"transA": 111, "transB": 111, "step": 129, "num_steps": 20}],
},
@@ -165,7 +161,7 @@ GEMM = {
"name": "gemm", "num_runs": 20,
"title": "around 512",
"x_label": "sizes (m=n=k)", "x_keys": ["m"],
- "y_label": "GFLOPS (higher is better)", "y_keys": ["GFLOPS_1", "GFLOPS_2"],
+ "y_label": "GFLOPS (higher is better)", "y_key": "GFLOPS",
"arguments": [{"m": 512, "n": 512, "k": 512, "layout": 102,
"transA": 111, "transB": 111, "step": 1, "num_steps": 16}],
},
@@ -173,7 +169,7 @@ GEMM = {
"name": "gemm", "num_runs": 10,
"title": "around 2048",
"x_label": "sizes (m=n=k)", "x_keys": ["m"],
- "y_label": "GFLOPS (higher is better)", "y_keys": ["GFLOPS_1", "GFLOPS_2"],
+ "y_label": "GFLOPS (higher is better)", "y_key": "GFLOPS",
"arguments": [{"m": 2048, "n": 2048, "k": 2048, "layout": 102,
"transA": 111, "transB": 111, "step": 1, "num_steps": 16}],
},
@@ -181,7 +177,7 @@ GEMM = {
"name": "gemm", "num_runs": 10,
"title": "layouts/transpose",
"x_label": "layout, transA, transB", "x_keys": ["layout", "transA", "transB"],
- "y_label": "GFLOPS (higher is better)", "y_keys": ["GFLOPS_1", "GFLOPS_2"],
+ "y_label": "GFLOPS (higher is better)", "y_key": "GFLOPS",
"arguments": [{"m": 1024, "n": 1024, "k": 1024, "layout": layout,
"transA": transA, "transB": transB, "step": 0, "num_steps": 1}
for layout in [101, 102] for transA in [111, 112] for transB in [111, 112]],
@@ -190,7 +186,7 @@ GEMM = {
"name": "gemm", "num_runs": 10,
"title": "powers of 2",
"x_label": "sizes (m=n=k)", "x_keys": ["m"],
- "y_label": "GFLOPS (higher is better)", "y_keys": ["GFLOPS_1", "GFLOPS_2"],
+ "y_label": "GFLOPS (higher is better)", "y_key": "GFLOPS",
"arguments": [{"m": n, "n": n, "k": n, "layout": 102,
"transA": 111, "transB": 111, "step": 0, "num_steps": 1}
for n in utils.powers_of_2(8, utils.k(4))],
@@ -199,14 +195,13 @@ GEMM = {
}
GEMM_SMALL = {
- "label_names": ["CLBlast", "clBLAS"],
"num_rows": 2, "num_cols": 1,
"benchmarks": [
{
"name": "gemm", "num_runs": 10,
"title": "small matrices in steps of 16",
"x_label": "sizes (m=n=k)", "x_keys": ["m"],
- "y_label": "GFLOPS (higher is better)", "y_keys": ["GFLOPS_1", "GFLOPS_2"],
+ "y_label": "GFLOPS (higher is better)", "y_key": "GFLOPS",
"arguments": [{"m": 128, "n": 128, "k": 128, "layout": 102,
"transA": 111, "transB": 111, "step": 16, "num_steps": 57}],
},
@@ -214,7 +209,7 @@ GEMM_SMALL = {
"name": "gemm", "num_runs": 10,
"title": "small matrices in steps of 1",
"x_label": "sizes (m=n=k)", "x_keys": ["m"],
- "y_label": "GFLOPS (higher is better)", "y_keys": ["GFLOPS_1", "GFLOPS_2"],
+ "y_label": "GFLOPS (higher is better)", "y_key": "GFLOPS",
"arguments": [{"m": 128, "n": 128, "k": 128, "layout": 102,
"transA": 111, "transB": 111, "step": 1, "num_steps": 385}],
},
@@ -223,14 +218,13 @@ GEMM_SMALL = {
}
GEMMBATCHED = {
- "label_names": ["CLBlast", "clBLAS (non batched)"],
"num_rows": 1, "num_cols": 3,
"benchmarks": [
{
"name": "gemmbatched", "num_runs": 40,
"title": "8 GEMMs",
"x_label": "sizes (m=n=k)", "x_keys": ["m"],
- "y_label": "GFLOPS (higher is better)", "y_keys": ["GFLOPS_1", "GFLOPS_2"],
+ "y_label": "GFLOPS (higher is better)", "y_key": "GFLOPS",
"arguments": [{"batch_num": 8, "m": 32, "n": 32, "k": 32, "layout": 102,
"transA": 111, "transB": 111, "step": 32, "num_steps": 20}],
},
@@ -238,7 +232,7 @@ GEMMBATCHED = {
"name": "gemmbatched", "num_runs": 20,
"title": "64 GEMMs",
"x_label": "sizes (m=n=k)", "x_keys": ["m"],
- "y_label": "GFLOPS (higher is better)", "y_keys": ["GFLOPS_1", "GFLOPS_2"],
+ "y_label": "GFLOPS (higher is better)", "y_key": "GFLOPS",
"arguments": [{"batch_num": 64, "m": 32, "n": 32, "k": 32, "layout": 102,
"transA": 111, "transB": 111, "step": 32, "num_steps": 20}],
},
@@ -246,7 +240,7 @@ GEMMBATCHED = {
"name": "gemmbatched", "num_runs": 30,
"title": "m=n=k=128",
"x_label": "batch size", "x_keys": ["batch_num"],
- "y_label": "GFLOPS (higher is better)", "y_keys": ["GFLOPS_1", "GFLOPS_2"],
+ "y_label": "GFLOPS (higher is better)", "y_key": "GFLOPS",
"arguments": [{"batch_num": b, "m": 128, "n": 128, "k": 128, "layout": 102,
"transA": 111, "transB": 111} for b in utils.powers_of_2(1, utils.k(16))],
}
@@ -254,14 +248,13 @@ GEMMBATCHED = {
}
SYMM = {
- "label_names": ["CLBlast", "clBLAS"],
"num_rows": 2, "num_cols": 3,
"benchmarks": [
{
"name": "symm", "num_runs": 10,
"title": "multiples of 128",
"x_label": "sizes (m=n)", "x_keys": ["m"],
- "y_label": "GFLOPS (higher is better)", "y_keys": ["GFLOPS_1", "GFLOPS_2"],
+ "y_label": "GFLOPS (higher is better)", "y_key": "GFLOPS",
"arguments": [{"m": 128, "n": 128, "layout": 102,
"side": 141, "triangle": 121, "step": 128, "num_steps": 20}],
},
@@ -269,7 +262,7 @@ SYMM = {
"name": "symm", "num_runs": 10,
"title": "multiples of 129",
"x_label": "sizes (m=n)", "x_keys": ["m"],
- "y_label": "GFLOPS (higher is better)", "y_keys": ["GFLOPS_1", "GFLOPS_2"],
+ "y_label": "GFLOPS (higher is better)", "y_key": "GFLOPS",
"arguments": [{"m": 129, "n": 129, "layout": 102,
"side": 141, "triangle": 121, "step": 129, "num_steps": 20}],
},
@@ -277,7 +270,7 @@ SYMM = {
"name": "symm", "num_runs": 10,
"title": "around 512",
"x_label": "sizes (m=n)", "x_keys": ["m"],
- "y_label": "GFLOPS (higher is better)", "y_keys": ["GFLOPS_1", "GFLOPS_2"],
+ "y_label": "GFLOPS (higher is better)", "y_key": "GFLOPS",
"arguments": [{"m": 512, "n": 512, "layout": 102,
"side": 141, "triangle": 121, "step": 1, "num_steps": 16}],
},
@@ -285,7 +278,7 @@ SYMM = {
"name": "symm", "num_runs": 10,
"title": "around 2048",
"x_label": "sizes (m=n)", "x_keys": ["m"],
- "y_label": "GFLOPS (higher is better)", "y_keys": ["GFLOPS_1", "GFLOPS_2"],
+ "y_label": "GFLOPS (higher is better)", "y_key": "GFLOPS",
"arguments": [{"m": 2048, "n": 2048, "layout": 102,
"side": 141, "triangle": 121, "step": 1, "num_steps": 16}],
},
@@ -293,7 +286,7 @@ SYMM = {
"name": "symm", "num_runs": 10,
"title": "layouts/sides/triangles",
"x_label": "layout, side, triangle", "x_keys": ["layout", "side", "triangle"],
- "y_label": "GFLOPS (higher is better)", "y_keys": ["GFLOPS_1", "GFLOPS_2"],
+ "y_label": "GFLOPS (higher is better)", "y_key": "GFLOPS",
"arguments": [{"m": 1024, "n": 1024, "layout": layout,
"side": side, "triangle": triangle, "step": 0, "num_steps": 1}
for layout in [101, 102] for side in [141, 142] for triangle in [121, 122]],
@@ -302,7 +295,7 @@ SYMM = {
"name": "symm", "num_runs": 10,
"title": "powers of 2",
"x_label": "sizes (m=n)", "x_keys": ["m"],
- "y_label": "GFLOPS (higher is better)", "y_keys": ["GFLOPS_1", "GFLOPS_2"],
+ "y_label": "GFLOPS (higher is better)", "y_key": "GFLOPS",
"arguments": [{"m": n, "n": n, "layout": 102,
"side": 141, "triangle": 121, "step": 0, "num_steps": 1}
for n in utils.powers_of_2(8, utils.k(4))],
@@ -311,14 +304,13 @@ SYMM = {
}
SYRK = {
- "label_names": ["CLBlast", "clBLAS"],
"num_rows": 2, "num_cols": 3,
"benchmarks": [
{
"name": "syrk", "num_runs": 10,
"title": "multiples of 128",
"x_label": "sizes (n=k)", "x_keys": ["n"],
- "y_label": "GFLOPS (higher is better)", "y_keys": ["GFLOPS_1", "GFLOPS_2"],
+ "y_label": "GFLOPS (higher is better)", "y_key": "GFLOPS",
"arguments": [{"n": 128, "k": 128, "layout": 102,
"side": 141, "triangle": 121, "step": 128, "num_steps": 20}],
},
@@ -326,7 +318,7 @@ SYRK = {
"name": "syrk", "num_runs": 10,
"title": "multiples of 129",
"x_label": "sizes (n=k)", "x_keys": ["n"],
- "y_label": "GFLOPS (higher is better)", "y_keys": ["GFLOPS_1", "GFLOPS_2"],
+ "y_label": "GFLOPS (higher is better)", "y_key": "GFLOPS",
"arguments": [{"n": 129, "k": 129, "layout": 102,
"side": 141, "triangle": 121, "step": 129, "num_steps": 20}],
},
@@ -334,7 +326,7 @@ SYRK = {
"name": "syrk", "num_runs": 10,
"title": "around 512",
"x_label": "sizes (n=k)", "x_keys": ["n"],
- "y_label": "GFLOPS (higher is better)", "y_keys": ["GFLOPS_1", "GFLOPS_2"],
+ "y_label": "GFLOPS (higher is better)", "y_key": "GFLOPS",
"arguments": [{"n": 512, "k": 512, "layout": 102,
"side": 141, "triangle": 121, "step": 1, "num_steps": 16}],
},
@@ -342,7 +334,7 @@ SYRK = {
"name": "syrk", "num_runs": 10,
"title": "around 2048",
"x_label": "sizes (n=k)", "x_keys": ["n"],
- "y_label": "GFLOPS (higher is better)", "y_keys": ["GFLOPS_1", "GFLOPS_2"],
+ "y_label": "GFLOPS (higher is better)", "y_key": "GFLOPS",
"arguments": [{"n": 2048, "k": 2048, "layout": 102,
"side": 141, "triangle": 121, "step": 1, "num_steps": 16}],
},
@@ -350,7 +342,7 @@ SYRK = {
"name": "syrk", "num_runs": 10,
"title": "layouts/sides/triangles",
"x_label": "layout, triangle, transA", "x_keys": ["layout", "triangle", "transA"],
- "y_label": "GFLOPS (higher is better)", "y_keys": ["GFLOPS_1", "GFLOPS_2"],
+ "y_label": "GFLOPS (higher is better)", "y_key": "GFLOPS",
"arguments": [{"n": 1024, "k": 1024, "layout": layout,
"triangle": triangle, "transA": transA, "step": 0, "num_steps": 1}
for layout in [101, 102] for triangle in [121, 122] for transA in [111, 112]],
@@ -359,7 +351,7 @@ SYRK = {
"name": "syrk", "num_runs": 10,
"title": "powers of 2",
"x_label": "sizes (n=k)", "x_keys": ["n"],
- "y_label": "GFLOPS (higher is better)", "y_keys": ["GFLOPS_1", "GFLOPS_2"],
+ "y_label": "GFLOPS (higher is better)", "y_key": "GFLOPS",
"arguments": [{"n": n, "k": n, "layout": 102,
"side": 141, "triangle": 121, "step": 0, "num_steps": 1}
for n in utils.powers_of_2(8, utils.k(4))],
@@ -368,7 +360,6 @@ SYRK = {
}
SUMMARY = {
- "label_names": ["CLBlast", "clBLAS"],
"num_rows": 3, "num_cols": 2,
"benchmarks": [
AXPY["benchmarks"][0],