summary | refs | log | tree | commit | diff
diff options
context:
space:
mode:
author Cedric Nugteren <web@cedricnugteren.nl> 2023-01-21 21:13:49 +0100
committer Cedric Nugteren <web@cedricnugteren.nl> 2023-01-21 21:13:49 +0100
commit c9856758b3c83c53a1185f848f23b55de1c9a2cc (patch)
tree 369b50d015c70a02cfcec5ef16b0a8d0112342c1
parent f4a14daf8d1e0f980f9532669647eadb91cdad65 (diff)
Add tuning results for Intel FPGA emulation device
-rw-r--r-- src/database/kernels/copy/copy_32.hpp | 3
-rw-r--r-- src/database/kernels/copy/copy_3232.hpp | 1
-rw-r--r-- src/database/kernels/gemm_routine/gemm_routine_32.hpp | 8
-rw-r--r-- src/database/kernels/gemm_routine/gemm_routine_3232.hpp | 8
-rw-r--r-- src/database/kernels/invert/invert_32.hpp | 8
-rw-r--r-- src/database/kernels/invert/invert_3232.hpp | 8
-rw-r--r-- src/database/kernels/pad/pad_32.hpp | 1
-rw-r--r-- src/database/kernels/pad/pad_3232.hpp | 1
-rw-r--r-- src/database/kernels/padtranspose/padtranspose_32.hpp | 1
-rw-r--r-- src/database/kernels/padtranspose/padtranspose_3232.hpp | 3
-rw-r--r-- src/database/kernels/transpose/transpose_32.hpp | 3
-rw-r--r-- src/database/kernels/transpose/transpose_3232.hpp | 8
-rw-r--r-- src/database/kernels/trsv_routine/trsv_routine_32.hpp | 8
-rw-r--r-- src/database/kernels/trsv_routine/trsv_routine_3232.hpp | 8
-rw-r--r-- src/database/kernels/xaxpy/xaxpy_32.hpp | 3
-rw-r--r-- src/database/kernels/xaxpy/xaxpy_3232.hpp | 1
-rw-r--r-- src/database/kernels/xconvgemm/xconvgemm_32.hpp | 8
-rw-r--r-- src/database/kernels/xdot/xdot_32.hpp | 8
-rw-r--r-- src/database/kernels/xdot/xdot_3232.hpp | 8
-rw-r--r-- src/database/kernels/xgemm/xgemm_32.hpp | 5
-rw-r--r-- src/database/kernels/xgemm/xgemm_3232.hpp | 3
-rw-r--r-- src/database/kernels/xgemm_direct/xgemm_direct_32.hpp | 8
-rw-r--r-- src/database/kernels/xgemm_direct/xgemm_direct_3232.hpp | 8
-rw-r--r-- src/database/kernels/xgemv/xgemv_32.hpp | 3
-rw-r--r-- src/database/kernels/xgemv/xgemv_3232.hpp | 1
-rw-r--r-- src/database/kernels/xgemv_fast/xgemv_fast_32.hpp | 1
-rw-r--r-- src/database/kernels/xgemv_fast/xgemv_fast_3232.hpp | 1
-rw-r--r-- src/database/kernels/xgemv_fast_rot/xgemv_fast_rot_32.hpp | 8
-rw-r--r-- src/database/kernels/xgemv_fast_rot/xgemv_fast_rot_3232.hpp | 8
-rw-r--r-- src/database/kernels/xger/xger_32.hpp | 8
-rw-r--r-- src/database/kernels/xger/xger_3232.hpp | 8
31 files changed, 151 insertions, 8 deletions
diff --git a/src/database/kernels/copy/copy_32.hpp b/src/database/kernels/copy/copy_32.hpp
index 75bd173a..1dfe3d4d 100644
--- a/src/database/kernels/copy/copy_32.hpp
+++ b/src/database/kernels/copy/copy_32.hpp
@@ -118,8 +118,9 @@ const DatabaseEntry CopySingle = {
{ // Intel accelerators
kDeviceTypeAccelerator, "Intel", {
{ "default", {
+ { Name{"Intel(R) FPGA Emulation Device "}, Params{ 16, 8, 4, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 } },
{ Name{"Intel(R) Many Integrated Core Acceleration Card "}, Params{ 32, 8, 8, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 } },
- { kDeviceNameDefault , Params{ 32, 8, 8, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 } },
+ { kDeviceNameDefault , Params{ 32, 8, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 } },
} },
}
},
diff --git a/src/database/kernels/copy/copy_3232.hpp b/src/database/kernels/copy/copy_3232.hpp
index 13bf046e..cd61d720 100644
--- a/src/database/kernels/copy/copy_3232.hpp
+++ b/src/database/kernels/copy/copy_3232.hpp
@@ -115,6 +115,7 @@ const DatabaseEntry CopyComplexSingle = {
{ // Intel accelerators
kDeviceTypeAccelerator, "Intel", {
{ "default", {
+ { Name{"Intel(R) FPGA Emulation Device "}, Params{ 32, 8, 1, 2, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 } },
{ Name{"Intel(R) Many Integrated Core Acceleration Card "}, Params{ 32, 8, 4, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 } },
{ kDeviceNameDefault , Params{ 32, 8, 4, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 } },
} },
diff --git a/src/database/kernels/gemm_routine/gemm_routine_32.hpp b/src/database/kernels/gemm_routine/gemm_routine_32.hpp
index 17c7412b..54c2362a 100644
--- a/src/database/kernels/gemm_routine/gemm_routine_32.hpp
+++ b/src/database/kernels/gemm_routine/gemm_routine_32.hpp
@@ -58,6 +58,14 @@ const DatabaseEntry GemmRoutineSingle = {
} },
}
},
+ { // Intel accelerators
+ kDeviceTypeAccelerator, "Intel", {
+ { "default", {
+ { Name{"Intel(R) FPGA Emulation Device "}, Params{ 1344, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 } },
+ { kDeviceNameDefault , Params{ 1344, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 } },
+ } },
+ }
+ },
{ // NVIDIA GPUs
kDeviceTypeGPU, "NVIDIA", {
{ "SM5.0", {
diff --git a/src/database/kernels/gemm_routine/gemm_routine_3232.hpp b/src/database/kernels/gemm_routine/gemm_routine_3232.hpp
index d9d16f9c..a50580c7 100644
--- a/src/database/kernels/gemm_routine/gemm_routine_3232.hpp
+++ b/src/database/kernels/gemm_routine/gemm_routine_3232.hpp
@@ -49,6 +49,14 @@ const DatabaseEntry GemmRoutineComplexSingle = {
} },
}
},
+ { // Intel accelerators
+ kDeviceTypeAccelerator, "Intel", {
+ { "default", {
+ { Name{"Intel(R) FPGA Emulation Device "}, Params{ 832, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 } },
+ { kDeviceNameDefault , Params{ 832, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 } },
+ } },
+ }
+ },
{ // NVIDIA GPUs
kDeviceTypeGPU, "NVIDIA", {
{ "SM5.0", {
diff --git a/src/database/kernels/invert/invert_32.hpp b/src/database/kernels/invert/invert_32.hpp
index 979c51aa..c6601c18 100644
--- a/src/database/kernels/invert/invert_32.hpp
+++ b/src/database/kernels/invert/invert_32.hpp
@@ -49,6 +49,14 @@ const DatabaseEntry InvertSingle = {
} },
}
},
+ { // Intel accelerators
+ kDeviceTypeAccelerator, "Intel", {
+ { "default", {
+ { Name{"Intel(R) FPGA Emulation Device "}, Params{ 16, 0, 4, 4, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 } },
+ { kDeviceNameDefault , Params{ 16, 0, 4, 4, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 } },
+ } },
+ }
+ },
{ // NVIDIA GPUs
kDeviceTypeGPU, "NVIDIA", {
{ "SM5.0", {
diff --git a/src/database/kernels/invert/invert_3232.hpp b/src/database/kernels/invert/invert_3232.hpp
index 44cbe56b..fb8e72d0 100644
--- a/src/database/kernels/invert/invert_3232.hpp
+++ b/src/database/kernels/invert/invert_3232.hpp
@@ -48,6 +48,14 @@ const DatabaseEntry InvertComplexSingle = {
} },
}
},
+ { // Intel accelerators
+ kDeviceTypeAccelerator, "Intel", {
+ { "default", {
+ { Name{"Intel(R) FPGA Emulation Device "}, Params{ 16, 1, 4, 4, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 } },
+ { kDeviceNameDefault , Params{ 16, 1, 4, 4, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 } },
+ } },
+ }
+ },
{ // NVIDIA GPUs
kDeviceTypeGPU, "NVIDIA", {
{ "SM5.0", {
diff --git a/src/database/kernels/pad/pad_32.hpp b/src/database/kernels/pad/pad_32.hpp
index 23d2f5e3..f9f8c4b9 100644
--- a/src/database/kernels/pad/pad_32.hpp
+++ b/src/database/kernels/pad/pad_32.hpp
@@ -117,6 +117,7 @@ const DatabaseEntry PadSingle = {
{ // Intel accelerators
kDeviceTypeAccelerator, "Intel", {
{ "default", {
+ { Name{"Intel(R) FPGA Emulation Device "}, Params{ 32, 32, 4, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 } },
{ Name{"Intel(R) Many Integrated Core Acceleration Card "}, Params{ 32, 16, 2, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 } },
{ kDeviceNameDefault , Params{ 32, 16, 2, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 } },
} },
diff --git a/src/database/kernels/pad/pad_3232.hpp b/src/database/kernels/pad/pad_3232.hpp
index c4d55e02..cae4e3e2 100644
--- a/src/database/kernels/pad/pad_3232.hpp
+++ b/src/database/kernels/pad/pad_3232.hpp
@@ -115,6 +115,7 @@ const DatabaseEntry PadComplexSingle = {
{ // Intel accelerators
kDeviceTypeAccelerator, "Intel", {
{ "default", {
+ { Name{"Intel(R) FPGA Emulation Device "}, Params{ 32, 8, 4, 2, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 } },
{ Name{"Intel(R) Many Integrated Core Acceleration Card "}, Params{ 32, 8, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 } },
{ kDeviceNameDefault , Params{ 32, 8, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 } },
} },
diff --git a/src/database/kernels/padtranspose/padtranspose_32.hpp b/src/database/kernels/padtranspose/padtranspose_32.hpp
index 3feba8d1..d0f424d4 100644
--- a/src/database/kernels/padtranspose/padtranspose_32.hpp
+++ b/src/database/kernels/padtranspose/padtranspose_32.hpp
@@ -117,6 +117,7 @@ const DatabaseEntry PadtransposeSingle = {
{ // Intel accelerators
kDeviceTypeAccelerator, "Intel", {
{ "default", {
+ { Name{"Intel(R) FPGA Emulation Device "}, Params{ 1, 16, 4, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 } },
{ Name{"Intel(R) Many Integrated Core Acceleration Card "}, Params{ 0, 16, 2, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 } },
{ kDeviceNameDefault , Params{ 0, 16, 2, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 } },
} },
diff --git a/src/database/kernels/padtranspose/padtranspose_3232.hpp b/src/database/kernels/padtranspose/padtranspose_3232.hpp
index 83521ed2..2c67c4ab 100644
--- a/src/database/kernels/padtranspose/padtranspose_3232.hpp
+++ b/src/database/kernels/padtranspose/padtranspose_3232.hpp
@@ -115,8 +115,9 @@ const DatabaseEntry PadtransposeComplexSingle = {
{ // Intel accelerators
kDeviceTypeAccelerator, "Intel", {
{ "default", {
+ { Name{"Intel(R) FPGA Emulation Device "}, Params{ 0, 64, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 } },
{ Name{"Intel(R) Many Integrated Core Acceleration Card "}, Params{ 1, 16, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 } },
- { kDeviceNameDefault , Params{ 1, 16, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 } },
+ { kDeviceNameDefault , Params{ 0, 16, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 } },
} },
}
},
diff --git a/src/database/kernels/transpose/transpose_32.hpp b/src/database/kernels/transpose/transpose_32.hpp
index dbeb811a..efdd4a98 100644
--- a/src/database/kernels/transpose/transpose_32.hpp
+++ b/src/database/kernels/transpose/transpose_32.hpp
@@ -116,8 +116,9 @@ const DatabaseEntry TransposeSingle = {
{ // Intel accelerators
kDeviceTypeAccelerator, "Intel", {
{ "default", {
+ { Name{"Intel(R) FPGA Emulation Device "}, Params{ 8, 0, 0, 16, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 } },
{ Name{"Intel(R) Many Integrated Core Acceleration Card "}, Params{ 16, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 } },
- { kDeviceNameDefault , Params{ 16, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 } },
+ { kDeviceNameDefault , Params{ 32, 1, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 } },
} },
}
},
diff --git a/src/database/kernels/transpose/transpose_3232.hpp b/src/database/kernels/transpose/transpose_3232.hpp
index 2ad3c281..aca897b3 100644
--- a/src/database/kernels/transpose/transpose_3232.hpp
+++ b/src/database/kernels/transpose/transpose_3232.hpp
@@ -112,6 +112,14 @@ const DatabaseEntry TransposeComplexSingle = {
} },
}
},
+ { // Intel accelerators
+ kDeviceTypeAccelerator, "Intel", {
+ { "default", {
+ { Name{"Intel(R) FPGA Emulation Device "}, Params{ 8, 0, 0, 4, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 } },
+ { kDeviceNameDefault , Params{ 8, 0, 0, 4, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 } },
+ } },
+ }
+ },
{ // NVIDIA GPUs
kDeviceTypeGPU, "NVIDIA", {
{ "SM2.0", {
diff --git a/src/database/kernels/trsv_routine/trsv_routine_32.hpp b/src/database/kernels/trsv_routine/trsv_routine_32.hpp
index 5360d6cf..ccc98856 100644
--- a/src/database/kernels/trsv_routine/trsv_routine_32.hpp
+++ b/src/database/kernels/trsv_routine/trsv_routine_32.hpp
@@ -49,6 +49,14 @@ const DatabaseEntry TrsvRoutineSingle = {
} },
}
},
+ { // Intel accelerators
+ kDeviceTypeAccelerator, "Intel", {
+ { "default", {
+ { Name{"Intel(R) FPGA Emulation Device "}, Params{ 32, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 } },
+ { kDeviceNameDefault , Params{ 32, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 } },
+ } },
+ }
+ },
{ // NVIDIA GPUs
kDeviceTypeGPU, "NVIDIA", {
{ "SM6.0", {
diff --git a/src/database/kernels/trsv_routine/trsv_routine_3232.hpp b/src/database/kernels/trsv_routine/trsv_routine_3232.hpp
index 8edeaf83..55328375 100644
--- a/src/database/kernels/trsv_routine/trsv_routine_3232.hpp
+++ b/src/database/kernels/trsv_routine/trsv_routine_3232.hpp
@@ -48,6 +48,14 @@ const DatabaseEntry TrsvRoutineComplexSingle = {
} },
}
},
+ { // Intel accelerators
+ kDeviceTypeAccelerator, "Intel", {
+ { "default", {
+ { Name{"Intel(R) FPGA Emulation Device "}, Params{ 32, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 } },
+ { kDeviceNameDefault , Params{ 32, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 } },
+ } },
+ }
+ },
{ // NVIDIA GPUs
kDeviceTypeGPU, "NVIDIA", {
{ "SM6.0", {
diff --git a/src/database/kernels/xaxpy/xaxpy_32.hpp b/src/database/kernels/xaxpy/xaxpy_32.hpp
index 8b5a41ef..2a5d291f 100644
--- a/src/database/kernels/xaxpy/xaxpy_32.hpp
+++ b/src/database/kernels/xaxpy/xaxpy_32.hpp
@@ -117,8 +117,9 @@ const DatabaseEntry XaxpySingle = {
{ // Intel accelerators
kDeviceTypeAccelerator, "Intel", {
{ "default", {
+ { Name{"Intel(R) FPGA Emulation Device "}, Params{ 1, 512, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 } },
{ Name{"Intel(R) Many Integrated Core Acceleration Card "}, Params{ 2, 1024, 2, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 } },
- { kDeviceNameDefault , Params{ 2, 1024, 2, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 } },
+ { kDeviceNameDefault , Params{ 2, 2048, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 } },
} },
}
},
diff --git a/src/database/kernels/xaxpy/xaxpy_3232.hpp b/src/database/kernels/xaxpy/xaxpy_3232.hpp
index 1e811de3..83af95c8 100644
--- a/src/database/kernels/xaxpy/xaxpy_3232.hpp
+++ b/src/database/kernels/xaxpy/xaxpy_3232.hpp
@@ -115,6 +115,7 @@ const DatabaseEntry XaxpyComplexSingle = {
{ // Intel accelerators
kDeviceTypeAccelerator, "Intel", {
{ "default", {
+ { Name{"Intel(R) FPGA Emulation Device "}, Params{ 1, 1024, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 } },
{ Name{"Intel(R) Many Integrated Core Acceleration Card "}, Params{ 1, 1024, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 } },
{ kDeviceNameDefault , Params{ 1, 1024, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 } },
} },
diff --git a/src/database/kernels/xconvgemm/xconvgemm_32.hpp b/src/database/kernels/xconvgemm/xconvgemm_32.hpp
index 814c46e5..764e6b7c 100644
--- a/src/database/kernels/xconvgemm/xconvgemm_32.hpp
+++ b/src/database/kernels/xconvgemm/xconvgemm_32.hpp
@@ -45,6 +45,14 @@ const DatabaseEntry XconvgemmSingle = {
} },
}
},
+ { // Intel accelerators
+ kDeviceTypeAccelerator, "Intel", {
+ { "default", {
+ { Name{"Intel(R) FPGA Emulation Device "}, Params{ 1, 8, 32, 32, 8, 0, 0, 1, 1, 32, 0, 0, 0, 0, 0, 0 } },
+ { kDeviceNameDefault , Params{ 1, 8, 32, 32, 8, 0, 0, 1, 1, 32, 0, 0, 0, 0, 0, 0 } },
+ } },
+ }
+ },
{ // NVIDIA GPUs
kDeviceTypeGPU, "NVIDIA", {
{ "SM7.0", {
diff --git a/src/database/kernels/xdot/xdot_32.hpp b/src/database/kernels/xdot/xdot_32.hpp
index 394dce19..a793f869 100644
--- a/src/database/kernels/xdot/xdot_32.hpp
+++ b/src/database/kernels/xdot/xdot_32.hpp
@@ -107,6 +107,14 @@ const DatabaseEntry XdotSingle = {
} },
}
},
+ { // Intel accelerators
+ kDeviceTypeAccelerator, "Intel", {
+ { "default", {
+ { Name{"Intel(R) FPGA Emulation Device "}, Params{ 1024, 128, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 } },
+ { kDeviceNameDefault , Params{ 1024, 128, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 } },
+ } },
+ }
+ },
{ // NVIDIA GPUs
kDeviceTypeGPU, "NVIDIA", {
{ "SM2.0", {
diff --git a/src/database/kernels/xdot/xdot_3232.hpp b/src/database/kernels/xdot/xdot_3232.hpp
index 03c4b8ed..06d8190e 100644
--- a/src/database/kernels/xdot/xdot_3232.hpp
+++ b/src/database/kernels/xdot/xdot_3232.hpp
@@ -105,6 +105,14 @@ const DatabaseEntry XdotComplexSingle = {
} },
}
},
+ { // Intel accelerators
+ kDeviceTypeAccelerator, "Intel", {
+ { "default", {
+ { Name{"Intel(R) FPGA Emulation Device "}, Params{ 1024, 256, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 } },
+ { kDeviceNameDefault , Params{ 1024, 256, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 } },
+ } },
+ }
+ },
{ // NVIDIA GPUs
kDeviceTypeGPU, "NVIDIA", {
{ "SM2.0", {
diff --git a/src/database/kernels/xgemm/xgemm_32.hpp b/src/database/kernels/xgemm/xgemm_32.hpp
index a9b2417f..eb437d86 100644
--- a/src/database/kernels/xgemm/xgemm_32.hpp
+++ b/src/database/kernels/xgemm/xgemm_32.hpp
@@ -117,8 +117,9 @@ const DatabaseEntry XgemmSingle = {
{ // Intel accelerators
kDeviceTypeAccelerator, "Intel", {
{ "default", {
+ { Name{"Intel(R) FPGA Emulation Device "}, Params{ 0, 1, 16, 2, 8, 16, 64, 8, 8, 64, 0, 0, 1, 0, 1, 4 } },
{ Name{"Intel(R) Many Integrated Core Acceleration Card "}, Params{ 0, 1, 32, 2, 32, 32, 32, 32, 8, 128, 0, 0, 1, 0, 1, 4 } },
- { kDeviceNameDefault , Params{ 0, 1, 32, 2, 32, 32, 32, 32, 8, 128, 0, 0, 1, 0, 1, 4 } },
+ { kDeviceNameDefault , Params{ 0, 1, 16, 2, 8, 16, 32, 8, 8, 64, 0, 0, 1, 0, 1, 4 } },
} },
}
},
@@ -207,7 +208,7 @@ const DatabaseEntry XgemmSingle = {
{ // Default
kDeviceTypeAll, "default", {
{ "default", {
- { kDeviceNameDefault , Params{ 0, 1, 32, 2, 8, 8, 32, 16, 16, 32, 1, 1, 0, 0, 4, 2 } },
+ { kDeviceNameDefault , Params{ 0, 1, 32, 2, 16, 16, 32, 8, 8, 32, 1, 1, 0, 0, 2, 4 } },
} },
}
},
diff --git a/src/database/kernels/xgemm/xgemm_3232.hpp b/src/database/kernels/xgemm/xgemm_3232.hpp
index ad6470da..f4f43030 100644
--- a/src/database/kernels/xgemm/xgemm_3232.hpp
+++ b/src/database/kernels/xgemm/xgemm_3232.hpp
@@ -111,8 +111,9 @@ const DatabaseEntry XgemmComplexSingle = {
{ // Intel accelerators
kDeviceTypeAccelerator, "Intel", {
{ "default", {
+ { Name{"Intel(R) FPGA Emulation Device "}, Params{ 1, 4, 1, 1, 16, 16, 16, 16, 16, 64, 0, 0, 0, 0, 1, 1 } },
{ Name{"Intel(R) Many Integrated Core Acceleration Card "}, Params{ 0, 1, 32, 2, 32, 32, 32, 32, 16, 128, 1, 0, 0, 0, 1, 4 } },
- { kDeviceNameDefault , Params{ 0, 1, 32, 2, 32, 32, 32, 32, 16, 128, 1, 0, 0, 0, 1, 4 } },
+ { kDeviceNameDefault , Params{ 0, 1, 1, 1, 16, 16, 16, 16, 16, 64, 0, 0, 0, 0, 1, 1 } },
} },
}
},
diff --git a/src/database/kernels/xgemm_direct/xgemm_direct_32.hpp b/src/database/kernels/xgemm_direct/xgemm_direct_32.hpp
index 30e62429..511961cc 100644
--- a/src/database/kernels/xgemm_direct/xgemm_direct_32.hpp
+++ b/src/database/kernels/xgemm_direct/xgemm_direct_32.hpp
@@ -88,6 +88,14 @@ const DatabaseEntry XgemmDirectSingle = {
} },
}
},
+ { // Intel accelerators
+ kDeviceTypeAccelerator, "Intel", {
+ { "default", {
+ { Name{"Intel(R) FPGA Emulation Device "}, Params{ 2, 8, 32, 8, 8, 0, 1, 2, 1, 64, 0, 0, 0, 0, 0, 0 } },
+ { kDeviceNameDefault , Params{ 2, 8, 32, 8, 8, 0, 1, 2, 1, 64, 0, 0, 0, 0, 0, 0 } },
+ } },
+ }
+ },
{ // NVIDIA GPUs
kDeviceTypeGPU, "NVIDIA", {
{ "SM2.0", {
diff --git a/src/database/kernels/xgemm_direct/xgemm_direct_3232.hpp b/src/database/kernels/xgemm_direct/xgemm_direct_3232.hpp
index a4226d5e..739b93d9 100644
--- a/src/database/kernels/xgemm_direct/xgemm_direct_3232.hpp
+++ b/src/database/kernels/xgemm_direct/xgemm_direct_3232.hpp
@@ -82,6 +82,14 @@ const DatabaseEntry XgemmDirectComplexSingle = {
} },
}
},
+ { // Intel accelerators
+ kDeviceTypeAccelerator, "Intel", {
+ { "default", {
+ { Name{"Intel(R) FPGA Emulation Device "}, Params{ 2, 32, 32, 8, 8, 1, 1, 1, 2, 32, 0, 0, 0, 0, 0, 0 } },
+ { kDeviceNameDefault , Params{ 2, 32, 32, 8, 8, 1, 1, 1, 2, 32, 0, 0, 0, 0, 0, 0 } },
+ } },
+ }
+ },
{ // NVIDIA GPUs
kDeviceTypeGPU, "NVIDIA", {
{ "SM2.0", {
diff --git a/src/database/kernels/xgemv/xgemv_32.hpp b/src/database/kernels/xgemv/xgemv_32.hpp
index 34519760..6d68708f 100644
--- a/src/database/kernels/xgemv/xgemv_32.hpp
+++ b/src/database/kernels/xgemv/xgemv_32.hpp
@@ -111,8 +111,9 @@ const DatabaseEntry XgemvSingle = {
{ // Intel accelerators
kDeviceTypeAccelerator, "Intel", {
{ "default", {
+ { Name{"Intel(R) FPGA Emulation Device "}, Params{ 32, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 } },
{ Name{"Intel(R) Many Integrated Core Acceleration Card "}, Params{ 64, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 } },
- { kDeviceNameDefault , Params{ 64, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 } },
+ { kDeviceNameDefault , Params{ 64, 2, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 } },
} },
}
},
diff --git a/src/database/kernels/xgemv/xgemv_3232.hpp b/src/database/kernels/xgemv/xgemv_3232.hpp
index 1836c3fe..acfbe152 100644
--- a/src/database/kernels/xgemv/xgemv_3232.hpp
+++ b/src/database/kernels/xgemv/xgemv_3232.hpp
@@ -109,6 +109,7 @@ const DatabaseEntry XgemvComplexSingle = {
{ // Intel accelerators
kDeviceTypeAccelerator, "Intel", {
{ "default", {
+ { Name{"Intel(R) FPGA Emulation Device "}, Params{ 256, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 } },
{ Name{"Intel(R) Many Integrated Core Acceleration Card "}, Params{ 64, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 } },
{ kDeviceNameDefault , Params{ 64, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 } },
} },
diff --git a/src/database/kernels/xgemv_fast/xgemv_fast_32.hpp b/src/database/kernels/xgemv_fast/xgemv_fast_32.hpp
index 24658d31..89555c1f 100644
--- a/src/database/kernels/xgemv_fast/xgemv_fast_32.hpp
+++ b/src/database/kernels/xgemv_fast/xgemv_fast_32.hpp
@@ -111,6 +111,7 @@ const DatabaseEntry XgemvFastSingle = {
{ // Intel accelerators
kDeviceTypeAccelerator, "Intel", {
{ "default", {
+ { Name{"Intel(R) FPGA Emulation Device "}, Params{ 1, 32, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 } },
{ Name{"Intel(R) Many Integrated Core Acceleration Card "}, Params{ 1, 64, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 } },
{ kDeviceNameDefault , Params{ 1, 64, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 } },
} },
diff --git a/src/database/kernels/xgemv_fast/xgemv_fast_3232.hpp b/src/database/kernels/xgemv_fast/xgemv_fast_3232.hpp
index d41f943c..b38972ac 100644
--- a/src/database/kernels/xgemv_fast/xgemv_fast_3232.hpp
+++ b/src/database/kernels/xgemv_fast/xgemv_fast_3232.hpp
@@ -109,6 +109,7 @@ const DatabaseEntry XgemvFastComplexSingle = {
{ // Intel accelerators
kDeviceTypeAccelerator, "Intel", {
{ "default", {
+ { Name{"Intel(R) FPGA Emulation Device "}, Params{ 1, 128, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 } },
{ Name{"Intel(R) Many Integrated Core Acceleration Card "}, Params{ 1, 64, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 } },
{ kDeviceNameDefault , Params{ 1, 64, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 } },
} },
diff --git a/src/database/kernels/xgemv_fast_rot/xgemv_fast_rot_32.hpp b/src/database/kernels/xgemv_fast_rot/xgemv_fast_rot_32.hpp
index 80c1ee7d..dfcecebf 100644
--- a/src/database/kernels/xgemv_fast_rot/xgemv_fast_rot_32.hpp
+++ b/src/database/kernels/xgemv_fast_rot/xgemv_fast_rot_32.hpp
@@ -89,6 +89,14 @@ const DatabaseEntry XgemvFastRotSingle = {
} },
}
},
+ { // Intel accelerators
+ kDeviceTypeAccelerator, "Intel", {
+ { "default", {
+ { Name{"Intel(R) FPGA Emulation Device "}, Params{ 8, 16, 8, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 } },
+ { kDeviceNameDefault , Params{ 8, 16, 8, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 } },
+ } },
+ }
+ },
{ // NVIDIA GPUs
kDeviceTypeGPU, "NVIDIA", {
{ "SM2.0", {
diff --git a/src/database/kernels/xgemv_fast_rot/xgemv_fast_rot_3232.hpp b/src/database/kernels/xgemv_fast_rot/xgemv_fast_rot_3232.hpp
index 29d6caf3..d8eee271 100644
--- a/src/database/kernels/xgemv_fast_rot/xgemv_fast_rot_3232.hpp
+++ b/src/database/kernels/xgemv_fast_rot/xgemv_fast_rot_3232.hpp
@@ -87,6 +87,14 @@ const DatabaseEntry XgemvFastRotComplexSingle = {
} },
}
},
+ { // Intel accelerators
+ kDeviceTypeAccelerator, "Intel", {
+ { "default", {
+ { Name{"Intel(R) FPGA Emulation Device "}, Params{ 8, 16, 8, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 } },
+ { kDeviceNameDefault , Params{ 8, 16, 8, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 } },
+ } },
+ }
+ },
{ // NVIDIA GPUs
kDeviceTypeGPU, "NVIDIA", {
{ "SM2.0", {
diff --git a/src/database/kernels/xger/xger_32.hpp b/src/database/kernels/xger/xger_32.hpp
index c3fde8c3..857c69c7 100644
--- a/src/database/kernels/xger/xger_32.hpp
+++ b/src/database/kernels/xger/xger_32.hpp
@@ -112,6 +112,14 @@ const DatabaseEntry XgerSingle = {
} },
}
},
+ { // Intel accelerators
+ kDeviceTypeAccelerator, "Intel", {
+ { "default", {
+ { Name{"Intel(R) FPGA Emulation Device "}, Params{ 512, 8, 2, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 } },
+ { kDeviceNameDefault , Params{ 512, 8, 2, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 } },
+ } },
+ }
+ },
{ // NVIDIA GPUs
kDeviceTypeGPU, "NVIDIA", {
{ "SM2.0", {
diff --git a/src/database/kernels/xger/xger_3232.hpp b/src/database/kernels/xger/xger_3232.hpp
index 6f910c18..f98c439a 100644
--- a/src/database/kernels/xger/xger_3232.hpp
+++ b/src/database/kernels/xger/xger_3232.hpp
@@ -110,6 +110,14 @@ const DatabaseEntry XgerComplexSingle = {
} },
}
},
+ { // Intel accelerators
+ kDeviceTypeAccelerator, "Intel", {
+ { "default", {
+ { Name{"Intel(R) FPGA Emulation Device "}, Params{ 128, 4, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 } },
+ { kDeviceNameDefault , Params{ 128, 4, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 } },
+ } },
+ }
+ },
{ // NVIDIA GPUs
kDeviceTypeGPU, "NVIDIA", {
{ "SM2.0", {