summaryrefslogtreecommitdiff
path: root/src/database/kernels/xgemm/xgemm_64.hpp
diff options
context:
space:
mode:
Diffstat (limited to 'src/database/kernels/xgemm/xgemm_64.hpp')
-rw-r--r--src/database/kernels/xgemm/xgemm_64.hpp29
1 files changed, 24 insertions, 5 deletions
diff --git a/src/database/kernels/xgemm/xgemm_64.hpp b/src/database/kernels/xgemm/xgemm_64.hpp
index 1998d048..35bc204f 100644
--- a/src/database/kernels/xgemm/xgemm_64.hpp
+++ b/src/database/kernels/xgemm/xgemm_64.hpp
@@ -25,8 +25,9 @@ const DatabaseEntry XgemmDouble = {
{ kDeviceNameDefault , Params{ 0, 1, 32, 2, 8, 8, 32, 8, 8, 32, 0, 0, 0, 0, 4, 4 } },
} },
{ "Hawaii", {
+ { Name{"AMD FirePro W8100 "}, Params{ 0, 1, 32, 2, 16, 32, 64, 32, 8, 64, 1, 1, 1, 1, 2, 2 } },
{ Name{"AMD Radeon R9 290X "}, Params{ 0, 1, 16, 8, 32, 8, 128, 8, 8, 32, 0, 1, 0, 0, 1, 4 } },
- { kDeviceNameDefault , Params{ 0, 1, 16, 8, 32, 8, 128, 8, 8, 32, 0, 1, 0, 0, 1, 4 } },
+ { kDeviceNameDefault , Params{ 0, 1, 16, 2, 16, 8, 64, 8, 8, 32, 0, 1, 0, 0, 1, 2 } },
} },
{ "Oland", {
{ Name{"Oland "}, Params{ 0, 1, 16, 2, 8, 16, 64, 16, 8, 16, 0, 0, 1, 1, 1, 1 } },
@@ -75,6 +76,15 @@ const DatabaseEntry XgemmDouble = {
{ Name{"AMD Radeon Graphics "}, Params{ 0, 1, 32, 2, 16, 16, 64, 8, 8, 64, 1, 1, 0, 0, 4, 4 } },
{ kDeviceNameDefault , Params{ 0, 1, 32, 2, 16, 16, 64, 8, 8, 64, 1, 1, 0, 0, 4, 4 } },
} },
+ { "gfx902", {
+ { Name{"AMD Radeon(TM) Graphics "}, Params{ 0, 1, 16, 2, 16, 16, 32, 32, 16, 128, 1, 1, 1, 1, 1, 4 } },
+ { Name{"AMD Radeon(TM) RX Vega 10 Graphics "}, Params{ 0, 1, 32, 2, 16, 16, 64, 16, 16, 64, 1, 1, 0, 0, 4, 2 } },
+ { kDeviceNameDefault , Params{ 0, 1, 32, 2, 16, 16, 64, 16, 16, 64, 1, 1, 0, 0, 4, 4 } },
+ } },
+ { "gfx906:sramecc+:xnack-", {
+ { Name{"AMD Radeon VII "}, Params{ 0, 1, 32, 2, 16, 16, 64, 16, 16, 64, 1, 1, 0, 0, 4, 4 } },
+ { kDeviceNameDefault , Params{ 0, 1, 32, 2, 16, 16, 64, 16, 16, 64, 1, 1, 0, 0, 4, 4 } },
+ } },
{ "gfx90c", {
{ Name{"AMD Radeon(TM) Graphics "}, Params{ 0, 1, 16, 2, 16, 16, 64, 16, 16, 64, 1, 1, 0, 1, 2, 4 } },
{ kDeviceNameDefault , Params{ 0, 1, 16, 2, 16, 16, 64, 16, 16, 64, 1, 1, 0, 1, 2, 4 } },
@@ -168,6 +178,7 @@ const DatabaseEntry XgemmDouble = {
{ Name{"GeForce GTX 1070 Ti "}, Params{ 0, 1, 32, 2, 8, 8, 32, 16, 16, 32, 0, 0, 0, 0, 1, 2 } },
{ Name{"GeForce GTX 1080 "}, Params{ 0, 1, 32, 2, 16, 16, 32, 16, 16, 64, 0, 0, 0, 0, 2, 4 } },
{ Name{"GeForce GTX 1080 Ti "}, Params{ 0, 1, 16, 2, 16, 16, 16, 16, 16, 64, 0, 0, 1, 0, 1, 4 } },
+ { Name{"NVIDIA GeForce MX150 "}, Params{ 0, 1, 32, 2, 8, 8, 64, 8, 8, 16, 0, 0, 0, 0, 1, 1 } },
{ Name{"TITAN X (Pascal) "}, Params{ 0, 1, 32, 2, 32, 32, 32, 16, 16, 32, 0, 0, 0, 0, 1, 2 } },
{ kDeviceNameDefault , Params{ 0, 1, 32, 2, 16, 16, 32, 16, 16, 64, 0, 0, 0, 0, 2, 4 } },
} },
@@ -177,26 +188,34 @@ const DatabaseEntry XgemmDouble = {
{ kDeviceNameDefault , Params{ 0, 1, 32, 2, 8, 8, 32, 8, 8, 64, 0, 0, 0, 0, 2, 4 } },
} },
{ "SM7.5", {
+ { Name{"GeForce GTX 1650 "}, Params{ 1, 8, 1, 1, 4, 4, 32, 32, 32, 128, 0, 0, 0, 0, 4, 4 } },
+ { Name{"NVIDIA GeForce GTX 1650 Ti "}, Params{ 1, 2, 1, 1, 2, 2, 16, 16, 16, 64, 0, 0, 0, 0, 1, 2 } },
+ { Name{"NVIDIA GeForce RTX 2060 "}, Params{ 1, 8, 1, 1, 32, 32, 32, 4, 4, 32, 0, 0, 0, 0, 1, 8 } },
+ { Name{"NVIDIA GeForce RTX 2070 SUPER "}, Params{ 1, 16, 1, 1, 4, 4, 32, 8, 8, 16, 0, 0, 0, 0, 1, 2 } },
+ { Name{"NVIDIA GeForce RTX 2070 Super "}, Params{ 1, 16, 1, 1, 4, 4, 32, 8, 8, 16, 0, 0, 0, 0, 1, 2 } },
+ { Name{"NVIDIA GeForce RTX 2070 with Max-Q Design "}, Params{ 1, 8, 1, 1, 32, 32, 32, 4, 4, 32, 0, 0, 0, 0, 1, 8 } },
{ Name{"NVIDIA GeForce RTX 2080 Ti "}, Params{ 1, 1, 1, 1, 4, 4, 8, 16, 16, 16, 0, 0, 0, 0, 1, 1 } },
+ { Name{"NVIDIA GeForce RTX 2080 with Max-Q Design "}, Params{ 0, 1, 32, 2, 8, 8, 16, 8, 8, 16, 0, 0, 0, 0, 1, 1 } },
{ Name{"Quadro T2000 "}, Params{ 0, 1, 32, 2, 8, 16, 128, 8, 8, 64, 0, 0, 1, 1, 4, 4 } },
{ Name{"TITAN RTX "}, Params{ 1, 2, 1, 1, 16, 16, 32, 8, 8, 16, 0, 0, 0, 0, 2, 1 } },
{ Name{"Tesla T4 "}, Params{ 0, 1, 32, 2, 8, 16, 128, 8, 8, 64, 0, 0, 1, 1, 4, 4 } },
- { kDeviceNameDefault , Params{ 1, 1, 1, 1, 16, 16, 16, 16, 16, 32, 0, 0, 0, 0, 1, 1 } },
+ { kDeviceNameDefault , Params{ 1, 1, 1, 1, 8, 8, 32, 32, 32, 32, 0, 0, 0, 0, 1, 1 } },
} },
{ "SM8.0", {
{ Name{"A100-PCIE-40GB "}, Params{ 0, 1, 32, 2, 32, 32, 64, 8, 8, 32, 1, 1, 0, 0, 2, 2 } },
{ kDeviceNameDefault , Params{ 0, 1, 32, 2, 32, 32, 64, 8, 8, 32, 1, 1, 0, 0, 2, 2 } },
} },
{ "SM8.6", {
- { Name{"NVIDIA GeForce RTX 3060 Laptop GPU "}, Params{ 0, 1, 32, 2, 16, 8, 64, 16, 8, 16, 1, 1, 1, 0, 2, 1 } },
+ { Name{"NVIDIA GeForce RTX 3060 Laptop GPU "}, Params{ 1, 8, 1, 1, 32, 32, 32, 4, 4, 32, 0, 0, 0, 0, 1, 8 } },
{ Name{"NVIDIA GeForce RTX 3080 "}, Params{ 1, 16, 1, 1, 16, 16, 32, 8, 8, 8, 0, 0, 0, 0, 1, 1 } },
{ Name{"NVIDIA GeForce RTX 3080 Laptop GPU "}, Params{ 0, 1, 16, 2, 16, 16, 16, 8, 8, 64, 1, 0, 0, 0, 1, 4 } },
{ Name{"NVIDIA GeForce RTX 3090 "}, Params{ 0, 1, 32, 2, 8, 8, 16, 8, 8, 16, 1, 1, 0, 0, 1, 1 } },
{ kDeviceNameDefault , Params{ 1, 1, 1, 1, 8, 8, 32, 32, 32, 32, 0, 0, 0, 0, 1, 1 } },
} },
{ "SM8.9", {
+ { Name{"NVIDIA GeForce RTX 4080 "}, Params{ 1, 16, 1, 1, 8, 8, 16, 4, 4, 16, 0, 0, 0, 0, 2, 4 } },
{ Name{"NVIDIA GeForce RTX 4090 "}, Params{ 1, 4, 1, 1, 32, 32, 128, 16, 16, 64, 0, 0, 0, 0, 1, 2 } },
- { kDeviceNameDefault , Params{ 1, 4, 1, 1, 32, 32, 128, 16, 16, 64, 0, 0, 0, 0, 1, 2 } },
+ { kDeviceNameDefault , Params{ 1, 16, 1, 1, 8, 8, 16, 4, 4, 16, 0, 0, 0, 0, 2, 4 } },
} },
{ "default", {
{ kDeviceNameDefault , Params{ 0, 1, 32, 2, 8, 8, 16, 8, 8, 16, 1, 1, 0, 0, 2, 2 } },
@@ -206,7 +225,7 @@ const DatabaseEntry XgemmDouble = {
{ // Default
kDeviceTypeAll, "default", {
{ "default", {
- { kDeviceNameDefault , Params{ 0, 1, 32, 2, 16, 16, 16, 8, 8, 32, 1, 1, 0, 0, 1, 4 } },
+ { kDeviceNameDefault , Params{ 0, 1, 32, 2, 8, 8, 16, 8, 8, 32, 1, 1, 0, 0, 2, 4 } },
} },
}
},