summaryrefslogtreecommitdiff
path: root/src/database/kernels/xgemm
diff options
context:
space:
mode:
Diffstat (limited to 'src/database/kernels/xgemm')
-rw-r--r--src/database/kernels/xgemm/xgemm_16.hpp13
-rw-r--r--src/database/kernels/xgemm/xgemm_32.hpp17
-rw-r--r--src/database/kernels/xgemm/xgemm_3232.hpp19
-rw-r--r--src/database/kernels/xgemm/xgemm_64.hpp13
-rw-r--r--src/database/kernels/xgemm/xgemm_6464.hpp15
5 files changed, 71 insertions, 6 deletions
diff --git a/src/database/kernels/xgemm/xgemm_16.hpp b/src/database/kernels/xgemm/xgemm_16.hpp
index da458699..f683376c 100644
--- a/src/database/kernels/xgemm/xgemm_16.hpp
+++ b/src/database/kernels/xgemm/xgemm_16.hpp
@@ -17,6 +17,7 @@ const DatabaseEntry XgemmHalf = {
{ "Ellesmere", {
{ Name{"AMD Radeon RX 480 "}, Params{ 0, 1, 32, 2, 8, 8, 64, 16, 16, 64, 1, 1, 0, 0, 4, 4 } },
{ Name{"AMD Radeon RX 580 2048SP "}, Params{ 0, 1, 16, 2, 16, 16, 128, 16, 16, 128, 1, 1, 1, 1, 8, 1 } },
+ { Name{"AMD Radeon RX590 GME "}, Params{ 0, 1, 16, 2, 16, 16, 128, 16, 16, 128, 1, 1, 1, 1, 8, 1 } },
{ kDeviceNameDefault , Params{ 0, 1, 32, 2, 16, 16, 64, 16, 16, 64, 1, 1, 0, 0, 4, 1 } },
} },
{ "default", {
@@ -48,6 +49,14 @@ const DatabaseEntry XgemmHalf = {
{ Name{"AMD Radeon Graphics "}, Params{ 0, 1, 16, 2, 8, 8, 64, 8, 8, 128, 1, 1, 1, 0, 2, 1 } },
{ kDeviceNameDefault , Params{ 0, 1, 16, 2, 8, 8, 64, 8, 8, 128, 1, 1, 1, 0, 2, 1 } },
} },
+ { "gfx1100", {
+ { Name{"Radeon RX 7900 XTX "}, Params{ 0, 1, 32, 2, 8, 8, 64, 16, 16, 64, 1, 1, 0, 0, 4, 4 } },
+ { kDeviceNameDefault , Params{ 0, 1, 32, 2, 8, 8, 64, 16, 16, 64, 1, 1, 0, 0, 4, 4 } },
+ } },
+ { "gfx1102", {
+ { Name{"AMD Radeon RX 7600 "}, Params{ 0, 1, 32, 2, 16, 8, 64, 16, 8, 128, 1, 1, 0, 1, 4, 8 } },
+ { kDeviceNameDefault , Params{ 0, 1, 32, 2, 16, 8, 64, 16, 8, 128, 1, 1, 0, 1, 4, 8 } },
+ } },
{ "gfx902", {
{ Name{"AMD Radeon(TM) Graphics "}, Params{ 0, 1, 32, 2, 16, 16, 64, 8, 8, 64, 1, 1, 0, 0, 4, 4 } },
{ Name{"AMD Radeon(TM) RX Vega 10 Graphics "}, Params{ 0, 1, 32, 2, 8, 8, 128, 16, 32, 128, 1, 1, 1, 1, 4, 2 } },
@@ -98,6 +107,10 @@ const DatabaseEntry XgemmHalf = {
{ Name{"QUALCOMM Adreno(TM) "}, Params{ 0, 1, 32, 2, 8, 8, 64, 8, 8, 64, 1, 1, 0, 0, 4, 4 } },
{ kDeviceNameDefault , Params{ 0, 1, 32, 2, 8, 8, 64, 8, 8, 64, 1, 1, 0, 0, 4, 4 } },
} },
+ { "OpenCL C 2.0 Adreno(TM) 640", {
+ { Name{"QUALCOMM Adreno(TM) "}, Params{ 0, 1, 32, 2, 8, 8, 32, 8, 8, 64, 0, 0, 0, 0, 4, 4 } },
+ { kDeviceNameDefault , Params{ 0, 1, 32, 2, 8, 8, 32, 8, 8, 64, 0, 0, 0, 0, 4, 4 } },
+ } },
{ "OpenCL C 3.0 Adreno(TM) 730", {
{ Name{"QUALCOMM Adreno(TM) "}, Params{ 0, 1, 32, 2, 32, 32, 128, 8, 8, 128, 0, 0, 0, 1, 2, 8 } },
{ kDeviceNameDefault , Params{ 0, 1, 32, 2, 32, 32, 128, 8, 8, 128, 0, 0, 0, 1, 2, 8 } },
diff --git a/src/database/kernels/xgemm/xgemm_32.hpp b/src/database/kernels/xgemm/xgemm_32.hpp
index 7913e9ab..209afd04 100644
--- a/src/database/kernels/xgemm/xgemm_32.hpp
+++ b/src/database/kernels/xgemm/xgemm_32.hpp
@@ -17,7 +17,8 @@ const DatabaseEntry XgemmSingle = {
{ "Ellesmere", {
{ Name{"AMD Radeon RX 480 "}, Params{ 0, 1, 32, 2, 8, 8, 16, 16, 16, 64, 1, 1, 0, 0, 1, 2 } },
{ Name{"AMD Radeon RX 580 2048SP "}, Params{ 0, 1, 16, 2, 32, 32, 128, 16, 8, 128, 1, 1, 1, 1, 2, 4 } },
- { kDeviceNameDefault , Params{ 0, 1, 32, 2, 16, 16, 64, 8, 8, 64, 1, 1, 0, 0, 4, 2 } },
+ { Name{"AMD Radeon RX590 GME "}, Params{ 0, 1, 32, 2, 16, 16, 64, 32, 16, 128, 1, 1, 0, 1, 4, 4 } },
+ { kDeviceNameDefault , Params{ 0, 1, 32, 2, 8, 8, 64, 16, 16, 64, 1, 1, 0, 0, 4, 4 } },
} },
{ "Fiji", {
{ Name{"AMD Radeon R9 Fury X "}, Params{ 0, 1, 32, 2, 16, 16, 64, 16, 16, 64, 1, 1, 0, 0, 4, 4 } },
@@ -88,6 +89,14 @@ const DatabaseEntry XgemmSingle = {
{ Name{"AMD Radeon Graphics "}, Params{ 0, 1, 16, 2, 8, 16, 32, 32, 8, 128, 1, 1, 0, 0, 2, 1 } },
{ kDeviceNameDefault , Params{ 0, 1, 16, 2, 8, 16, 32, 32, 8, 128, 1, 1, 0, 0, 2, 1 } },
} },
+ { "gfx1100", {
+ { Name{"Radeon RX 7900 XTX "}, Params{ 0, 1, 32, 2, 16, 16, 64, 8, 8, 32, 0, 1, 1, 0, 4, 4 } },
+ { kDeviceNameDefault , Params{ 0, 1, 32, 2, 16, 16, 64, 8, 8, 32, 0, 1, 1, 0, 4, 4 } },
+ } },
+ { "gfx1102", {
+ { Name{"AMD Radeon RX 7600 "}, Params{ 0, 1, 32, 2, 16, 16, 64, 32, 8, 128, 0, 1, 1, 0, 1, 2 } },
+ { kDeviceNameDefault , Params{ 0, 1, 32, 2, 16, 16, 64, 32, 8, 128, 0, 1, 1, 0, 1, 2 } },
+ } },
{ "gfx902", {
{ Name{"AMD Radeon(TM) Graphics "}, Params{ 0, 1, 16, 2, 32, 32, 128, 16, 8, 128, 1, 1, 1, 1, 2, 4 } },
{ Name{"AMD Radeon(TM) RX Vega 10 Graphics "}, Params{ 0, 1, 32, 2, 8, 8, 128, 16, 32, 128, 1, 1, 1, 1, 4, 2 } },
@@ -247,7 +256,9 @@ const DatabaseEntry XgemmSingle = {
{ kDeviceNameDefault , Params{ 0, 1, 32, 2, 8, 8, 32, 16, 16, 64, 1, 1, 0, 0, 4, 4 } },
} },
{ "SM8.6", {
+ { Name{"NVIDIA GeForce RTX 3050 Ti Laptop GPU "}, Params{ 0, 1, 32, 2, 16, 16, 64, 8, 8, 64, 1, 1, 0, 0, 4, 4 } },
{ Name{"NVIDIA GeForce RTX 3060 Laptop GPU "}, Params{ 0, 1, 32, 2, 8, 8, 64, 32, 16, 128, 1, 1, 1, 1, 2, 2 } },
+ { Name{"NVIDIA GeForce RTX 3070 Ti Laptop GPU "}, Params{ 0, 1, 16, 2, 8, 8, 32, 8, 16, 128, 1, 0, 1, 1, 4, 8 } },
{ Name{"NVIDIA GeForce RTX 3080 "}, Params{ 0, 1, 32, 2, 8, 8, 64, 32, 16, 128, 1, 1, 1, 1, 2, 2 } },
{ Name{"NVIDIA GeForce RTX 3080 Laptop GPU "}, Params{ 0, 1, 16, 2, 8, 8, 32, 8, 16, 128, 1, 0, 1, 1, 4, 8 } },
{ Name{"NVIDIA GeForce RTX 3090 "}, Params{ 0, 1, 32, 2, 16, 16, 64, 8, 8, 64, 1, 1, 0, 0, 4, 4 } },
@@ -269,6 +280,10 @@ const DatabaseEntry XgemmSingle = {
{ Name{"QUALCOMM Adreno(TM) "}, Params{ 0, 1, 32, 2, 8, 8, 32, 8, 8, 64, 1, 1, 0, 0, 4, 4 } },
{ kDeviceNameDefault , Params{ 0, 1, 32, 2, 8, 8, 32, 8, 8, 32, 1, 1, 0, 0, 4, 4 } },
} },
+ { "OpenCL C 2.0 Adreno(TM) 640", {
+ { Name{"QUALCOMM Adreno(TM) "}, Params{ 0, 1, 32, 2, 16, 16, 64, 8, 8, 64, 0, 0, 0, 0, 4, 4 } },
+ { kDeviceNameDefault , Params{ 0, 1, 32, 2, 16, 16, 64, 8, 8, 64, 0, 0, 0, 0, 4, 4 } },
+ } },
{ "OpenCL C 3.0 Adreno(TM) 730", {
{ Name{"QUALCOMM Adreno(TM) "}, Params{ 0, 1, 32, 2, 16, 16, 64, 8, 8, 128, 0, 0, 1, 0, 2, 4 } },
{ kDeviceNameDefault , Params{ 0, 1, 32, 2, 16, 16, 64, 8, 8, 128, 0, 0, 1, 0, 2, 4 } },
diff --git a/src/database/kernels/xgemm/xgemm_3232.hpp b/src/database/kernels/xgemm/xgemm_3232.hpp
index ba2d0d9e..9102a9bf 100644
--- a/src/database/kernels/xgemm/xgemm_3232.hpp
+++ b/src/database/kernels/xgemm/xgemm_3232.hpp
@@ -17,7 +17,8 @@ const DatabaseEntry XgemmComplexSingle = {
{ "Ellesmere", {
{ Name{"AMD Radeon RX 480 "}, Params{ 0, 1, 32, 2, 16, 16, 32, 8, 8, 32, 1, 1, 0, 0, 1, 4 } },
{ Name{"AMD Radeon RX 580 2048SP "}, Params{ 0, 1, 16, 2, 16, 16, 32, 32, 16, 128, 1, 1, 1, 1, 1, 4 } },
- { kDeviceNameDefault , Params{ 0, 1, 32, 2, 16, 16, 32, 8, 8, 32, 1, 1, 0, 0, 1, 4 } },
+ { Name{"AMD Radeon RX590 GME "}, Params{ 0, 1, 32, 2, 16, 16, 64, 16, 16, 64, 1, 1, 0, 0, 4, 4 } },
+ { kDeviceNameDefault , Params{ 0, 1, 32, 2, 16, 16, 64, 16, 16, 64, 1, 1, 0, 0, 4, 4 } },
} },
{ "Fiji", {
{ Name{"AMD Radeon R9 Fury X "}, Params{ 0, 1, 32, 2, 16, 16, 32, 16, 16, 32, 1, 1, 0, 0, 1, 2 } },
@@ -84,6 +85,14 @@ const DatabaseEntry XgemmComplexSingle = {
{ Name{"AMD Radeon Graphics "}, Params{ 0, 1, 16, 2, 8, 16, 64, 32, 8, 64, 1, 1, 0, 0, 2, 1 } },
{ kDeviceNameDefault , Params{ 0, 1, 16, 2, 8, 16, 64, 32, 8, 64, 1, 1, 0, 0, 2, 1 } },
} },
+ { "gfx1100", {
+ { Name{"Radeon RX 7900 XTX "}, Params{ 0, 1, 32, 2, 8, 8, 32, 8, 16, 64, 1, 0, 1, 1, 4, 4 } },
+ { kDeviceNameDefault , Params{ 0, 1, 32, 2, 8, 8, 32, 8, 16, 64, 1, 0, 1, 1, 4, 4 } },
+ } },
+ { "gfx1102", {
+ { Name{"AMD Radeon RX 7600 "}, Params{ 0, 1, 16, 2, 32, 32, 64, 16, 8, 128, 0, 0, 1, 1, 2, 2 } },
+ { kDeviceNameDefault , Params{ 0, 1, 16, 2, 32, 32, 64, 16, 8, 128, 0, 0, 1, 1, 2, 2 } },
+ } },
{ "gfx902", {
{ Name{"AMD Radeon(TM) Graphics "}, Params{ 0, 1, 16, 2, 16, 16, 32, 32, 16, 128, 1, 1, 1, 1, 1, 4 } },
{ Name{"AMD Radeon(TM) RX Vega 10 Graphics "}, Params{ 0, 1, 32, 2, 16, 16, 64, 16, 16, 64, 1, 1, 0, 0, 4, 1 } },
@@ -240,11 +249,13 @@ const DatabaseEntry XgemmComplexSingle = {
{ kDeviceNameDefault , Params{ 0, 1, 32, 2, 8, 8, 16, 16, 16, 32, 1, 1, 0, 0, 2, 2 } },
} },
{ "SM8.6", {
+ { Name{"NVIDIA GeForce RTX 3050 Ti Laptop GPU "}, Params{ 0, 1, 16, 2, 16, 8, 64, 8, 16, 64, 1, 1, 1, 1, 1, 4 } },
{ Name{"NVIDIA GeForce RTX 3060 Laptop GPU "}, Params{ 0, 1, 32, 2, 8, 8, 32, 16, 16, 128, 0, 1, 1, 1, 4, 1 } },
+ { Name{"NVIDIA GeForce RTX 3070 Ti Laptop GPU "}, Params{ 0, 1, 32, 2, 8, 8, 32, 16, 16, 128, 0, 1, 1, 1, 4, 1 } },
{ Name{"NVIDIA GeForce RTX 3080 "}, Params{ 1, 8, 1, 1, 8, 8, 64, 8, 8, 64, 0, 0, 0, 0, 4, 8 } },
{ Name{"NVIDIA GeForce RTX 3080 Laptop GPU "}, Params{ 1, 16, 1, 1, 16, 16, 64, 4, 4, 32, 0, 0, 0, 0, 1, 8 } },
{ Name{"NVIDIA GeForce RTX 3090 "}, Params{ 1, 4, 1, 1, 8, 8, 32, 16, 16, 128, 0, 0, 0, 0, 4, 2 } },
- { kDeviceNameDefault , Params{ 0, 1, 32, 2, 8, 8, 16, 8, 8, 16, 1, 1, 0, 0, 2, 1 } },
+ { kDeviceNameDefault , Params{ 0, 1, 32, 2, 8, 8, 16, 8, 8, 16, 0, 0, 0, 0, 1, 2 } },
} },
{ "SM8.9", {
{ Name{"NVIDIA GeForce RTX 4080 "}, Params{ 1, 16, 1, 1, 16, 16, 64, 4, 4, 32, 0, 0, 0, 0, 1, 8 } },
@@ -262,6 +273,10 @@ const DatabaseEntry XgemmComplexSingle = {
{ Name{"QUALCOMM Adreno(TM) "}, Params{ 0, 1, 32, 2, 8, 8, 64, 16, 16, 64, 0, 0, 0, 0, 1, 1 } },
{ kDeviceNameDefault , Params{ 0, 1, 32, 2, 8, 8, 64, 16, 16, 64, 0, 0, 0, 0, 1, 1 } },
} },
+ { "OpenCL C 2.0 Adreno(TM) 640", {
+ { Name{"QUALCOMM Adreno(TM) "}, Params{ 0, 1, 32, 2, 16, 16, 32, 8, 8, 64, 0, 0, 0, 0, 1, 4 } },
+ { kDeviceNameDefault , Params{ 0, 1, 32, 2, 16, 16, 32, 8, 8, 64, 0, 0, 0, 0, 1, 4 } },
+ } },
}
},
{ // Default
diff --git a/src/database/kernels/xgemm/xgemm_64.hpp b/src/database/kernels/xgemm/xgemm_64.hpp
index 35bc204f..b04c0328 100644
--- a/src/database/kernels/xgemm/xgemm_64.hpp
+++ b/src/database/kernels/xgemm/xgemm_64.hpp
@@ -17,7 +17,8 @@ const DatabaseEntry XgemmDouble = {
{ "Ellesmere", {
{ Name{"AMD Radeon RX 480 "}, Params{ 0, 1, 32, 2, 16, 16, 32, 16, 16, 64, 1, 1, 0, 0, 2, 2 } },
{ Name{"AMD Radeon RX 580 2048SP "}, Params{ 0, 1, 16, 2, 16, 16, 64, 16, 16, 64, 1, 1, 0, 1, 2, 4 } },
- { kDeviceNameDefault , Params{ 0, 1, 32, 2, 16, 16, 32, 16, 16, 64, 1, 1, 0, 0, 2, 2 } },
+ { Name{"AMD Radeon RX590 GME "}, Params{ 0, 1, 32, 2, 16, 16, 32, 16, 16, 32, 1, 1, 0, 0, 2, 2 } },
+ { kDeviceNameDefault , Params{ 0, 1, 32, 2, 16, 16, 32, 16, 16, 32, 1, 1, 0, 0, 2, 2 } },
} },
{ "Fiji", {
{ Name{"AMD Radeon R9 Fury X "}, Params{ 0, 1, 32, 2, 16, 16, 32, 16, 16, 32, 1, 1, 0, 0, 2, 2 } },
@@ -76,6 +77,14 @@ const DatabaseEntry XgemmDouble = {
{ Name{"AMD Radeon Graphics "}, Params{ 0, 1, 32, 2, 16, 16, 64, 8, 8, 64, 1, 1, 0, 0, 4, 4 } },
{ kDeviceNameDefault , Params{ 0, 1, 32, 2, 16, 16, 64, 8, 8, 64, 1, 1, 0, 0, 4, 4 } },
} },
+ { "gfx1100", {
+ { Name{"Radeon RX 7900 XTX "}, Params{ 0, 1, 32, 2, 16, 8, 32, 8, 8, 16, 0, 1, 0, 1, 1, 2 } },
+ { kDeviceNameDefault , Params{ 0, 1, 32, 2, 16, 8, 32, 8, 8, 16, 0, 1, 0, 1, 1, 2 } },
+ } },
+ { "gfx1102", {
+ { Name{"AMD Radeon RX 7600 "}, Params{ 0, 1, 32, 2, 8, 8, 64, 16, 16, 64, 1, 1, 0, 0, 4, 2 } },
+ { kDeviceNameDefault , Params{ 0, 1, 32, 2, 8, 8, 64, 16, 16, 64, 1, 1, 0, 0, 4, 2 } },
+ } },
{ "gfx902", {
{ Name{"AMD Radeon(TM) Graphics "}, Params{ 0, 1, 16, 2, 16, 16, 32, 32, 16, 128, 1, 1, 1, 1, 1, 4 } },
{ Name{"AMD Radeon(TM) RX Vega 10 Graphics "}, Params{ 0, 1, 32, 2, 16, 16, 64, 16, 16, 64, 1, 1, 0, 0, 4, 2 } },
@@ -206,7 +215,9 @@ const DatabaseEntry XgemmDouble = {
{ kDeviceNameDefault , Params{ 0, 1, 32, 2, 32, 32, 64, 8, 8, 32, 1, 1, 0, 0, 2, 2 } },
} },
{ "SM8.6", {
+ { Name{"NVIDIA GeForce RTX 3050 Ti Laptop GPU "}, Params{ 0, 1, 32, 2, 32, 32, 64, 16, 16, 64, 0, 1, 0, 0, 1, 1 } },
{ Name{"NVIDIA GeForce RTX 3060 Laptop GPU "}, Params{ 1, 8, 1, 1, 32, 32, 32, 4, 4, 32, 0, 0, 0, 0, 1, 8 } },
+ { Name{"NVIDIA GeForce RTX 3070 Ti Laptop GPU "}, Params{ 0, 1, 32, 2, 8, 8, 16, 16, 16, 32, 1, 1, 0, 0, 2, 2 } },
{ Name{"NVIDIA GeForce RTX 3080 "}, Params{ 1, 16, 1, 1, 16, 16, 32, 8, 8, 8, 0, 0, 0, 0, 1, 1 } },
{ Name{"NVIDIA GeForce RTX 3080 Laptop GPU "}, Params{ 0, 1, 16, 2, 16, 16, 16, 8, 8, 64, 1, 0, 0, 0, 1, 4 } },
{ Name{"NVIDIA GeForce RTX 3090 "}, Params{ 0, 1, 32, 2, 8, 8, 16, 8, 8, 16, 1, 1, 0, 0, 1, 1 } },
diff --git a/src/database/kernels/xgemm/xgemm_6464.hpp b/src/database/kernels/xgemm/xgemm_6464.hpp
index 48357083..a48dee39 100644
--- a/src/database/kernels/xgemm/xgemm_6464.hpp
+++ b/src/database/kernels/xgemm/xgemm_6464.hpp
@@ -17,6 +17,7 @@ const DatabaseEntry XgemmComplexDouble = {
{ "Ellesmere", {
{ Name{"AMD Radeon RX 480 "}, Params{ 0, 1, 32, 2, 16, 16, 16, 16, 16, 16, 1, 1, 0, 0, 1, 1 } },
{ Name{"AMD Radeon RX 580 2048SP "}, Params{ 0, 1, 32, 2, 16, 16, 32, 16, 16, 32, 1, 1, 0, 0, 2, 1 } },
+ { Name{"AMD Radeon RX590 GME "}, Params{ 0, 1, 32, 2, 16, 16, 16, 16, 16, 16, 1, 1, 0, 0, 1, 1 } },
{ kDeviceNameDefault , Params{ 0, 1, 32, 2, 16, 16, 16, 16, 16, 16, 1, 1, 0, 0, 1, 1 } },
} },
{ "Fiji", {
@@ -76,6 +77,14 @@ const DatabaseEntry XgemmComplexDouble = {
{ Name{"AMD Radeon Graphics "}, Params{ 1, 2, 1, 1, 4, 4, 32, 8, 8, 32, 0, 0, 0, 0, 8, 2 } },
{ kDeviceNameDefault , Params{ 1, 2, 1, 1, 4, 4, 32, 8, 8, 32, 0, 0, 0, 0, 8, 2 } },
} },
+ { "gfx1100", {
+ { Name{"Radeon RX 7900 XTX "}, Params{ 0, 1, 32, 2, 16, 16, 32, 8, 8, 16, 1, 1, 0, 0, 2, 1 } },
+ { kDeviceNameDefault , Params{ 0, 1, 32, 2, 16, 16, 32, 8, 8, 16, 1, 1, 0, 0, 2, 1 } },
+ } },
+ { "gfx1102", {
+ { Name{"AMD Radeon RX 7600 "}, Params{ 0, 1, 16, 2, 8, 8, 32, 8, 8, 32, 1, 1, 0, 1, 4, 1 } },
+ { kDeviceNameDefault , Params{ 0, 1, 16, 2, 8, 8, 32, 8, 8, 32, 1, 1, 0, 1, 4, 1 } },
+ } },
{ "gfx902", {
{ Name{"AMD Radeon(TM) Graphics "}, Params{ 0, 1, 32, 2, 16, 16, 16, 16, 16, 16, 1, 1, 0, 0, 1, 1 } },
{ Name{"AMD Radeon(TM) RX Vega 10 Graphics "}, Params{ 0, 1, 32, 2, 16, 16, 16, 16, 16, 16, 1, 1, 0, 0, 1, 1 } },
@@ -205,11 +214,13 @@ const DatabaseEntry XgemmComplexDouble = {
{ kDeviceNameDefault , Params{ 0, 1, 16, 2, 8, 8, 16, 32, 16, 32, 1, 1, 1, 1, 2, 1 } },
} },
{ "SM8.6", {
+ { Name{"NVIDIA GeForce RTX 3050 Ti Laptop GPU "}, Params{ 0, 1, 32, 2, 8, 8, 16, 8, 8, 16, 1, 1, 0, 0, 1, 2 } },
{ Name{"NVIDIA GeForce RTX 3060 Laptop GPU "}, Params{ 0, 1, 32, 2, 8, 8, 16, 16, 16, 16, 1, 1, 0, 0, 2, 1 } },
+ { Name{"NVIDIA GeForce RTX 3070 Ti Laptop GPU "}, Params{ 1, 16, 1, 1, 16, 16, 32, 8, 8, 8, 0, 0, 0, 0, 1, 1 } },
{ Name{"NVIDIA GeForce RTX 3080 "}, Params{ 0, 1, 32, 2, 8, 8, 16, 8, 8, 16, 1, 1, 0, 0, 1, 2 } },
{ Name{"NVIDIA GeForce RTX 3080 Laptop GPU "}, Params{ 0, 1, 32, 2, 8, 8, 16, 8, 8, 16, 1, 1, 0, 0, 2, 1 } },
{ Name{"NVIDIA GeForce RTX 3090 "}, Params{ 0, 1, 32, 2, 8, 8, 16, 8, 8, 16, 1, 1, 0, 0, 1, 1 } },
- { kDeviceNameDefault , Params{ 0, 1, 32, 2, 8, 8, 16, 8, 8, 16, 1, 1, 0, 0, 2, 1 } },
+ { kDeviceNameDefault , Params{ 1, 1, 1, 1, 8, 8, 32, 32, 32, 32, 0, 0, 0, 0, 1, 1 } },
} },
{ "SM8.9", {
{ Name{"NVIDIA GeForce RTX 4080 "}, Params{ 0, 1, 32, 2, 16, 16, 32, 8, 8, 16, 1, 1, 0, 0, 2, 2 } },
@@ -217,7 +228,7 @@ const DatabaseEntry XgemmComplexDouble = {
{ kDeviceNameDefault , Params{ 1, 1, 1, 1, 16, 16, 32, 16, 16, 16, 0, 0, 0, 0, 1, 1 } },
} },
{ "default", {
- { kDeviceNameDefault , Params{ 0, 1, 32, 2, 16, 16, 32, 16, 16, 64, 0, 0, 0, 0, 2, 2 } },
+ { kDeviceNameDefault , Params{ 0, 1, 32, 2, 16, 16, 16, 8, 8, 16, 1, 1, 0, 0, 1, 2 } },
} },
}
},