diff options
Diffstat (limited to 'src/database/kernels/xgemm/xgemm_32.hpp')
-rw-r--r-- | src/database/kernels/xgemm/xgemm_32.hpp | 11 |
1 files changed, 9 insertions, 2 deletions
diff --git a/src/database/kernels/xgemm/xgemm_32.hpp b/src/database/kernels/xgemm/xgemm_32.hpp index 209afd04..e628aa3b 100644 --- a/src/database/kernels/xgemm/xgemm_32.hpp +++ b/src/database/kernels/xgemm/xgemm_32.hpp @@ -125,7 +125,8 @@ const DatabaseEntry XgemmSingle = { kDeviceTypeGPU, "Apple", { { "default", { { Name{"Apple M1 "}, Params{ 1, 8, 1, 1, 32, 32, 64, 8, 8, 128, 0, 0, 0, 0, 2, 4 } }, - { kDeviceNameDefault , Params{ 1, 8, 1, 1, 32, 32, 64, 8, 8, 128, 0, 0, 0, 0, 2, 4 } }, + { Name{"Apple M2 Max "}, Params{ 0, 1, 32, 2, 16, 16, 32, 8, 8, 32, 1, 1, 0, 0, 2, 2 } }, + { kDeviceNameDefault , Params{ 0, 1, 32, 2, 16, 16, 32, 8, 8, 32, 1, 1, 0, 0, 2, 2 } }, } }, } }, @@ -167,6 +168,7 @@ const DatabaseEntry XgemmSingle = { { Name{"Intel(R) HD Graphics IvyBridge M GT2 "}, Params{ 0, 1, 32, 2, 16, 16, 64, 8, 8, 64, 1, 1, 0, 0, 4, 4 } }, { Name{"Intel(R) HD Graphics Skylake ULT GT2 "}, Params{ 1, 2, 1, 1, 4, 4, 32, 8, 8, 64, 0, 0, 0, 0, 2, 2 } }, { Name{"Intel(R) Iris(R) Xe Graphics "}, Params{ 0, 1, 16, 2, 8, 8, 64, 16, 8, 64, 1, 1, 0, 1, 1, 2 } }, + { Name{"Intel(R) RaptorLake-S Mobile Graphics Controller "}, Params{ 0, 1, 16, 2, 16, 16, 64, 16, 8, 128, 1, 1, 0, 1, 1, 8 } }, { Name{"Intel(R) UHD Graphics 620 "}, Params{ 1, 4, 1, 1, 16, 16, 64, 8, 8, 64, 0, 0, 0, 0, 4, 4 } }, { Name{"Intel(R) UHD Graphics 770 "}, Params{ 0, 1, 32, 2, 8, 16, 64, 8, 8, 128, 1, 1, 0, 1, 1, 8 } }, { Name{"Iris "}, Params{ 0, 1, 16, 8, 16, 8, 128, 32, 16, 64, 1, 1, 1, 1, 4, 1 } }, @@ -239,6 +241,7 @@ const DatabaseEntry XgemmSingle = { } }, { "SM7.5", { { Name{"GeForce GTX 1650 "}, Params{ 0, 1, 16, 2, 32, 8, 128, 32, 16, 128, 1, 1, 1, 0, 4, 1 } }, + { Name{"NVIDIA GeForce GTX 1650 SUPER "}, Params{ 0, 1, 32, 2, 8, 8, 64, 32, 16, 128, 1, 1, 1, 1, 2, 2 } }, { Name{"NVIDIA GeForce GTX 1650 Ti "}, Params{ 0, 1, 16, 2, 32, 8, 128, 32, 16, 128, 1, 1, 1, 0, 4, 1 } }, { Name{"NVIDIA GeForce RTX 2060 "}, Params{ 1, 8, 1, 1, 8, 8, 64, 8, 8, 64, 0, 0, 0, 0, 4, 8 } }, { Name{"NVIDIA GeForce RTX 2070 SUPER "}, Params{ 0, 1, 16, 2, 8, 8, 32, 32, 16, 128, 0, 1, 1, 1, 2, 2 } }, @@ -249,7 +252,7 @@ const DatabaseEntry XgemmSingle = { { Name{"Quadro T2000 "}, Params{ 0, 1, 16, 2, 16, 16, 128, 32, 16, 128, 1, 1, 1, 1, 1, 2 } }, { Name{"TITAN RTX "}, Params{ 0, 1, 32, 2, 8, 32, 128, 16, 8, 128, 1, 1, 1, 1, 2, 2 } }, { Name{"Tesla T4 "}, Params{ 0, 1, 16, 2, 16, 16, 128, 32, 16, 128, 1, 1, 1, 1, 1, 2 } }, - { kDeviceNameDefault , Params{ 1, 2, 1, 1, 16, 16, 64, 4, 4, 64, 0, 0, 0, 0, 1, 1 } }, + { kDeviceNameDefault , Params{ 1, 4, 1, 1, 4, 4, 64, 8, 8, 32, 0, 0, 0, 0, 4, 4 } }, } }, { "SM8.0", { { Name{"A100-PCIE-40GB "}, Params{ 0, 1, 32, 2, 8, 8, 32, 16, 16, 64, 1, 1, 0, 0, 4, 4 } }, @@ -258,13 +261,17 @@ const DatabaseEntry XgemmSingle = { { "SM8.6", { { Name{"NVIDIA GeForce RTX 3050 Ti Laptop GPU "}, Params{ 0, 1, 32, 2, 16, 16, 64, 8, 8, 64, 1, 1, 0, 0, 4, 4 } }, { Name{"NVIDIA GeForce RTX 3060 Laptop GPU "}, Params{ 0, 1, 32, 2, 8, 8, 64, 32, 16, 128, 1, 1, 1, 1, 2, 2 } }, + { Name{"NVIDIA GeForce RTX 3070 "}, Params{ 0, 1, 32, 2, 8, 8, 64, 32, 16, 128, 1, 1, 1, 1, 2, 2 } }, { Name{"NVIDIA GeForce RTX 3070 Ti Laptop GPU "}, Params{ 0, 1, 16, 2, 8, 8, 32, 8, 16, 128, 1, 0, 1, 1, 4, 8 } }, { Name{"NVIDIA GeForce RTX 3080 "}, Params{ 0, 1, 32, 2, 8, 8, 64, 32, 16, 128, 1, 1, 1, 1, 2, 2 } }, { Name{"NVIDIA GeForce RTX 3080 Laptop GPU "}, Params{ 0, 1, 16, 2, 8, 8, 32, 8, 16, 128, 1, 0, 1, 1, 4, 8 } }, + { Name{"NVIDIA GeForce RTX 3080 Ti "}, Params{ 0, 1, 16, 2, 8, 8, 32, 32, 16, 128, 0, 1, 1, 1, 2, 2 } }, { Name{"NVIDIA GeForce RTX 3090 "}, Params{ 0, 1, 32, 2, 16, 16, 64, 8, 8, 64, 1, 1, 0, 0, 4, 4 } }, { kDeviceNameDefault , Params{ 0, 1, 32, 2, 8, 8, 16, 8, 8, 16, 0, 0, 0, 0, 2, 2 } }, } }, { "SM8.9", { + { Name{"NVIDIA GeForce RTX 4070 Laptop GPU "}, Params{ 1, 8, 1, 1, 8, 8, 64, 8, 8, 64, 0, 0, 0, 0, 4, 8 } }, + { Name{"NVIDIA GeForce RTX 4070 Ti "}, Params{ 0, 1, 16, 2, 8, 8, 32, 8, 16, 128, 1, 0, 1, 1, 4, 8 } }, { Name{"NVIDIA GeForce RTX 4080 "}, Params{ 0, 1, 16, 2, 8, 8, 32, 8, 16, 128, 1, 0, 1, 1, 4, 8 } }, { Name{"NVIDIA GeForce RTX 4090 "}, Params{ 0, 1, 32, 2, 32, 32, 128, 8, 8, 64, 0, 1, 1, 1, 4, 4 } }, { kDeviceNameDefault , Params{ 0, 1, 16, 2, 8, 8, 32, 8, 16, 128, 1, 0, 1, 1, 4, 8 } }, |