diff options
author | CNugteren <web@cedricnugteren.nl> | 2015-06-14 11:15:53 +0200 |
---|---|---|
committer | CNugteren <web@cedricnugteren.nl> | 2015-06-14 11:15:53 +0200 |
commit | 294a3e3d410c87ffcc7fc550e09b6d45c71a0af8 (patch) | |
tree | d68a45bb8312aabba9589bb1c51b2c6ffe0dc504 /include/internal/database | |
parent | ab0064dab76c83ee9820acb62fa914c493c2563d (diff) |
Split the three variations of the GEMV kernel for maximal tuning freedom
Diffstat (limited to 'include/internal/database')
-rw-r--r-- | include/internal/database/xgemv.h | 44 |
1 files changed, 22 insertions, 22 deletions
diff --git a/include/internal/database/xgemv.h b/include/internal/database/xgemv.h index 37d33487..48ff42c8 100644 --- a/include/internal/database/xgemv.h +++ b/include/internal/database/xgemv.h @@ -18,24 +18,24 @@ const Database::DatabaseEntry Database::XgemvSingle = { "Xgemv", Precision::kSingle, { { // NVIDIA GPUs CL_DEVICE_TYPE_GPU, "NVIDIA Corporation", { - { "GeForce GTX 480", { {"WGS",64}, {"WPT",1}, {"VW",1} } }, - { "Tesla K20m", { {"WGS",64}, {"WPT",1}, {"VW",1} } }, - { "Tesla K40m", { {"WGS",64}, {"WPT",1}, {"VW",1} } }, + { "GeForce GTX 480", { {"WGS1",64}, {"WPT1",1}, {"WGS2",64}, {"WPT2",1}, {"VW2",1}, {"WGS3",64}, {"WPT3",1}, {"VW3",1} } }, + { "Tesla K20m", { {"WGS1",64}, {"WPT1",1}, {"WGS2",64}, {"WPT2",1}, {"VW2",1}, {"WGS3",64}, {"WPT3",1}, {"VW3",1} } }, + { "Tesla K40m", { {"WGS1",64}, {"WPT1",1}, {"WGS2",64}, {"WPT2",1}, {"VW2",1}, {"WGS3",64}, {"WPT3",1}, {"VW3",1} } }, } }, { // AMD GPUs CL_DEVICE_TYPE_GPU, "AMD", { - { "Tahiti", { {"WGS",64}, {"WPT",1}, {"VW",1} } }, + { "Tahiti", { {"WGS1",64}, {"WPT1",1}, {"WGS2",64}, {"WPT2",1}, {"VW2",1}, {"WGS3",64}, {"WPT3",1}, {"VW3",1} } }, } }, { // Intel GPUs CL_DEVICE_TYPE_GPU, "Intel", { - { "Iris", { {"WGS",128}, {"WPT",4}, {"VW",4} } }, + { "Iris", { {"WGS1",256}, {"WPT1",2}, {"WGS2",64}, {"WPT2",4}, {"VW2",4}, {"WGS3",256}, {"WPT3",2}, {"VW3",8} } }, } }, { // Default CL_DEVICE_TYPE_ALL, kDefault, { - { kDefault, { {"WGS",64}, {"WPT",1}, {"VW",1} } }, + { kDefault, { {"WGS1",64}, {"WPT1",1}, {"WGS2",64}, {"WPT2",1}, {"VW2",1}, {"WGS3",64}, {"WPT3",1}, {"VW3",1} } }, } }, } @@ -47,14 +47,14 @@ const Database::DatabaseEntry Database::XgemvDouble = { "Xgemv", Precision::kDouble, { { // NVIDIA GPUs CL_DEVICE_TYPE_GPU, "NVIDIA Corporation", { - { "GeForce GTX 480", { {"WGS",64}, {"WPT",1}, {"VW",1} } }, - { "Tesla K20m", { {"WGS",64}, {"WPT",1}, {"VW",1} } }, - { "Tesla K40m", { {"WGS",64}, {"WPT",1}, {"VW",1} } }, + { "GeForce GTX 480", { {"WGS1",64}, {"WPT1",1}, {"WGS2",64}, {"WPT2",1}, {"VW2",1}, {"WGS3",64}, {"WPT3",1}, {"VW3",1} } }, + { "Tesla K20m", { {"WGS1",64}, {"WPT1",1}, {"WGS2",64}, {"WPT2",1}, {"VW2",1}, {"WGS3",64}, {"WPT3",1}, {"VW3",1} } }, + { "Tesla K40m", { {"WGS1",64}, {"WPT1",1}, {"WGS2",64}, {"WPT2",1}, {"VW2",1}, {"WGS3",64}, {"WPT3",1}, {"VW3",1} } }, } }, { // AMD GPUs CL_DEVICE_TYPE_GPU, "AMD", { - { "Tahiti", { {"WGS",64}, {"WPT",1}, {"VW",1} } }, + { "Tahiti", { {"WGS1",64}, {"WPT1",1}, {"WGS2",64}, {"WPT2",1}, {"VW2",1}, {"WGS3",64}, {"WPT3",1}, {"VW3",1} } }, } }, { // Intel GPUs @@ -63,7 +63,7 @@ const Database::DatabaseEntry Database::XgemvDouble = { }, { // Default CL_DEVICE_TYPE_ALL, kDefault, { - { kDefault, { {"WGS",64}, {"WPT",1}, {"VW",1} } }, + { kDefault, { {"WGS1",64}, {"WPT1",1}, {"WGS2",64}, {"WPT2",1}, {"VW2",1}, {"WGS3",64}, {"WPT3",1}, {"VW3",1} } }, } }, } @@ -74,24 +74,24 @@ const Database::DatabaseEntry Database::XgemvComplexSingle = { "Xgemv", Precision::kComplexSingle, { { // NVIDIA GPUs CL_DEVICE_TYPE_GPU, "NVIDIA Corporation", { - { "GeForce GTX 480", { {"WGS",64}, {"WPT",1}, {"VW",1} } }, - { "Tesla K20m", { {"WGS",64}, {"WPT",1}, {"VW",1} } }, - { "Tesla K40m", { {"WGS",64}, {"WPT",1}, {"VW",1} } }, + { "GeForce GTX 480", { {"WGS1",64}, {"WPT1",1}, {"WGS2",64}, {"WPT2",1}, {"VW2",1}, {"WGS3",64}, {"WPT3",1}, {"VW3",1} } }, + { "Tesla K20m", { {"WGS1",64}, {"WPT1",1}, {"WGS2",64}, {"WPT2",1}, {"VW2",1}, {"WGS3",64}, {"WPT3",1}, {"VW3",1} } }, + { "Tesla K40m", { {"WGS1",64}, {"WPT1",1}, {"WGS2",64}, {"WPT2",1}, {"VW2",1}, {"WGS3",64}, {"WPT3",1}, {"VW3",1} } }, } }, { // AMD GPUs CL_DEVICE_TYPE_GPU, "AMD", { - { "Tahiti", { {"WGS",64}, {"WPT",1}, {"VW",1} } }, + { "Tahiti", { {"WGS1",64}, {"WPT1",1}, {"WGS2",64}, {"WPT2",1}, {"VW2",1}, {"WGS3",64}, {"WPT3",1}, {"VW3",1} } }, } }, { // Intel GPUs CL_DEVICE_TYPE_GPU, "Intel", { - { "Iris", { {"WGS",64}, {"WPT",1}, {"VW",1} } }, + { "Iris", { {"WGS1",64}, {"WPT1",1}, {"WGS2",64}, {"WPT2",1}, {"VW2",1}, {"WGS3",64}, {"WPT3",1}, {"VW3",1} } }, } }, { // Default CL_DEVICE_TYPE_ALL, kDefault, { - { kDefault, { {"WGS",64}, {"WPT",1}, {"VW",1} } }, + { kDefault, { {"WGS1",64}, {"WPT1",1}, {"WGS2",64}, {"WPT2",1}, {"VW2",1}, {"WGS3",64}, {"WPT3",1}, {"VW3",1} } }, } }, } @@ -103,14 +103,14 @@ const Database::DatabaseEntry Database::XgemvComplexDouble = { "Xgemv", Precision::kComplexDouble, { { // NVIDIA GPUs CL_DEVICE_TYPE_GPU, "NVIDIA Corporation", { - { "GeForce GTX 480", { {"WGS",64}, {"WPT",1}, {"VW",1} } }, - { "Tesla K20m", { {"WGS",64}, {"WPT",1}, {"VW",1} } }, - { "Tesla K40m", { {"WGS",64}, {"WPT",1}, {"VW",1} } }, + { "GeForce GTX 480", { {"WGS1",64}, {"WPT1",1}, {"WGS2",64}, {"WPT2",1}, {"VW2",1}, {"WGS3",64}, {"WPT3",1}, {"VW3",1} } }, + { "Tesla K20m", { {"WGS1",64}, {"WPT1",1}, {"WGS2",64}, {"WPT2",1}, {"VW2",1}, {"WGS3",64}, {"WPT3",1}, {"VW3",1} } }, + { "Tesla K40m", { {"WGS1",64}, {"WPT1",1}, {"WGS2",64}, {"WPT2",1}, {"VW2",1}, {"WGS3",64}, {"WPT3",1}, {"VW3",1} } }, } }, { // AMD GPUs CL_DEVICE_TYPE_GPU, "AMD", { - { "Tahiti", { {"WGS",64}, {"WPT",1}, {"VW",1} } }, + { "Tahiti", { {"WGS1",64}, {"WPT1",1}, {"WGS2",64}, {"WPT2",1}, {"VW2",1}, {"WGS3",64}, {"WPT3",1}, {"VW3",1} } }, } }, { // Intel GPUs @@ -119,7 +119,7 @@ const Database::DatabaseEntry Database::XgemvComplexDouble = { }, { // Default CL_DEVICE_TYPE_ALL, kDefault, { - { kDefault, { {"WGS",64}, {"WPT",1}, {"VW",1} } }, + { kDefault, { {"WGS1",64}, {"WPT1",1}, {"WGS2",64}, {"WPT2",1}, {"VW2",1}, {"WGS3",64}, {"WPT3",1}, {"VW3",1} } }, } }, } |