diff options
author | Cedric Nugteren <web@cedricnugteren.nl> | 2016-05-16 12:45:10 +0200 |
---|---|---|
committer | Cedric Nugteren <web@cedricnugteren.nl> | 2016-05-16 12:45:10 +0200 |
commit | 7a3b695db70810595ae17d9d753c3b926aa738c0 (patch) | |
tree | 2ba239884a8f20e34449bee35bc96b94b84954eb /include | |
parent | af2ac6221288ec101a69018e960bb004ad698efe (diff) |
Added half precision tuning results for supporting kernels (pad, copy, transpose, padtranspose)
Diffstat (limited to 'include')
-rw-r--r-- | include/internal/database.h | 8 | ||||
-rw-r--r-- | include/internal/database/copy.h | 18 | ||||
-rw-r--r-- | include/internal/database/pad.h | 18 | ||||
-rw-r--r-- | include/internal/database/padtranspose.h | 18 | ||||
-rw-r--r-- | include/internal/database/transpose.h | 18 |
5 files changed, 76 insertions, 4 deletions
diff --git a/include/internal/database.h b/include/internal/database.h
index 5bf69358..f66edcac 100644
--- a/include/internal/database.h
+++ b/include/internal/database.h
@@ -72,10 +72,10 @@ class Database {
   static const DatabaseEntry XgemvSingle, XgemvDouble, XgemvComplexSingle, XgemvComplexDouble;
   static const DatabaseEntry XgerSingle, XgerDouble, XgerComplexSingle, XgerComplexDouble;
   static const DatabaseEntry XgemmSingle, XgemmDouble, XgemmComplexSingle, XgemmComplexDouble;
-  static const DatabaseEntry CopySingle, CopyDouble, CopyComplexSingle, CopyComplexDouble;
-  static const DatabaseEntry PadSingle, PadDouble, PadComplexSingle, PadComplexDouble;
-  static const DatabaseEntry TransposeSingle, TransposeDouble, TransposeComplexSingle, TransposeComplexDouble;
-  static const DatabaseEntry PadtransposeSingle, PadtransposeDouble, PadtransposeComplexSingle, PadtransposeComplexDouble;
+  static const DatabaseEntry CopyHalf, CopySingle, CopyDouble, CopyComplexSingle, CopyComplexDouble;
+  static const DatabaseEntry PadHalf, PadSingle, PadDouble, PadComplexSingle, PadComplexDouble;
+  static const DatabaseEntry TransposeHalf, TransposeSingle, TransposeDouble, TransposeComplexSingle, TransposeComplexDouble;
+  static const DatabaseEntry PadtransposeHalf, PadtransposeSingle, PadtransposeDouble, PadtransposeComplexSingle, PadtransposeComplexDouble;
   static const std::vector<DatabaseEntry> database;
 
   // The constructor
diff --git a/include/internal/database/copy.h b/include/internal/database/copy.h
index 59a9e03a..b4695868 100644
--- a/include/internal/database/copy.h
+++ b/include/internal/database/copy.h
@@ -14,6 +14,24 @@
 namespace clblast {
 // =================================================================================================
 
+const Database::DatabaseEntry Database::CopyHalf = {
+  "Copy", Precision::kHalf, {
+    { // Intel GPUs
+      kDeviceTypeGPU, "Intel", {
+        { "Intel(R) HD Graphics Skylake ULT GT2", { {"COPY_DIMX",32}, {"COPY_DIMY",8}, {"COPY_VW",4}, {"COPY_WPT",4} } },
+        { "default", { {"COPY_DIMX",32}, {"COPY_DIMY",8}, {"COPY_VW",4}, {"COPY_WPT",4} } },
+      }
+    },
+    { // Default
+      kDeviceTypeAll, "default", {
+        { "default", { {"COPY_DIMX",32}, {"COPY_DIMY",8}, {"COPY_VW",4}, {"COPY_WPT",4} } },
+      }
+    },
+  }
+};
+
+// =================================================================================================
+
 const Database::DatabaseEntry Database::CopySingle = {
   "Copy", Precision::kSingle, {
     { // AMD GPUs
diff --git a/include/internal/database/pad.h b/include/internal/database/pad.h
index d2de19e4..aae7631b 100644
--- a/include/internal/database/pad.h
+++ b/include/internal/database/pad.h
@@ -14,6 +14,24 @@
 namespace clblast {
 // =================================================================================================
 
+const Database::DatabaseEntry Database::PadHalf = {
+  "Pad", Precision::kHalf, {
+    { // Intel GPUs
+      kDeviceTypeGPU, "Intel", {
+        { "Intel(R) HD Graphics Skylake ULT GT2", { {"PAD_DIMX",16}, {"PAD_DIMY",8}, {"PAD_WPTX",4}, {"PAD_WPTY",4} } },
+        { "default", { {"PAD_DIMX",16}, {"PAD_DIMY",8}, {"PAD_WPTX",4}, {"PAD_WPTY",4} } },
+      }
+    },
+    { // Default
+      kDeviceTypeAll, "default", {
+        { "default", { {"PAD_DIMX",16}, {"PAD_DIMY",8}, {"PAD_WPTX",4}, {"PAD_WPTY",4} } },
+      }
+    },
+  }
+};
+
+// =================================================================================================
+
 const Database::DatabaseEntry Database::PadSingle = {
   "Pad", Precision::kSingle, {
     { // AMD GPUs
diff --git a/include/internal/database/padtranspose.h b/include/internal/database/padtranspose.h
index b1db1b21..2d8d47f2 100644
--- a/include/internal/database/padtranspose.h
+++ b/include/internal/database/padtranspose.h
@@ -14,6 +14,24 @@
 namespace clblast {
 // =================================================================================================
 
+const Database::DatabaseEntry Database::PadtransposeHalf = {
+  "Padtranspose", Precision::kHalf, {
+    { // Intel GPUs
+      kDeviceTypeGPU, "Intel", {
+        { "Intel(R) HD Graphics Skylake ULT GT2", { {"PADTRA_PAD",0}, {"PADTRA_TILE",8}, {"PADTRA_WPT",2} } },
+        { "default", { {"PADTRA_PAD",0}, {"PADTRA_TILE",8}, {"PADTRA_WPT",2} } },
+      }
+    },
+    { // Default
+      kDeviceTypeAll, "default", {
+        { "default", { {"PADTRA_PAD",0}, {"PADTRA_TILE",8}, {"PADTRA_WPT",2} } },
+      }
+    },
+  }
+};
+
+// =================================================================================================
+
 const Database::DatabaseEntry Database::PadtransposeSingle = {
   "Padtranspose", Precision::kSingle, {
     { // AMD GPUs
diff --git a/include/internal/database/transpose.h b/include/internal/database/transpose.h
index d87f79a6..8e5ace67 100644
--- a/include/internal/database/transpose.h
+++ b/include/internal/database/transpose.h
@@ -14,6 +14,24 @@
 namespace clblast {
 // =================================================================================================
 
+const Database::DatabaseEntry Database::TransposeHalf = {
+  "Transpose", Precision::kHalf, {
+    { // Intel GPUs
+      kDeviceTypeGPU, "Intel", {
+        { "Intel(R) HD Graphics Skylake ULT GT2", { {"TRA_DIM",8}, {"TRA_PAD",0}, {"TRA_SHUFFLE",1}, {"TRA_WPT",8} } },
+        { "default", { {"TRA_DIM",8}, {"TRA_PAD",0}, {"TRA_SHUFFLE",1}, {"TRA_WPT",8} } },
+      }
+    },
+    { // Default
+      kDeviceTypeAll, "default", {
+        { "default", { {"TRA_DIM",8}, {"TRA_PAD",0}, {"TRA_SHUFFLE",1}, {"TRA_WPT",8} } },
+      }
+    },
+  }
+};
+
+// =================================================================================================
+
 const Database::DatabaseEntry Database::TransposeSingle = {
   "Transpose", Precision::kSingle, {
     { // AMD GPUs