summary | refs | log | tree | commit | diff
path: root/include/internal/database/transpose.h
diff options
context:
space:
mode:
author: Cedric Nugteren <web@cedricnugteren.nl> 2016-05-16 12:45:10 +0200
committer: Cedric Nugteren <web@cedricnugteren.nl> 2016-05-16 12:45:10 +0200
commit: 7a3b695db70810595ae17d9d753c3b926aa738c0 (patch)
tree: 2ba239884a8f20e34449bee35bc96b94b84954eb /include/internal/database/transpose.h
parent: af2ac6221288ec101a69018e960bb004ad698efe (diff)
Added half precision tuning results for supporting kernels (pad, copy, transpose, padtranspose)
Diffstat (limited to 'include/internal/database/transpose.h')
-rw-r--r-- include/internal/database/transpose.h 18
1 files changed, 18 insertions, 0 deletions
diff --git a/include/internal/database/transpose.h b/include/internal/database/transpose.h
index d87f79a6..8e5ace67 100644
--- a/include/internal/database/transpose.h
+++ b/include/internal/database/transpose.h
@@ -14,6 +14,24 @@
namespace clblast {
// =================================================================================================
+const Database::DatabaseEntry Database::TransposeHalf = { // Half-precision (Precision::kHalf) parameter table for the "Transpose" kernel
+ "Transpose", Precision::kHalf, { // Fields: kernel name, precision, then a list of (device type, vendor) groups
+ { // Intel GPUs
+ kDeviceTypeGPU, "Intel", { // Fields: device type, vendor string, then per-device parameter sets keyed by device name
+ { "Intel(R) HD Graphics Skylake ULT GT2", { {"TRA_DIM",8}, {"TRA_PAD",0}, {"TRA_SHUFFLE",1}, {"TRA_WPT",8} } }, // NOTE(review): TRA_* meanings are defined by the kernel source, not visible here
+ { "default", { {"TRA_DIM",8}, {"TRA_PAD",0}, {"TRA_SHUFFLE",1}, {"TRA_WPT",8} } }, // Same values as the Skylake entry; presumably the fallback for other Intel GPUs - confirm against the lookup code
+ }
+ },
+ { // Default: device type kDeviceTypeAll with vendor "default"
+ kDeviceTypeAll, "default", {
+ { "default", { {"TRA_DIM",8}, {"TRA_PAD",0}, {"TRA_SHUFFLE",1}, {"TRA_WPT",8} } }, // Identical to the Intel values above
+ }
+ },
+ }
+};
+
+// =================================================================================================
+
const Database::DatabaseEntry Database::TransposeSingle = {
"Transpose", Precision::kSingle, {
{ // AMD GPUs