From 3c9e63c0549870c6a1a8d019ec7cc2abee61601e Mon Sep 17 00:00:00 2001 From: Cedric Nugteren Date: Sun, 22 May 2016 14:43:25 +0200 Subject: Added first tuning results for the half-precision xDOT kernels --- include/internal/database.h | 2 +- include/internal/database/xdot.h | 18 ++++++++++++++++++ 2 files changed, 19 insertions(+), 1 deletion(-) (limited to 'include') diff --git a/include/internal/database.h b/include/internal/database.h index f66edcac..d048e4f8 100644 --- a/include/internal/database.h +++ b/include/internal/database.h @@ -68,7 +68,7 @@ class Database { // The database consists of separate database entries, stored together in a vector static const DatabaseEntry XaxpyHalf, XaxpySingle, XaxpyDouble, XaxpyComplexSingle, XaxpyComplexDouble; - static const DatabaseEntry XdotSingle, XdotDouble, XdotComplexSingle, XdotComplexDouble; + static const DatabaseEntry XdotHalf, XdotSingle, XdotDouble, XdotComplexSingle, XdotComplexDouble; static const DatabaseEntry XgemvSingle, XgemvDouble, XgemvComplexSingle, XgemvComplexDouble; static const DatabaseEntry XgerSingle, XgerDouble, XgerComplexSingle, XgerComplexDouble; static const DatabaseEntry XgemmSingle, XgemmDouble, XgemmComplexSingle, XgemmComplexDouble; diff --git a/include/internal/database/xdot.h b/include/internal/database/xdot.h index f9ae975b..95def654 100644 --- a/include/internal/database/xdot.h +++ b/include/internal/database/xdot.h @@ -14,6 +14,24 @@ namespace clblast { // ================================================================================================= +const Database::DatabaseEntry Database::XdotHalf = { + "Xdot", Precision::kHalf, { + { // Intel GPUs + kDeviceTypeGPU, "Intel", { + { "Intel(R) HD Graphics Skylake ULT GT2", { {"WGS1",32}, {"WGS2",32} } }, + { "default", { {"WGS1",32}, {"WGS2",32} } }, + } + }, + { // Default + kDeviceTypeAll, "default", { + { "default", { {"WGS1",32}, {"WGS2",32} } }, + } + }, + } +}; + +// ================================================================================================= + const Database::DatabaseEntry Database::XdotSingle = { "Xdot", Precision::kSingle, { { // AMD GPUs -- cgit v1.2.3