summaryrefslogtreecommitdiff
path: root/src/database/kernels/xgemv_fast_rot.hpp
diff options
context:
space:
mode:
author Cedric Nugteren <web@cedricnugteren.nl> 2016-09-12 20:13:38 +0200
committer Cedric Nugteren <web@cedricnugteren.nl> 2016-09-12 20:13:38 +0200
commit aa3dffe356cc3c85e4d49508a4f21f4becba6e8c (patch)
tree be0853996d6d722206d678a86882d21d863cd5ab /src/database/kernels/xgemv_fast_rot.hpp
parent b5a67f86ecca72b47fc3d0a8231f902752b13c3d (diff)
Added XgemvFastRot and Xgemm 16-bit tuning results: just defaults which are now automatically taken from 32-bit if there are no entries at all
Diffstat (limited to 'src/database/kernels/xgemv_fast_rot.hpp')
-rw-r--r-- src/database/kernels/xgemv_fast_rot.hpp | 12
1 files changed, 12 insertions, 0 deletions
diff --git a/src/database/kernels/xgemv_fast_rot.hpp b/src/database/kernels/xgemv_fast_rot.hpp
index 3d2e0d3a..328094e1 100644
--- a/src/database/kernels/xgemv_fast_rot.hpp
+++ b/src/database/kernels/xgemv_fast_rot.hpp
@@ -14,6 +14,18 @@
namespace clblast {
// =================================================================================================
+const Database::DatabaseEntry Database::XgemvFastRotHalf = { // Database entry for "XgemvFastRot" at half precision (Precision::kHalf)
+ "XgemvFastRot", Precision::kHalf, {
+ { // Default: the only device group listed here, registered under kDeviceTypeAll
+ kDeviceTypeAll, "default", {
+ { "default", { {"VW3",8}, {"WGS3",32}, {"WPT3",32} } }, // name/value parameter pairs for the "default" device
+ }
+ },
+ }
+};
+
+// =================================================================================================
+
const Database::DatabaseEntry Database::XgemvFastRotSingle = {
"XgemvFastRot", Precision::kSingle, {
{ // AMD GPUs