From 0d13d814c21f1fdb3b0781b84bf12914aec5225a Mon Sep 17 00:00:00 2001 From: Cedric Nugteren Date: Thu, 14 Sep 2017 21:27:33 +0200 Subject: Added architecture layer in the tuning database for better performance on unseen devices --- src/database/kernels/xgemv_fast/xgemv_fast_16.hpp | 21 +++++++++++++++------ 1 file changed, 15 insertions(+), 6 deletions(-) (limited to 'src/database/kernels/xgemv_fast/xgemv_fast_16.hpp') diff --git a/src/database/kernels/xgemv_fast/xgemv_fast_16.hpp b/src/database/kernels/xgemv_fast/xgemv_fast_16.hpp index 6728e713..42a1e4ab 100644 --- a/src/database/kernels/xgemv_fast/xgemv_fast_16.hpp +++ b/src/database/kernels/xgemv_fast/xgemv_fast_16.hpp @@ -14,20 +14,29 @@ const DatabaseEntry XgemvFastHalf = { "XgemvFast", Precision::kHalf, {"VW2", "WGS2", "WPT2"}, { { // AMD GPUs kDeviceTypeGPU, "AMD", { - { "Ellesmere", { 1, 32, 1 } }, - { "default", { 1, 32, 1 } }, + { "Ellesmere", { + { "AMD Radeon RX 480", { 1, 32, 1 } }, + { "default", { 1, 32, 1 } }, + } }, + { "default", { + { "default", { 1, 32, 1 } }, + } }, } }, { // Intel GPUs kDeviceTypeGPU, "Intel", { - { "Intel(R) HD Graphics 5500 BroadWell U-Processor GT2", { 1, 16, 1 } }, - { "Intel(R) HD Graphics Skylake ULT GT2", { 4, 64, 4 } }, - { "default", { 1, 16, 1 } }, + { "default", { + { "Intel(R) HD Graphics 5500 BroadWell U-Processor GT2", { 1, 16, 1 } }, + { "Intel(R) HD Graphics Skylake ULT GT2", { 4, 64, 4 } }, + { "default", { 1, 16, 1 } }, + } }, } }, { // Default kDeviceTypeAll, "default", { - { "default", { 1, 16, 1 } }, + { "default", { + { "default", { 1, 16, 1 } }, + } }, } }, } -- cgit v1.2.3