diff options
author | Cedric Nugteren <web@cedricnugteren.nl> | 2018-04-15 11:45:45 +0200 |
---|---|---|
committer | Cedric Nugteren <web@cedricnugteren.nl> | 2018-04-15 11:45:45 +0200 |
commit | f14e6f87d2851936629071a2bb0c39d3a8b1a0e5 (patch) | |
tree | a79691a1e12f848360ab58381e2f2c844a26456c | |
parent | 0dff7f1ac43bb7d074db36ce2ce44c52e6760e7e (diff) |
Updated tuning results for the Skylake ULT GT2 GPU with the new kernel
-rw-r--r-- | CHANGELOG | 1 | ||||
-rwxr-xr-x | scripts/database/database.py | 1 | ||||
-rw-r--r-- | src/database/kernels/xgemm/xgemm_16.hpp | 4 | ||||
-rw-r--r-- | src/database/kernels/xgemm/xgemm_32.hpp | 2 | ||||
-rw-r--r-- | src/database/kernels/xgemm/xgemm_3232.hpp | 2 |
5 files changed, 6 insertions, 4 deletions
@@ -3,6 +3,7 @@ Development (next version) - Added Python interface to CLBlast 'PyCLBlast' - Added CLBlast to Ubuntu PPA and macOS Homebrew package managers - Added an API to run the tuners programmatically without any I/O +- Improved the performance potential by adding a second tunable GEMM kernel with 2D register tiling - Re-added a local memory size constraint to the tuners - Updated and reorganised the CLBlast documentation - Various minor fixes and enhancements diff --git a/scripts/database/database.py b/scripts/database/database.py index a2d9c6a0..6bd52760 100755 --- a/scripts/database/database.py +++ b/scripts/database/database.py @@ -147,6 +147,7 @@ def main(argv): if cl_args.remove_device is not None: print("[database] Removing all results for device '%s'" % cl_args.remove_device) remove_database_entries(database, {"clblast_device_name": cl_args.remove_device}) + #, "kernel_family": "xgemm"}) io.save_database(database, database_filename) # Adds new tuning parameters to existing database entries diff --git a/src/database/kernels/xgemm/xgemm_16.hpp b/src/database/kernels/xgemm/xgemm_16.hpp index f5fae792..26d2d985 100644 --- a/src/database/kernels/xgemm/xgemm_16.hpp +++ b/src/database/kernels/xgemm/xgemm_16.hpp @@ -36,8 +36,8 @@ const DatabaseEntry XgemmHalf = { kDeviceTypeGPU, "Intel", { { "default", { { Name{"Intel(R) HD Graphics 620 "}, Params{ 0, 1, 32, 2, 8, 8, 64, 8, 8, 64, 0, 0, 0, 0, 1, 1 } }, - { Name{"Intel(R) HD Graphics Skylake ULT GT2 "}, Params{ 0, 1, 32, 2, 8, 16, 128, 8, 8, 32, 0, 1, 0, 1, 8, 4 } }, - { kDeviceNameDefault , Params{ 0, 1, 32, 2, 16, 16, 64, 8, 8, 64, 1, 1, 0, 0, 4, 2 } }, + { Name{"Intel(R) HD Graphics Skylake ULT GT2 "}, Params{ 0, 1, 16, 2, 8, 8, 32, 16, 16, 128, 0, 1, 1, 0, 4, 8 } }, + { kDeviceNameDefault , Params{ 0, 1, 32, 2, 8, 16, 128, 8, 8, 32, 0, 1, 0, 1, 8, 4 } }, } }, } }, diff --git a/src/database/kernels/xgemm/xgemm_32.hpp b/src/database/kernels/xgemm/xgemm_32.hpp index 05fa7e29..bc68555c 100644 --- a/src/database/kernels/xgemm/xgemm_32.hpp +++ b/src/database/kernels/xgemm/xgemm_32.hpp @@ -89,7 +89,7 @@ const DatabaseEntry XgemmSingle = { { Name{"Intel(R) HD Graphics 620 "}, Params{ 0, 1, 32, 2, 32, 8, 64, 16, 16, 128, 0, 0, 0, 1, 1, 2 } }, { Name{"Intel(R) HD Graphics Haswell Ultrabook GT2 Mobile "}, Params{ 0, 1, 16, 2, 16, 8, 32, 8, 16, 128, 1, 1, 1, 1, 2, 4 } }, { Name{"Intel(R) HD Graphics IvyBridge M GT2 "}, Params{ 0, 1, 32, 2, 16, 16, 64, 8, 16, 128, 1, 1, 0, 1, 1, 4 } }, - { Name{"Intel(R) HD Graphics Skylake ULT GT2 "}, Params{ 0, 1, 32, 2, 16, 16, 64, 8, 8, 64, 1, 1, 0, 0, 4, 4 } }, + { Name{"Intel(R) HD Graphics Skylake ULT GT2 "}, Params{ 1, 2, 1, 1, 4, 4, 32, 8, 8, 64, 0, 0, 0, 0, 2, 2 } }, { Name{"Iris "}, Params{ 0, 1, 16, 8, 16, 8, 128, 32, 16, 64, 1, 1, 1, 1, 4, 1 } }, { Name{"Iris Pro "}, Params{ 0, 1, 16, 2, 16, 8, 64, 32, 32, 128, 1, 1, 1, 0, 4, 4 } }, { kDeviceNameDefault , Params{ 0, 1, 32, 2, 16, 16, 64, 8, 8, 64, 1, 1, 0, 0, 4, 4 } }, diff --git a/src/database/kernels/xgemm/xgemm_3232.hpp b/src/database/kernels/xgemm/xgemm_3232.hpp index bda4e07a..febca946 100644 --- a/src/database/kernels/xgemm/xgemm_3232.hpp +++ b/src/database/kernels/xgemm/xgemm_3232.hpp @@ -87,7 +87,7 @@ const DatabaseEntry XgemmComplexSingle = { { Name{"Intel(R) HD Graphics 5500 BroadWell U-Processor GT"}, Params{ 0, 1, 16, 8, 8, 8, 32, 16, 16, 64, 1, 0, 0, 0, 4, 4 } }, { Name{"Intel(R) HD Graphics 620 "}, Params{ 0, 1, 16, 2, 16, 8, 32, 8, 8, 32, 0, 0, 1, 0, 1, 1 } }, { Name{"Intel(R) HD Graphics Haswell Ultrabook GT2 Mobile "}, Params{ 0, 1, 32, 8, 16, 16, 64, 16, 16, 64, 1, 1, 1, 1, 2, 1 } }, - { Name{"Intel(R) HD Graphics Skylake ULT GT2 "}, Params{ 0, 1, 32, 2, 16, 16, 64, 16, 16, 64, 0, 0, 0, 0, 4, 2 } }, + { Name{"Intel(R) HD Graphics Skylake ULT GT2 "}, Params{ 1, 2, 1, 1, 4, 4, 16, 8, 8, 64, 0, 0, 0, 0, 2, 2 } }, { Name{"Iris "}, Params{ 0, 1, 32, 8, 32, 16, 64, 8, 16, 64, 1, 0, 1, 0, 1, 1 } }, { Name{"Iris Pro "}, Params{ 0, 1, 16, 2, 8, 8, 32, 32, 8, 32, 1, 1, 1, 1, 1, 1 } }, { kDeviceNameDefault , Params{ 0, 1, 32, 2, 16, 16, 64, 32, 32, 128, 1, 1, 1, 0, 2, 2 } }, |