diff options
author | Cedric Nugteren <web@cedricnugteren.nl> | 2016-09-27 20:03:55 +0200 |
---|---|---|
committer | Cedric Nugteren <web@cedricnugteren.nl> | 2016-09-27 20:03:55 +0200 |
commit | adc058440c2f7b0f0a809158c7a612d9ddc0084c (patch) | |
tree | 9d3cd12857dd638660a79cb625d0b66b2659708b /src | |
parent | 6178fcd5847b0531a3290fc7c1737dea4eba524c (diff) |
Fixed the local memory size computation for the GEMM tuners
Diffstat (limited to 'src')
-rw-r--r-- | src/tuning/kernels/xgemm.cpp | 6 |
1 file changed, 3 insertions, 3 deletions
diff --git a/src/tuning/kernels/xgemm.cpp b/src/tuning/kernels/xgemm.cpp
index 4cb7fd00..1abc5e8a 100644
--- a/src/tuning/kernels/xgemm.cpp
+++ b/src/tuning/kernels/xgemm.cpp
@@ -126,10 +126,10 @@ class TuneXgemm {
   // Sets the local memory size
   static void SetLocalMemorySize(cltune::Tuner &tuner, const size_t id, const Arguments<T> &args) {
     auto LocalMemorySize = [args] (std::vector<size_t> v) {
-      return (((v[0]*v[1]*v[2]/v[3]) + (v[4]*v[5]*v[6]/v[7]))*GetBytes(args.precision));
+      return (((v[0]*v[1]*v[2]) + (v[3]*v[4]*v[5]))*GetBytes(args.precision));
     };
-    tuner.SetLocalMemoryUsage(id, LocalMemorySize, {"SA", "KWG", "MWG", "VWM",
-                                                    "SB", "KWG", "NWG", "VWN"});
+    tuner.SetLocalMemoryUsage(id, LocalMemorySize, {"SA", "KWG", "MWG",
+                                                    "SB", "KWG", "NWG"});
   }
 
   // Sets the base thread configuration