summary | refs | log | tree | commit | diff
path: root/src/tuning/kernels
diff options
context:
space:
mode:
author Cedric Nugteren <web@cedricnugteren.nl> 2016-10-01 13:45:08 +0200
committer Cedric Nugteren <web@cedricnugteren.nl> 2016-10-01 13:45:08 +0200
commit a9d35cf04ceb2ba2185c7520dbff79580abbd785 (patch)
tree d12dabf8c65ee699a78cee8313ccb19377ab2832 /src/tuning/kernels
parent 73d135c2cef9763b47d410b125eb8bb89ece8432 (diff)
parent d59e5c570b0bbdb8348d2f9ee6fc5850e606db27 (diff)
Merge branch 'development' into gemm_direct
Diffstat (limited to 'src/tuning/kernels')
-rw-r--r-- src/tuning/kernels/xgemm.cpp 6
1 files changed, 3 insertions, 3 deletions
diff --git a/src/tuning/kernels/xgemm.cpp b/src/tuning/kernels/xgemm.cpp
index 4cb7fd00..1abc5e8a 100644
--- a/src/tuning/kernels/xgemm.cpp
+++ b/src/tuning/kernels/xgemm.cpp
@@ -126,10 +126,10 @@ class TuneXgemm {
// Sets the local memory size
static void SetLocalMemorySize(cltune::Tuner &tuner, const size_t id, const Arguments<T> &args) {
auto LocalMemorySize = [args] (std::vector<size_t> v) {
- return (((v[0]*v[1]*v[2]/v[3]) + (v[4]*v[5]*v[6]/v[7]))*GetBytes(args.precision));
+ return (((v[0]*v[1]*v[2]) + (v[3]*v[4]*v[5]))*GetBytes(args.precision));
};
- tuner.SetLocalMemoryUsage(id, LocalMemorySize, {"SA", "KWG", "MWG", "VWM",
- "SB", "KWG", "NWG", "VWN"});
+ tuner.SetLocalMemoryUsage(id, LocalMemorySize, {"SA", "KWG", "MWG",
+ "SB", "KWG", "NWG"});
}
// Sets the base thread configuration