summary | refs | log | tree | commit | diff
path: root/src/tuning
diff options
context:
space:
mode:
author Cedric Nugteren <web@cedricnugteren.nl> 2017-04-14 20:16:10 +0200
committer Cedric Nugteren <web@cedricnugteren.nl> 2017-04-14 20:16:10 +0200
commit 10205d773e1477fdd634dbc7e224cc71361a9885 (patch)
tree da6ed72c7f530a02a9cae70938fce4b4670066b2 /src/tuning
parent 0da1e380974007f69b827f6b10ef0243249d0c5e (diff)
Added a new Xaxpy kernel in between the regular and fast version in
Diffstat (limited to 'src/tuning')
-rw-r--r-- src/tuning/kernels/xaxpy.cpp 6
1 files changed, 3 insertions, 3 deletions
diff --git a/src/tuning/kernels/xaxpy.cpp b/src/tuning/kernels/xaxpy.cpp
index 23132c51..7984e184 100644
--- a/src/tuning/kernels/xaxpy.cpp
+++ b/src/tuning/kernels/xaxpy.cpp
@@ -27,7 +27,7 @@ class TuneXaxpy {
// The representative kernel and the source code
static std::string KernelFamily() { return "xaxpy"; }
- static std::string KernelName() { return "XaxpyFast"; }
+ static std::string KernelName() { return "XaxpyFastest"; }
static std::string GetSources() {
return
#include "../src/kernels/common.opencl"
@@ -42,7 +42,7 @@ class TuneXaxpy {
// Tests for valid arguments
static void TestValidArguments(const Arguments<T> &args) {
if (!IsMultiple(args.n, 64)) {
- throw std::runtime_error("'XaxpyFast' requires 'n' to be a multiple of WGS*WPT*VW");
+ throw std::runtime_error("'XaxpyFastest' requires 'n' to be a multiple of WGS*WPT*VW");
}
}
@@ -52,7 +52,7 @@ class TuneXaxpy {
static size_t DefaultK() { return 1; } // N/A for this kernel
static size_t DefaultBatchCount() { return 1; } // N/A for this kernel
static double DefaultFraction() { return 1.0; } // N/A for this kernel
- static size_t DefaultNumRuns() { return 2; } // run every kernel this many times for averaging
+ static size_t DefaultNumRuns() { return 10; } // run every kernel this many times for averaging
// Describes how to obtain the sizes of the buffers
static size_t GetSizeX(const Arguments<T> &args) { return args.n; }