summary | refs | log | tree | commit | diff
path: root/include/clblast_cuda.h
diff options
context:
space:
mode:
author: Cedric Nugteren <web@cedricnugteren.nl> 2018-01-11 20:32:06 +0100
committer: Cedric Nugteren <web@cedricnugteren.nl> 2018-01-11 20:32:06 +0100
commit: a500f537d8281ad32e2eb07016b9de78c946ec50 (patch)
tree: dc5a06480fe1b6c3f4b9c65b8dd69e87ea65520a /include/clblast_cuda.h
parent: 389919faec965e81a0196bb8260c7a77926b4edc (diff)
Added a RetrieveParameters function to inspect tuning parameters
Diffstat (limited to 'include/clblast_cuda.h')
-rw-r--r-- include/clblast_cuda.h 5
1 files changed, 5 insertions, 0 deletions
diff --git a/include/clblast_cuda.h b/include/clblast_cuda.h
index b0cb9aa8..ed348efe 100644
--- a/include/clblast_cuda.h
+++ b/include/clblast_cuda.h
@@ -654,6 +654,11 @@ StatusCode PUBLIC_API FillCache(const CUdevice device);
// =================================================================================================
+// Retrieves current tuning parameters for a specific device-precision-kernel combination
+StatusCode PUBLIC_API RetrieveParameters(const CUdevice device, const std::string &kernel_name,
+ const Precision precision,
+ std::unordered_map<std::string,size_t> &parameters);
+
// Overrides tuning parameters for a specific device-precision-kernel combination. The next time
// the target routine is called it will re-compile and use the new parameters from then on.
StatusCode PUBLIC_API OverrideParameters(const CUdevice device, const std::string &kernel_name,