summary | refs | log | tree | commit | diff
path: root/include/clblast.h
diff options
context:
space:
mode:
author Cedric Nugteren <web@cedricnugteren.nl> 2018-03-06 20:52:12 +0100
committer Cedric Nugteren <web@cedricnugteren.nl> 2018-03-06 20:52:12 +0100
commit 0e1a1520233934e1d11bf2c32fc909617ff751ac (patch)
tree 6cf9505552515a604ca06b7dff99dd980a3a33ef /include/clblast.h
parent a1cedf36e357f0ce19eba67e1e031c3fd2647fae (diff)
First version of the tuning API, added interface for copy-kernel, added sample
Diffstat (limited to 'include/clblast.h')
-rw-r--r-- include/clblast.h 6
1 files changed, 6 insertions, 0 deletions
diff --git a/include/clblast.h b/include/clblast.h
index 9d3b9ea0..d6118e19 100644
--- a/include/clblast.h
+++ b/include/clblast.h
@@ -705,6 +705,12 @@ StatusCode PUBLIC_API OverrideParameters(const cl_device_id device, const std::s
// =================================================================================================
+template <typename T>
+StatusCode PUBLIC_API TuneCopyMatrixFast(cl_command_queue* queue, const size_t m, const size_t n,
+ const double fraction, std::unordered_map<std::string,size_t> &parameters);
+
+// =================================================================================================
+
} // namespace clblast
// CLBLAST_CLBLAST_H_