summaryrefslogtreecommitdiff
path: root/include
diff options
context:
space:
mode:
author Cedric Nugteren <web@cedricnugteren.nl> 2017-12-28 14:46:45 +0100
committer Cedric Nugteren <web@cedricnugteren.nl> 2017-12-28 14:46:45 +0100
commit 6d1e30e61f5ef73f0a83e12f064cae64644034ca (patch)
tree a8874ae7db89acbce71ccf2be560dd13309012b4 /include
parent aaea9474a154a9f07534523e4ca66e4b2c5f2d4f (diff)
Added interface to compute the required temporary buffer size for GEMM
Diffstat (limited to 'include')
-rw-r--r-- include/clblast.h 11
1 files changed, 11 insertions, 0 deletions
diff --git a/include/clblast.h b/include/clblast.h
index e073b211..3318768a 100644
--- a/include/clblast.h
+++ b/include/clblast.h
@@ -647,6 +647,17 @@ StatusCode GemmBatched(const Layout layout, const Transpose a_transpose, const T
// =================================================================================================
+// Retrieves the size of the temporary buffer required by GEMM into 'temp_buffer_size' (optional)
+template <typename T>
+StatusCode GemmTempBufferSize(const Layout layout, const Transpose a_transpose, const Transpose b_transpose,
+ const size_t m, const size_t n, const size_t k,
+ const size_t a_offset, const size_t a_ld,
+ const size_t b_offset, const size_t b_ld,
+ const size_t c_offset, const size_t c_ld,
+ cl_command_queue* queue, size_t& temp_buffer_size);
+
+// =================================================================================================
+
// CLBlast stores binaries of compiled kernels into a cache in case the same kernel is used later on
// for the same device. This cache can be cleared to free up system memory or in case of debugging.
StatusCode PUBLIC_API ClearCache();