diff options
author | Cedric Nugteren <web@cedricnugteren.nl> | 2017-12-28 14:46:45 +0100 |
---|---|---|
committer | Cedric Nugteren <web@cedricnugteren.nl> | 2017-12-28 14:46:45 +0100 |
commit | 6d1e30e61f5ef73f0a83e12f064cae64644034ca (patch) | |
tree | a8874ae7db89acbce71ccf2be560dd13309012b4 /include | |
parent | aaea9474a154a9f07534523e4ca66e4b2c5f2d4f (diff) |
Added interface to compute the required temporary buffer size for GEMM
Diffstat (limited to 'include')
-rw-r--r-- | include/clblast.h | 11 |
1 files changed, 11 insertions, 0 deletions
```diff
diff --git a/include/clblast.h b/include/clblast.h
index e073b211..3318768a 100644
--- a/include/clblast.h
+++ b/include/clblast.h
@@ -647,6 +647,17 @@ StatusCode GemmBatched(const Layout layout, const Transpose a_transpose, const T
 
 // =================================================================================================
 
+// Retrieves the required size of the temporary buffer for the GEMM kernel (optional)
+template <typename T>
+StatusCode GemmTempBufferSize(const Layout layout, const Transpose a_transpose, const Transpose b_transpose,
+                              const size_t m, const size_t n, const size_t k,
+                              const size_t a_offset, const size_t a_ld,
+                              const size_t b_offset, const size_t b_ld,
+                              const size_t c_offset, const size_t c_ld,
+                              cl_command_queue* queue, size_t& temp_buffer_size);
+
+// =================================================================================================
+
 // CLBlast stores binaries of compiled kernels into a cache in case the same kernel is used later on
 // for the same device. This cache can be cleared to free up system memory or in case of debugging.
 StatusCode PUBLIC_API ClearCache();
```