diff options
Diffstat (limited to 'include/clblast_c.h')
-rw-r--r-- | include/clblast_c.h | 32 |
1 files changed, 32 insertions, 0 deletions
diff --git a/include/clblast_c.h b/include/clblast_c.h
index 12d03f81..f933ef6c 100644
--- a/include/clblast_c.h
+++ b/include/clblast_c.h
@@ -1327,6 +1327,38 @@ CLBlastStatusCode PUBLIC_API CLBlastHomatcopy(const CLBlastLayout layout, const
                                               cl_mem b_buffer, const size_t b_offset, const size_t b_ld,
                                               cl_command_queue* queue, cl_event* event);
 
+// Batched version of AXPY: SAXPYBATCHED/DAXPYBATCHED/CAXPYBATCHED/ZAXPYBATCHED/HAXPYBATCHED
+CLBlastStatusCode PUBLIC_API CLBlastSaxpyBatched(const size_t n,
+                                                 const float *alphas, // NOTE(review): presumably one scalar per batch entry - confirm
+                                                 const cl_mem *x_buffers, const size_t x_offset, const size_t x_inc, // pointer to const cl_mem handles; a single offset/increment is passed, not per-batch arrays
+                                                 cl_mem *y_buffers, const size_t y_offset, const size_t y_inc, // handle pointer is not const-qualified, unlike x_buffers
+                                                 const size_t batch_count, // NOTE(review): presumably the element count of alphas/x_buffers/y_buffers - confirm
+                                                 cl_command_queue* queue, cl_event* event);
+CLBlastStatusCode PUBLIC_API CLBlastDaxpyBatched(const size_t n,
+                                                 const double *alphas, // same parameter list as CLBlastSaxpyBatched; only the scalar type differs (double)
+                                                 const cl_mem *x_buffers, const size_t x_offset, const size_t x_inc,
+                                                 cl_mem *y_buffers, const size_t y_offset, const size_t y_inc,
+                                                 const size_t batch_count,
+                                                 cl_command_queue* queue, cl_event* event);
+CLBlastStatusCode PUBLIC_API CLBlastCaxpyBatched(const size_t n,
+                                                 const cl_float2 *alphas, // same parameter list as CLBlastSaxpyBatched; only the scalar type differs (cl_float2)
+                                                 const cl_mem *x_buffers, const size_t x_offset, const size_t x_inc,
+                                                 cl_mem *y_buffers, const size_t y_offset, const size_t y_inc,
+                                                 const size_t batch_count,
+                                                 cl_command_queue* queue, cl_event* event);
+CLBlastStatusCode PUBLIC_API CLBlastZaxpyBatched(const size_t n,
+                                                 const cl_double2 *alphas, // same parameter list as CLBlastSaxpyBatched; only the scalar type differs (cl_double2)
+                                                 const cl_mem *x_buffers, const size_t x_offset, const size_t x_inc,
+                                                 cl_mem *y_buffers, const size_t y_offset, const size_t y_inc,
+                                                 const size_t batch_count,
+                                                 cl_command_queue* queue, cl_event* event);
+CLBlastStatusCode PUBLIC_API CLBlastHaxpyBatched(const size_t n,
+                                                 const cl_half *alphas, // same parameter list as CLBlastSaxpyBatched; only the scalar type differs (cl_half)
+                                                 const cl_mem *x_buffers, const size_t x_offset, const size_t x_inc,
+                                                 cl_mem *y_buffers, const size_t y_offset, const size_t y_inc,
+                                                 const size_t batch_count,
+                                                 cl_command_queue* queue, cl_event* event);
+
 // =================================================================================================
 
 // CLBlast stores binaries of compiled kernels into a cache in case the same kernel is used later on