summaryrefslogtreecommitdiff
path: root/include/clblast_c.h
diff options
context:
space:
mode:
Diffstat (limited to 'include/clblast_c.h')
-rw-r--r--include/clblast_c.h32
1 files changed, 32 insertions, 0 deletions
diff --git a/include/clblast_c.h b/include/clblast_c.h
index 12d03f81..f933ef6c 100644
--- a/include/clblast_c.h
+++ b/include/clblast_c.h
@@ -1327,6 +1327,38 @@ CLBlastStatusCode PUBLIC_API CLBlastHomatcopy(const CLBlastLayout layout, const
cl_mem b_buffer, const size_t b_offset, const size_t b_ld,
cl_command_queue* queue, cl_event* event);
+// Batched version of AXPY: SAXPYBATCHED/DAXPYBATCHED/CAXPYBATCHED/ZAXPYBATCHED/HAXPYBATCHED
+CLBlastStatusCode PUBLIC_API CLBlastSaxpyBatched(const size_t n,
+ const float *alphas,
+ const cl_mem *x_buffers, const size_t x_offset, const size_t x_inc,
+ cl_mem *y_buffers, const size_t y_offset, const size_t y_inc,
+ const size_t batch_count,
+ cl_command_queue* queue, cl_event* event);
+CLBlastStatusCode PUBLIC_API CLBlastDaxpyBatched(const size_t n,
+ const double *alphas,
+ const cl_mem *x_buffers, const size_t x_offset, const size_t x_inc,
+ cl_mem *y_buffers, const size_t y_offset, const size_t y_inc,
+ const size_t batch_count,
+ cl_command_queue* queue, cl_event* event);
+CLBlastStatusCode PUBLIC_API CLBlastCaxpyBatched(const size_t n,
+ const cl_float2 *alphas,
+ const cl_mem *x_buffers, const size_t x_offset, const size_t x_inc,
+ cl_mem *y_buffers, const size_t y_offset, const size_t y_inc,
+ const size_t batch_count,
+ cl_command_queue* queue, cl_event* event);
+CLBlastStatusCode PUBLIC_API CLBlastZaxpyBatched(const size_t n,
+ const cl_double2 *alphas,
+ const cl_mem *x_buffers, const size_t x_offset, const size_t x_inc,
+ cl_mem *y_buffers, const size_t y_offset, const size_t y_inc,
+ const size_t batch_count,
+ cl_command_queue* queue, cl_event* event);
+CLBlastStatusCode PUBLIC_API CLBlastHaxpyBatched(const size_t n,
+ const cl_half *alphas,
+ const cl_mem *x_buffers, const size_t x_offset, const size_t x_inc,
+ cl_mem *y_buffers, const size_t y_offset, const size_t y_inc,
+ const size_t batch_count,
+ cl_command_queue* queue, cl_event* event);
+
// =================================================================================================
// CLBlast stores binaries of compiled kernels into a cache in case the same kernel is used later on