diff options
author | Cedric Nugteren <web@cedricnugteren.nl> | 2016-05-13 20:49:34 +0200 |
---|---|---|
committer | Cedric Nugteren <web@cedricnugteren.nl> | 2016-05-13 20:49:34 +0200 |
commit | 120c31a30f933eea12d4dfffd4951fa22102ef5f (patch) | |
tree | 853aa6fae0522c9e92fce266c5fddb12a19dafd3 /src/clblast.cc | |
parent | f2ba75890c522b4fe1762bfeac3e08667cf9588a (diff) |
Initial experimental version of the half-precision HAXPY routine
Diffstat (limited to 'src/clblast.cc')
-rw-r--r-- | src/clblast.cc | 7 |
1 file changed, 6 insertions, 1 deletion
diff --git a/src/clblast.cc b/src/clblast.cc
index 8a9465c3..c18dc0a9 100644
--- a/src/clblast.cc
+++ b/src/clblast.cc
@@ -253,7 +253,7 @@ template StatusCode PUBLIC_API Copy<double2>(const size_t,
                                              cl_mem, const size_t, const size_t,
                                              cl_command_queue*, cl_event*);
 
-// Vector-times-constant plus vector: SAXPY/DAXPY/CAXPY/ZAXPY
+// Vector-times-constant plus vector: SAXPY/DAXPY/CAXPY/ZAXPY/HAXPY
 template <typename T>
 StatusCode Axpy(const size_t n,
                 const T alpha,
@@ -289,6 +289,11 @@ template StatusCode PUBLIC_API Axpy<double2>(const size_t,
                                              const cl_mem, const size_t, const size_t,
                                              cl_mem, const size_t, const size_t,
                                              cl_command_queue*, cl_event*);
+template StatusCode PUBLIC_API Axpy<half>(const size_t,
+                                          const half,
+                                          const cl_mem, const size_t, const size_t,
+                                          cl_mem, const size_t, const size_t,
+                                          cl_command_queue*, cl_event*);
 
 // Dot product of two vectors: SDOT/DDOT
 template <typename T>