summary | refs | log | tree | commit | diff
path: root/src/clblast.cc
diff options
context:
space:
mode:
author: Cedric Nugteren <web@cedricnugteren.nl> 2016-05-13 20:49:34 +0200
committer: Cedric Nugteren <web@cedricnugteren.nl> 2016-05-13 20:49:34 +0200
commit: 120c31a30f933eea12d4dfffd4951fa22102ef5f (patch)
tree: 853aa6fae0522c9e92fce266c5fddb12a19dafd3 /src/clblast.cc
parent: f2ba75890c522b4fe1762bfeac3e08667cf9588a (diff)
Initial experimental version of the half-precision HAXPY routine
Diffstat (limited to 'src/clblast.cc')
-rw-r--r-- src/clblast.cc 7
1 file changed, 6 insertions, 1 deletion
diff --git a/src/clblast.cc b/src/clblast.cc
index 8a9465c3..c18dc0a9 100644
--- a/src/clblast.cc
+++ b/src/clblast.cc
@@ -253,7 +253,7 @@ template StatusCode PUBLIC_API Copy<double2>(const size_t,
cl_mem, const size_t, const size_t,
cl_command_queue*, cl_event*);
-// Vector-times-constant plus vector: SAXPY/DAXPY/CAXPY/ZAXPY
+// Vector-times-constant plus vector: SAXPY/DAXPY/CAXPY/ZAXPY/HAXPY
template <typename T>
StatusCode Axpy(const size_t n,
const T alpha,
@@ -289,6 +289,11 @@ template StatusCode PUBLIC_API Axpy<double2>(const size_t,
const cl_mem, const size_t, const size_t,
cl_mem, const size_t, const size_t,
cl_command_queue*, cl_event*);
+template StatusCode PUBLIC_API Axpy<half>(const size_t,
+ const half,
+ const cl_mem, const size_t, const size_t,
+ cl_mem, const size_t, const size_t,
+ cl_command_queue*, cl_event*);
// Dot product of two vectors: SDOT/DDOT
template <typename T>