summary refs log tree commit diff
path: root/src
diff options
context:
space:
mode:
author Cedric Nugteren <web@cedricnugteren.nl> 2022-05-23 12:45:22 +0200
committer GitHub <noreply@github.com> 2022-05-23 12:45:22 +0200
commit 9ab1bf24e2c0107aa7fbc5018ea93f45c6408bb2 (patch)
tree 82a42d54305d1fa8fe37c86196c293d53d0af9d4 /src
parent 6b358e1be9c96d33d9fb28b24d82972c7dd7f41a (diff)
Fix API inconsistency in cupp11.hpp
The function `CopyToAsync` has an optional event argument in the OpenCL version, which is used in CLBlast. This makes the code fail to compile when CUDA (through `cupp11.hpp`) is used as the backend. This issue was found by a CLBlast user and reported privately by email. This PR should fix that.
Diffstat (limited to 'src')
-rw-r--r-- src/cupp11.hpp 3
1 files changed, 2 insertions, 1 deletions
diff --git a/src/cupp11.hpp b/src/cupp11.hpp
index ce765844..edcdc12f 100644
--- a/src/cupp11.hpp
+++ b/src/cupp11.hpp
@@ -647,7 +647,8 @@ public:
}
// Copies the contents of this buffer into another device buffer
- void CopyToAsync(const Queue &queue, const size_t size, const Buffer<T> &destination) const {
+ void CopyToAsync(const Queue &queue, const size_t size, const Buffer<T> &destination,
+ EventPointer event = nullptr) const {
CheckError(cuMemcpyDtoDAsync(destination(), *buffer_, size*sizeof(T), queue()));
}
void CopyTo(const Queue &queue, const size_t size, const Buffer<T> &destination) const {