summaryrefslogtreecommitdiff
path: root/include/clblast.h
diff options
context:
space:
mode:
authorCedric Nugteren <web@cedricnugteren.nl>2016-04-29 23:33:12 +0200
committerCedric Nugteren <web@cedricnugteren.nl>2016-04-29 23:33:12 +0200
commit877aad693f5bf57f8c37ded9e2acab014a4f039b (patch)
tree01ff55f48ed34164d19138c75fe47abeb14c5bb9 /include/clblast.h
parent4f528b1730df1ffda9d396030cfc4c4ddf0203fb (diff)
Added FillCache: a function to pre-compile all kernels for a specific device
Diffstat (limited to 'include/clblast.h')
-rw-r--r--include/clblast.h4
1 files changed, 4 insertions, 0 deletions
diff --git a/include/clblast.h b/include/clblast.h
index e473adbe..075ca93e 100644
--- a/include/clblast.h
+++ b/include/clblast.h
@@ -558,6 +558,10 @@ StatusCode Trsm(const Layout layout, const Side side, const Triangle triangle, c
// for the same device. This cache can be cleared to free up system memory or in case of debugging.
StatusCode ClearCache();
+// The cache can also be pre-initialized for a specific device with all possible CLBlast kernels.
+// Further CLBlast routine calls will then run at maximum speed.
+StatusCode FillCache(const cl_device_id device);
+
// =================================================================================================
} // namespace clblast