summary | refs | log | tree | commit | diff
path: root/src/routines/level3
diff options
context:
space:
mode:
author: Cedric Nugteren <web@cedricnugteren.nl> 2016-10-03 19:32:01 +0200
committer: Cedric Nugteren <web@cedricnugteren.nl> 2016-10-03 19:32:01 +0200
commit: c1c4bc5d209280e4ec9be5c0a26f7c94077a6b20 (patch)
tree: 8f5781b17e2b2d7b96bf8d9e593e1e471fc67a30 /src/routines/level3
parent: 243cef73db53b5d8ce6c55f95e18c4412539d210 (diff)
Re-organised GEMM direct kernel and added faster fall-back version for incomplete rectangles
Diffstat (limited to 'src/routines/level3')
-rw-r--r-- src/routines/level3/xgemm.cpp | 1
1 files changed, 1 insertions, 0 deletions
diff --git a/src/routines/level3/xgemm.cpp b/src/routines/level3/xgemm.cpp
index 143ef3c1..93f5d30c 100644
--- a/src/routines/level3/xgemm.cpp
+++ b/src/routines/level3/xgemm.cpp
@@ -38,6 +38,7 @@ Xgemm<T>::Xgemm(Queue &queue, EventPointer event, const std::string &name):
#include "../../kernels/level3/xgemm_part3.opencl"
#include "../../kernels/level3/xgemm_direct_part1.opencl"
#include "../../kernels/level3/xgemm_direct_part2.opencl"
+ #include "../../kernels/level3/xgemm_direct_part3.opencl"
;
}