diff options
author | Cedric Nugteren <web@cedricnugteren.nl> | 2016-10-03 19:32:01 +0200 |
---|---|---|
committer | Cedric Nugteren <web@cedricnugteren.nl> | 2016-10-03 19:32:01 +0200 |
commit | c1c4bc5d209280e4ec9be5c0a26f7c94077a6b20 (patch) | |
tree | 8f5781b17e2b2d7b96bf8d9e593e1e471fc67a30 /src/routines/level3 | |
parent | 243cef73db53b5d8ce6c55f95e18c4412539d210 (diff) |
Re-organised GEMM direct kernel and added faster fall-back version for incomplete rectangles
Diffstat (limited to 'src/routines/level3')
-rw-r--r-- | src/routines/level3/xgemm.cpp | 1 |
1 file changed, 1 insertion, 0 deletions
diff --git a/src/routines/level3/xgemm.cpp b/src/routines/level3/xgemm.cpp
index 143ef3c1..93f5d30c 100644
--- a/src/routines/level3/xgemm.cpp
+++ b/src/routines/level3/xgemm.cpp
@@ -38,6 +38,7 @@ Xgemm<T>::Xgemm(Queue &queue, EventPointer event, const std::string &name):
     #include "../../kernels/level3/xgemm_part3.opencl"
     #include "../../kernels/level3/xgemm_direct_part1.opencl"
     #include "../../kernels/level3/xgemm_direct_part2.opencl"
+    #include "../../kernels/level3/xgemm_direct_part3.opencl"
   ;
 }
 