diff options
author | Cedric Nugteren <web@cedricnugteren.nl> | 2017-11-07 22:20:13 +0100 |
---|---|---|
committer | GitHub <noreply@github.com> | 2017-11-07 22:20:13 +0100 |
commit | b18cc9d3f18accf88c9551c98c51b99add57b96c (patch) | |
tree | a9017ad18e161647b05ba6c597dfe8ae5125298b /CMakeLists.txt | |
parent | 061b1c571b86714f1d323563a9ac587a850ecddc (diff) | |
parent | 6fe9916231a0c6316e3427aaed3be281080a2692 (diff) |
Merge pull request #212 from CNugteren/kernel_selection_tuner
GEMM kernel selection tuner
Diffstat (limited to 'CMakeLists.txt')
-rw-r--r-- | CMakeLists.txt | 12 |
1 files changed, 10 insertions, 2 deletions
diff --git a/CMakeLists.txt b/CMakeLists.txt index 28093980..a97a4eb0 100644 --- a/CMakeLists.txt +++ b/CMakeLists.txt @@ -204,7 +204,9 @@ endif() set(KERNELS copy_fast copy_pad transpose_fast transpose_pad xaxpy xdot xger xgemm xgemm_direct xgemv) set(DATABASES copy pad padtranspose transpose xaxpy xdot - xgemm xgemm_direct xgemv xgemv_fast xgemv_fast_rot xger) + xgemm xgemm_direct xgemv xgemv_fast xgemv_fast_rot xger + gemm_routine) +set(ROUTINE_TUNERS xgemm) set(LEVEL1_ROUTINES xswap xscal xcopy xaxpy xdot xdotu xdotc xnrm2 xasum xamax) set(LEVEL2_ROUTINES xgemv xgbmv xhemv xhbmv xhpmv xsymv xsbmv xspmv xtrmv xtbmv xtpmv xtrsv xger xgeru xgerc xher xhpr xher2 xhpr2 xsyr xspr xsyr2 xspr2) @@ -243,7 +245,6 @@ set(HEADERS # such that they can be discovered by IDEs such as CLion and Visual src/database/apple_cpu_fallback.hpp src/database/database.hpp src/database/database_structure.hpp - src/database/kernel_selection.hpp src/routines/level1/xamin.hpp src/routines/level1/xmax.hpp src/routines/level1/xmin.hpp @@ -254,6 +255,7 @@ set(HEADERS # such that they can be discovered by IDEs such as CLion and Visual src/utilities/clblast_exceptions.hpp src/utilities/device_mapping.hpp src/utilities/msvc.hpp + src/utilities/timing.hpp src/utilities/utilities.hpp src/cache.hpp src/cxpp11_common.hpp @@ -388,6 +390,12 @@ if(TUNERS) target_include_directories(clblast_tuner_${KERNEL} PUBLIC ${CLTUNE_INCLUDE_DIRS}) install(TARGETS clblast_tuner_${KERNEL} DESTINATION bin) endforeach() + foreach(ROUTINE_TUNER ${ROUTINE_TUNERS}) + add_executable(clblast_tuner_routine_${ROUTINE_TUNER} ${TUNERS_COMMON} src/tuning/routines/${ROUTINE_TUNER}.cpp) + target_link_libraries(clblast_tuner_routine_${ROUTINE_TUNER} clblast ${CLTUNE_LIBRARIES} ${API_LIBRARIES}) + target_include_directories(clblast_tuner_routine_${ROUTINE_TUNER} PUBLIC ${CLTUNE_INCLUDE_DIRS}) + install(TARGETS clblast_tuner_routine_${ROUTINE_TUNER} DESTINATION bin) + endforeach() # Adds 'alltuners' target: runs all tuners for all precisions set(ALLTUNERS ) |