From 9fb6550dd02c54fafbb03e20516a394d9cd63f3f Mon Sep 17 00:00:00 2001
From: Cedric Nugteren
Date: Thu, 22 Mar 2018 21:01:02 +0100
Subject: Added the OpenCL local memory size constraint to the tuners

---
 src/tuning/kernels/transpose_fast.cpp | 10 +++++-----
 1 file changed, 5 insertions(+), 5 deletions(-)

(limited to 'src/tuning/kernels/transpose_fast.cpp')

diff --git a/src/tuning/kernels/transpose_fast.cpp b/src/tuning/kernels/transpose_fast.cpp
index 6b37a31d..024f7385 100644
--- a/src/tuning/kernels/transpose_fast.cpp
+++ b/src/tuning/kernels/transpose_fast.cpp
@@ -22,11 +22,11 @@ using double2 = clblast::double2;
 int main(int argc, char *argv[]) {
   const auto command_line_args = clblast::RetrieveCommandLineArguments(argc, argv);
   switch(clblast::GetPrecision(command_line_args)) {
-    case clblast::Precision::kHalf: clblast::Tuner(argc, argv, 0, clblast::TransposeGetTunerDefaults, clblast::TransposeGetTunerSettings, clblast::TransposeTestValidArguments, clblast::TransposeSetConstraints, clblast::TransposeSetArguments); break;
-    case clblast::Precision::kSingle: clblast::Tuner(argc, argv, 0, clblast::TransposeGetTunerDefaults, clblast::TransposeGetTunerSettings, clblast::TransposeTestValidArguments, clblast::TransposeSetConstraints, clblast::TransposeSetArguments); break;
-    case clblast::Precision::kDouble: clblast::Tuner(argc, argv, 0, clblast::TransposeGetTunerDefaults, clblast::TransposeGetTunerSettings, clblast::TransposeTestValidArguments, clblast::TransposeSetConstraints, clblast::TransposeSetArguments); break;
-    case clblast::Precision::kComplexSingle: clblast::Tuner(argc, argv, 0, clblast::TransposeGetTunerDefaults, clblast::TransposeGetTunerSettings, clblast::TransposeTestValidArguments, clblast::TransposeSetConstraints, clblast::TransposeSetArguments); break;
-    case clblast::Precision::kComplexDouble: clblast::Tuner(argc, argv, 0, clblast::TransposeGetTunerDefaults, clblast::TransposeGetTunerSettings, clblast::TransposeTestValidArguments, clblast::TransposeSetConstraints, clblast::TransposeSetArguments); break;
+    case clblast::Precision::kHalf: clblast::Tuner(argc, argv, 0, clblast::TransposeGetTunerDefaults, clblast::TransposeGetTunerSettings, clblast::TransposeTestValidArguments, clblast::TransposeSetConstraints, clblast::TransposeComputeLocalMemSize, clblast::TransposeSetArguments); break;
+    case clblast::Precision::kSingle: clblast::Tuner(argc, argv, 0, clblast::TransposeGetTunerDefaults, clblast::TransposeGetTunerSettings, clblast::TransposeTestValidArguments, clblast::TransposeSetConstraints, clblast::TransposeComputeLocalMemSize, clblast::TransposeSetArguments); break;
+    case clblast::Precision::kDouble: clblast::Tuner(argc, argv, 0, clblast::TransposeGetTunerDefaults, clblast::TransposeGetTunerSettings, clblast::TransposeTestValidArguments, clblast::TransposeSetConstraints, clblast::TransposeComputeLocalMemSize, clblast::TransposeSetArguments); break;
+    case clblast::Precision::kComplexSingle: clblast::Tuner(argc, argv, 0, clblast::TransposeGetTunerDefaults, clblast::TransposeGetTunerSettings, clblast::TransposeTestValidArguments, clblast::TransposeSetConstraints, clblast::TransposeComputeLocalMemSize, clblast::TransposeSetArguments); break;
+    case clblast::Precision::kComplexDouble: clblast::Tuner(argc, argv, 0, clblast::TransposeGetTunerDefaults, clblast::TransposeGetTunerSettings, clblast::TransposeTestValidArguments, clblast::TransposeSetConstraints, clblast::TransposeComputeLocalMemSize, clblast::TransposeSetArguments); break;
   }
   return 0;
 }
-- 
cgit v1.2.3