From 3d2ef9331bd01bfc31d6725576c8ccb4eadbbc1c Mon Sep 17 00:00:00 2001 From: Cedric Nugteren Date: Sat, 10 Mar 2018 14:35:11 +0100 Subject: Fixed a few things for the new tuning API --- src/tuning/kernels/copy_fast.cpp | 10 +++++----- src/tuning/kernels/copy_fast.hpp | 10 +++++----- src/tuning/kernels/copy_pad.cpp | 10 +++++----- src/tuning/kernels/copy_pad.hpp | 10 +++++----- src/tuning/kernels/invert.cpp | 10 +++++----- src/tuning/kernels/invert.hpp | 10 +++++----- src/tuning/kernels/transpose_fast.cpp | 10 +++++----- src/tuning/kernels/transpose_fast.hpp | 10 +++++----- src/tuning/kernels/transpose_pad.cpp | 10 +++++----- src/tuning/kernels/transpose_pad.hpp | 10 +++++----- src/tuning/kernels/xaxpy.cpp | 10 +++++----- src/tuning/kernels/xaxpy.hpp | 10 +++++----- src/tuning/kernels/xdot.cpp | 10 +++++----- src/tuning/kernels/xdot.hpp | 10 +++++----- src/tuning/kernels/xgemm.cpp | 10 +++++----- src/tuning/kernels/xgemm.hpp | 10 +++++----- src/tuning/kernels/xgemm_direct.cpp | 10 +++++----- src/tuning/kernels/xgemm_direct.hpp | 10 +++++----- src/tuning/kernels/xgemv.cpp | 10 +++++----- src/tuning/kernels/xgemv.hpp | 10 +++++----- src/tuning/kernels/xger.cpp | 10 +++++----- src/tuning/kernels/xger.hpp | 10 +++++----- 22 files changed, 110 insertions(+), 110 deletions(-) (limited to 'src/tuning/kernels') diff --git a/src/tuning/kernels/copy_fast.cpp b/src/tuning/kernels/copy_fast.cpp index a71dd083..0314113c 100644 --- a/src/tuning/kernels/copy_fast.cpp +++ b/src/tuning/kernels/copy_fast.cpp @@ -22,11 +22,11 @@ using double2 = clblast::double2; int main(int argc, char *argv[]) { const auto command_line_args = clblast::RetrieveCommandLineArguments(argc, argv); switch(clblast::GetPrecision(command_line_args)) { - case clblast::Precision::kHalf: clblast::Tuner(argc, argv, 0, clblast::GetTunerDefaults, clblast::GetTunerSettings, clblast::TestValidArguments, clblast::SetConstraints, clblast::SetArguments); break; - case clblast::Precision::kSingle: clblast::Tuner(argc, argv, 0, clblast::GetTunerDefaults, clblast::GetTunerSettings, clblast::TestValidArguments, clblast::SetConstraints, clblast::SetArguments); break; - case clblast::Precision::kDouble: clblast::Tuner(argc, argv, 0, clblast::GetTunerDefaults, clblast::GetTunerSettings, clblast::TestValidArguments, clblast::SetConstraints, clblast::SetArguments); break; - case clblast::Precision::kComplexSingle: clblast::Tuner(argc, argv, 0, clblast::GetTunerDefaults, clblast::GetTunerSettings, clblast::TestValidArguments, clblast::SetConstraints, clblast::SetArguments); break; - case clblast::Precision::kComplexDouble: clblast::Tuner(argc, argv, 0, clblast::GetTunerDefaults, clblast::GetTunerSettings, clblast::TestValidArguments, clblast::SetConstraints, clblast::SetArguments); break; + case clblast::Precision::kHalf: clblast::Tuner(argc, argv, 0, clblast::CopyGetTunerDefaults, clblast::CopyGetTunerSettings, clblast::CopyTestValidArguments, clblast::CopySetConstraints, clblast::CopySetArguments); break; + case clblast::Precision::kSingle: clblast::Tuner(argc, argv, 0, clblast::CopyGetTunerDefaults, clblast::CopyGetTunerSettings, clblast::CopyTestValidArguments, clblast::CopySetConstraints, clblast::CopySetArguments); break; + case clblast::Precision::kDouble: clblast::Tuner(argc, argv, 0, clblast::CopyGetTunerDefaults, clblast::CopyGetTunerSettings, clblast::CopyTestValidArguments, clblast::CopySetConstraints, clblast::CopySetArguments); break; + case clblast::Precision::kComplexSingle: clblast::Tuner(argc, argv, 0, clblast::CopyGetTunerDefaults, clblast::CopyGetTunerSettings, clblast::CopyTestValidArguments, clblast::CopySetConstraints, clblast::CopySetArguments); break; + case clblast::Precision::kComplexDouble: clblast::Tuner(argc, argv, 0, clblast::CopyGetTunerDefaults, clblast::CopyGetTunerSettings, clblast::CopyTestValidArguments, clblast::CopySetConstraints, clblast::CopySetArguments); break; } return 0; } diff --git a/src/tuning/kernels/copy_fast.hpp b/src/tuning/kernels/copy_fast.hpp index eab1c7dd..f9a58bc7 100644 --- a/src/tuning/kernels/copy_fast.hpp +++ b/src/tuning/kernels/copy_fast.hpp @@ -21,7 +21,7 @@ namespace clblast { // ================================================================================================= // Settings for this kernel (default command-line arguments) -TunerDefaults GetTunerDefaults(const int) { +TunerDefaults CopyGetTunerDefaults(const int) { auto settings = TunerDefaults(); settings.options = {kArgM, kArgN, kArgAlpha}; settings.default_m = 1024; @@ -31,7 +31,7 @@ TunerDefaults GetTunerDefaults(const int) { // Settings for this kernel (general) template -TunerSettings GetTunerSettings(const int, const Arguments &args) { +TunerSettings CopyGetTunerSettings(const int, const Arguments &args) { auto settings = TunerSettings(); // Identification of the kernel @@ -77,12 +77,12 @@ TunerSettings GetTunerSettings(const int, const Arguments &args) { // Tests for valid arguments template -void TestValidArguments(const int, const Arguments &) { } -std::vector SetConstraints(const int) { return {}; } +void CopyTestValidArguments(const int, const Arguments &) { } +std::vector CopySetConstraints(const int) { return {}; } // Sets the kernel's arguments template -void SetArguments(const int, Kernel &kernel, const Arguments &args, std::vector>& buffers) { +void CopySetArguments(const int, Kernel &kernel, const Arguments &args, std::vector>& buffers) { kernel.SetArgument(0, static_cast(args.m)); kernel.SetArgument(1, buffers[2]()); // 2 == A matrix kernel.SetArgument(2, buffers[3]()); // 3 == B matrix diff --git a/src/tuning/kernels/copy_pad.cpp b/src/tuning/kernels/copy_pad.cpp index e32a5746..909a71c8 100644 --- a/src/tuning/kernels/copy_pad.cpp +++ b/src/tuning/kernels/copy_pad.cpp @@ -22,11 +22,11 @@ using double2 = clblast::double2; int main(int argc, char *argv[]) { const auto command_line_args = clblast::RetrieveCommandLineArguments(argc, argv); switch(clblast::GetPrecision(command_line_args)) { - case clblast::Precision::kHalf: clblast::Tuner(argc, argv, 0, clblast::GetTunerDefaults, clblast::GetTunerSettings, clblast::TestValidArguments, clblast::SetConstraints, clblast::SetArguments); break; - case clblast::Precision::kSingle: clblast::Tuner(argc, argv, 0, clblast::GetTunerDefaults, clblast::GetTunerSettings, clblast::TestValidArguments, clblast::SetConstraints, clblast::SetArguments); break; - case clblast::Precision::kDouble: clblast::Tuner(argc, argv, 0, clblast::GetTunerDefaults, clblast::GetTunerSettings, clblast::TestValidArguments, clblast::SetConstraints, clblast::SetArguments); break; - case clblast::Precision::kComplexSingle: clblast::Tuner(argc, argv, 0, clblast::GetTunerDefaults, clblast::GetTunerSettings, clblast::TestValidArguments, clblast::SetConstraints, clblast::SetArguments); break; - case clblast::Precision::kComplexDouble: clblast::Tuner(argc, argv, 0, clblast::GetTunerDefaults, clblast::GetTunerSettings, clblast::TestValidArguments, clblast::SetConstraints, clblast::SetArguments); break; + case clblast::Precision::kHalf: clblast::Tuner(argc, argv, 0, clblast::PadGetTunerDefaults, clblast::PadGetTunerSettings, clblast::PadTestValidArguments, clblast::PadSetConstraints, clblast::PadSetArguments); break; + case clblast::Precision::kSingle: clblast::Tuner(argc, argv, 0, clblast::PadGetTunerDefaults, clblast::PadGetTunerSettings, clblast::PadTestValidArguments, clblast::PadSetConstraints, clblast::PadSetArguments); break; + case clblast::Precision::kDouble: clblast::Tuner(argc, argv, 0, clblast::PadGetTunerDefaults, clblast::PadGetTunerSettings, clblast::PadTestValidArguments, clblast::PadSetConstraints, clblast::PadSetArguments); break; + case clblast::Precision::kComplexSingle: clblast::Tuner(argc, argv, 0, clblast::PadGetTunerDefaults, clblast::PadGetTunerSettings, clblast::PadTestValidArguments, clblast::PadSetConstraints, clblast::PadSetArguments); break; + case clblast::Precision::kComplexDouble: clblast::Tuner(argc, argv, 0, clblast::PadGetTunerDefaults, clblast::PadGetTunerSettings, clblast::PadTestValidArguments, clblast::PadSetConstraints, clblast::PadSetArguments); break; } return 0; } diff --git a/src/tuning/kernels/copy_pad.hpp b/src/tuning/kernels/copy_pad.hpp index b39c0318..e612ca9e 100644 --- a/src/tuning/kernels/copy_pad.hpp +++ b/src/tuning/kernels/copy_pad.hpp @@ -21,7 +21,7 @@ namespace clblast { // ================================================================================================= // Settings for this kernel (default command-line arguments) -TunerDefaults GetTunerDefaults(const int) { +TunerDefaults PadGetTunerDefaults(const int) { auto settings = TunerDefaults(); settings.options = {kArgM, kArgN, kArgAlpha}; settings.default_m = 1024; @@ -31,7 +31,7 @@ TunerDefaults GetTunerDefaults(const int) { // Settings for this kernel (general) template -TunerSettings GetTunerSettings(const int, const Arguments &args) { +TunerSettings PadGetTunerSettings(const int, const Arguments &args) { auto settings = TunerSettings(); // Identification of the kernel @@ -77,12 +77,12 @@ TunerSettings GetTunerSettings(const int, const Arguments &args) { // Tests for valid arguments template -void TestValidArguments(const int, const Arguments &) { } -std::vector SetConstraints(const int) { return {}; } +void PadTestValidArguments(const int, const Arguments &) { } +std::vector PadSetConstraints(const int) { return {}; } // Sets the kernel's arguments template -void SetArguments(const int, Kernel &kernel, const Arguments &args, std::vector>& buffers) { +void PadSetArguments(const int, Kernel &kernel, const Arguments &args, std::vector>& buffers) { kernel.SetArgument(0, static_cast(args.m)); kernel.SetArgument(1, static_cast(args.n)); kernel.SetArgument(2, static_cast(args.m)); diff --git a/src/tuning/kernels/invert.cpp b/src/tuning/kernels/invert.cpp index ecd51199..3dfeb508 100644 --- a/src/tuning/kernels/invert.cpp +++ b/src/tuning/kernels/invert.cpp @@ -22,11 +22,11 @@ using double2 = clblast::double2; int main(int argc, char *argv[]) { const auto command_line_args = clblast::RetrieveCommandLineArguments(argc, argv); switch(clblast::GetPrecision(command_line_args)) { - case clblast::Precision::kHalf: clblast::Tuner(argc, argv, 0, clblast::GetTunerDefaults, clblast::GetTunerSettings, clblast::TestValidArguments, clblast::SetConstraints, clblast::SetArguments); break; - case clblast::Precision::kSingle: clblast::Tuner(argc, argv, 0, clblast::GetTunerDefaults, clblast::GetTunerSettings, clblast::TestValidArguments, clblast::SetConstraints, clblast::SetArguments); break; - case clblast::Precision::kDouble: clblast::Tuner(argc, argv, 0, clblast::GetTunerDefaults, clblast::GetTunerSettings, clblast::TestValidArguments, clblast::SetConstraints, clblast::SetArguments); break; - case clblast::Precision::kComplexSingle: clblast::Tuner(argc, argv, 0, clblast::GetTunerDefaults, clblast::GetTunerSettings, clblast::TestValidArguments, clblast::SetConstraints, clblast::SetArguments); break; - case clblast::Precision::kComplexDouble: clblast::Tuner(argc, argv, 0, clblast::GetTunerDefaults, clblast::GetTunerSettings, clblast::TestValidArguments, clblast::SetConstraints, clblast::SetArguments); break; + case clblast::Precision::kHalf: clblast::Tuner(argc, argv, 0, clblast::InvertGetTunerDefaults, clblast::InvertGetTunerSettings, clblast::InvertTestValidArguments, clblast::InvertSetConstraints, clblast::InvertSetArguments); break; + case clblast::Precision::kSingle: clblast::Tuner(argc, argv, 0, clblast::InvertGetTunerDefaults, clblast::InvertGetTunerSettings, clblast::InvertTestValidArguments, clblast::InvertSetConstraints, clblast::InvertSetArguments); break; + case clblast::Precision::kDouble: clblast::Tuner(argc, argv, 0, clblast::InvertGetTunerDefaults, clblast::InvertGetTunerSettings, clblast::InvertTestValidArguments, clblast::InvertSetConstraints, clblast::InvertSetArguments); break; + case clblast::Precision::kComplexSingle: clblast::Tuner(argc, argv, 0, clblast::InvertGetTunerDefaults, clblast::InvertGetTunerSettings, clblast::InvertTestValidArguments, clblast::InvertSetConstraints, clblast::InvertSetArguments); break; + case clblast::Precision::kComplexDouble: clblast::Tuner(argc, argv, 0, clblast::InvertGetTunerDefaults, clblast::InvertGetTunerSettings, clblast::InvertTestValidArguments, clblast::InvertSetConstraints, clblast::InvertSetArguments); break; } return 0; } diff --git a/src/tuning/kernels/invert.hpp b/src/tuning/kernels/invert.hpp index 0178a2aa..0a0c9ce2 100644 --- a/src/tuning/kernels/invert.hpp +++ b/src/tuning/kernels/invert.hpp @@ -21,7 +21,7 @@ namespace clblast { // ================================================================================================= // Settings for this kernel (default command-line arguments) -TunerDefaults GetTunerDefaults(const int) { +TunerDefaults InvertGetTunerDefaults(const int) { auto settings = TunerDefaults(); settings.options = {kArgN, kArgM, kArgK}; settings.default_n = 128; // dimension of input matrix 'n' @@ -32,7 +32,7 @@ TunerDefaults GetTunerDefaults(const int) { // Settings for this kernel (general) template -TunerSettings GetTunerSettings(const int, const Arguments &args) { +TunerSettings InvertGetTunerSettings(const int, const Arguments &args) { auto settings = TunerSettings(); // Identification of the kernel @@ -81,16 +81,16 @@ TunerSettings GetTunerSettings(const int, const Arguments &args) { // Tests for valid arguments template -void TestValidArguments(const int, const Arguments &args) { +void InvertTestValidArguments(const int, const Arguments &args) { if (!(args.k == 16)) { throw std::runtime_error("'TripleMatMul16Part1Lower' requires 'k' to be 16"); } } -std::vector SetConstraints(const int) { return {}; } +std::vector InvertSetConstraints(const int) { return {}; } // Sets the kernel's arguments template -void SetArguments(const int, Kernel &kernel, const Arguments &args, std::vector>& buffers) { +void InvertSetArguments(const int, Kernel &kernel, const Arguments &args, std::vector>& buffers) { const auto num_pages = CeilDiv(args.n, args.k * 2); // CeilDiv(n, current_size*2) kernel.SetArgument(0, static_cast(args.n)); // n kernel.SetArgument(1, buffers[2]()); // 2 == A matrix diff --git a/src/tuning/kernels/transpose_fast.cpp b/src/tuning/kernels/transpose_fast.cpp index 2144f23f..6b37a31d 100644 --- a/src/tuning/kernels/transpose_fast.cpp +++ b/src/tuning/kernels/transpose_fast.cpp @@ -22,11 +22,11 @@ using double2 = clblast::double2; int main(int argc, char *argv[]) { const auto command_line_args = clblast::RetrieveCommandLineArguments(argc, argv); switch(clblast::GetPrecision(command_line_args)) { - case clblast::Precision::kHalf: clblast::Tuner(argc, argv, 0, clblast::GetTunerDefaults, clblast::GetTunerSettings, clblast::TestValidArguments, clblast::SetConstraints, clblast::SetArguments); break; - case clblast::Precision::kSingle: clblast::Tuner(argc, argv, 0, clblast::GetTunerDefaults, clblast::GetTunerSettings, clblast::TestValidArguments, clblast::SetConstraints, clblast::SetArguments); break; - case clblast::Precision::kDouble: clblast::Tuner(argc, argv, 0, clblast::GetTunerDefaults, clblast::GetTunerSettings, clblast::TestValidArguments, clblast::SetConstraints, clblast::SetArguments); break; - case clblast::Precision::kComplexSingle: clblast::Tuner(argc, argv, 0, clblast::GetTunerDefaults, clblast::GetTunerSettings, clblast::TestValidArguments, clblast::SetConstraints, clblast::SetArguments); break; - case clblast::Precision::kComplexDouble: clblast::Tuner(argc, argv, 0, clblast::GetTunerDefaults, clblast::GetTunerSettings, clblast::TestValidArguments, clblast::SetConstraints, clblast::SetArguments); break; + case clblast::Precision::kHalf: clblast::Tuner(argc, argv, 0, clblast::TransposeGetTunerDefaults, clblast::TransposeGetTunerSettings, clblast::TransposeTestValidArguments, clblast::TransposeSetConstraints, clblast::TransposeSetArguments); break; + case clblast::Precision::kSingle: clblast::Tuner(argc, argv, 0, clblast::TransposeGetTunerDefaults, clblast::TransposeGetTunerSettings, clblast::TransposeTestValidArguments, clblast::TransposeSetConstraints, clblast::TransposeSetArguments); break; + case clblast::Precision::kDouble: clblast::Tuner(argc, argv, 0, clblast::TransposeGetTunerDefaults, clblast::TransposeGetTunerSettings, clblast::TransposeTestValidArguments, clblast::TransposeSetConstraints, clblast::TransposeSetArguments); break; + case clblast::Precision::kComplexSingle: clblast::Tuner(argc, argv, 0, clblast::TransposeGetTunerDefaults, clblast::TransposeGetTunerSettings, clblast::TransposeTestValidArguments, clblast::TransposeSetConstraints, clblast::TransposeSetArguments); break; + case clblast::Precision::kComplexDouble: clblast::Tuner(argc, argv, 0, clblast::TransposeGetTunerDefaults, clblast::TransposeGetTunerSettings, clblast::TransposeTestValidArguments, clblast::TransposeSetConstraints, clblast::TransposeSetArguments); break; } return 0; } diff --git a/src/tuning/kernels/transpose_fast.hpp b/src/tuning/kernels/transpose_fast.hpp index 47859f7a..e8917ad2 100644 --- a/src/tuning/kernels/transpose_fast.hpp +++ b/src/tuning/kernels/transpose_fast.hpp @@ -21,7 +21,7 @@ namespace clblast { // ================================================================================================= // Settings for this kernel (default command-line arguments) -TunerDefaults GetTunerDefaults(const int) { +TunerDefaults TransposeGetTunerDefaults(const int) { auto settings = TunerDefaults(); settings.options = {kArgM, kArgN, kArgAlpha}; settings.default_m = 1024; @@ -31,7 +31,7 @@ TunerDefaults GetTunerDefaults(const int) { // Settings for this kernel (general) template -TunerSettings GetTunerSettings(const int, const Arguments &args) { +TunerSettings TransposeGetTunerSettings(const int, const Arguments &args) { auto settings = TunerSettings(); // Identification of the kernel @@ -77,12 +77,12 @@ TunerSettings GetTunerSettings(const int, const Arguments &args) { // Tests for valid arguments template -void TestValidArguments(const int, const Arguments &) { } -std::vector SetConstraints(const int) { return {}; } +void TransposeTestValidArguments(const int, const Arguments &) { } +std::vector TransposeSetConstraints(const int) { return {}; } // Sets the kernel's arguments template -void SetArguments(const int, Kernel &kernel, const Arguments &args, std::vector>& buffers) { +void TransposeSetArguments(const int, Kernel &kernel, const Arguments &args, std::vector>& buffers) { kernel.SetArgument(0, static_cast(args.m)); kernel.SetArgument(1, buffers[2]()); // 2 == A matrix kernel.SetArgument(2, buffers[3]()); // 3 == B matrix diff --git a/src/tuning/kernels/transpose_pad.cpp b/src/tuning/kernels/transpose_pad.cpp index ce39d857..fc7244f6 100644 --- a/src/tuning/kernels/transpose_pad.cpp +++ b/src/tuning/kernels/transpose_pad.cpp @@ -22,11 +22,11 @@ using double2 = clblast::double2; int main(int argc, char *argv[]) { const auto command_line_args = clblast::RetrieveCommandLineArguments(argc, argv); switch(clblast::GetPrecision(command_line_args)) { - case clblast::Precision::kHalf: clblast::Tuner(argc, argv, 0, clblast::GetTunerDefaults, clblast::GetTunerSettings, clblast::TestValidArguments, clblast::SetConstraints, clblast::SetArguments); break; - case clblast::Precision::kSingle: clblast::Tuner(argc, argv, 0, clblast::GetTunerDefaults, clblast::GetTunerSettings, clblast::TestValidArguments, clblast::SetConstraints, clblast::SetArguments); break; - case clblast::Precision::kDouble: clblast::Tuner(argc, argv, 0, clblast::GetTunerDefaults, clblast::GetTunerSettings, clblast::TestValidArguments, clblast::SetConstraints, clblast::SetArguments); break; - case clblast::Precision::kComplexSingle: clblast::Tuner(argc, argv, 0, clblast::GetTunerDefaults, clblast::GetTunerSettings, clblast::TestValidArguments, clblast::SetConstraints, clblast::SetArguments); break; - case clblast::Precision::kComplexDouble: clblast::Tuner(argc, argv, 0, clblast::GetTunerDefaults, clblast::GetTunerSettings, clblast::TestValidArguments, clblast::SetConstraints, clblast::SetArguments); break; + case clblast::Precision::kHalf: clblast::Tuner(argc, argv, 0, clblast::PadtransposeGetTunerDefaults, clblast::PadtransposeGetTunerSettings, clblast::PadtransposeTestValidArguments, clblast::PadtransposeSetConstraints, clblast::PadtransposeSetArguments); break; + case clblast::Precision::kSingle: clblast::Tuner(argc, argv, 0, clblast::PadtransposeGetTunerDefaults, clblast::PadtransposeGetTunerSettings, clblast::PadtransposeTestValidArguments, clblast::PadtransposeSetConstraints, clblast::PadtransposeSetArguments); break; + case clblast::Precision::kDouble: clblast::Tuner(argc, argv, 0, clblast::PadtransposeGetTunerDefaults, clblast::PadtransposeGetTunerSettings, clblast::PadtransposeTestValidArguments, clblast::PadtransposeSetConstraints, clblast::PadtransposeSetArguments); break; + case clblast::Precision::kComplexSingle: clblast::Tuner(argc, argv, 0, clblast::PadtransposeGetTunerDefaults, clblast::PadtransposeGetTunerSettings, clblast::PadtransposeTestValidArguments, clblast::PadtransposeSetConstraints, clblast::PadtransposeSetArguments); break; + case clblast::Precision::kComplexDouble: clblast::Tuner(argc, argv, 0, clblast::PadtransposeGetTunerDefaults, clblast::PadtransposeGetTunerSettings, clblast::PadtransposeTestValidArguments, clblast::PadtransposeSetConstraints, clblast::PadtransposeSetArguments); break; } return 0; } diff --git a/src/tuning/kernels/transpose_pad.hpp b/src/tuning/kernels/transpose_pad.hpp index c9ce983e..8d24a0dc 100644 --- a/src/tuning/kernels/transpose_pad.hpp +++ b/src/tuning/kernels/transpose_pad.hpp @@ -21,7 +21,7 @@ namespace clblast { // ================================================================================================= // Settings for this kernel (default command-line arguments) -TunerDefaults GetTunerDefaults(const int) { +TunerDefaults PadtransposeGetTunerDefaults(const int) { auto settings = TunerDefaults(); settings.options = {kArgM, kArgN, kArgAlpha}; settings.default_m = 1024; @@ -31,7 +31,7 @@ TunerDefaults GetTunerDefaults(const int) { // Settings for this kernel (general) template -TunerSettings GetTunerSettings(const int, const Arguments &args) { +TunerSettings PadtransposeGetTunerSettings(const int, const Arguments &args) { auto settings = TunerSettings(); // Identification of the kernel @@ -76,12 +76,12 @@ TunerSettings GetTunerSettings(const int, const Arguments &args) { // Tests for valid arguments template -void TestValidArguments(const int, const Arguments &) { } -std::vector SetConstraints(const int) { return {}; } +void PadtransposeTestValidArguments(const int, const Arguments &) { } +std::vector PadtransposeSetConstraints(const int) { return {}; } // Sets the kernel's arguments template -void SetArguments(const int, Kernel &kernel, const Arguments &args, std::vector>& buffers) { +void PadtransposeSetArguments(const int, Kernel &kernel, const Arguments &args, std::vector>& buffers) { kernel.SetArgument(0, static_cast(args.m)); kernel.SetArgument(1, static_cast(args.n)); kernel.SetArgument(2, static_cast(args.m)); diff --git a/src/tuning/kernels/xaxpy.cpp b/src/tuning/kernels/xaxpy.cpp index a290b6c1..6a95600d 100644 --- a/src/tuning/kernels/xaxpy.cpp +++ b/src/tuning/kernels/xaxpy.cpp @@ -22,11 +22,11 @@ using double2 = clblast::double2; int main(int argc, char *argv[]) { const auto command_line_args = clblast::RetrieveCommandLineArguments(argc, argv); switch(clblast::GetPrecision(command_line_args)) { - case clblast::Precision::kHalf: clblast::Tuner(argc, argv, 0, clblast::GetTunerDefaults, clblast::GetTunerSettings, clblast::TestValidArguments, clblast::SetConstraints, clblast::SetArguments); break; - case clblast::Precision::kSingle: clblast::Tuner(argc, argv, 0, clblast::GetTunerDefaults, clblast::GetTunerSettings, clblast::TestValidArguments, clblast::SetConstraints, clblast::SetArguments); break; - case clblast::Precision::kDouble: clblast::Tuner(argc, argv, 0, clblast::GetTunerDefaults, clblast::GetTunerSettings, clblast::TestValidArguments, clblast::SetConstraints, clblast::SetArguments); break; - case clblast::Precision::kComplexSingle: clblast::Tuner(argc, argv, 0, clblast::GetTunerDefaults, clblast::GetTunerSettings, clblast::TestValidArguments, clblast::SetConstraints, clblast::SetArguments); break; - case clblast::Precision::kComplexDouble: clblast::Tuner(argc, argv, 0, clblast::GetTunerDefaults, clblast::GetTunerSettings, clblast::TestValidArguments, clblast::SetConstraints, clblast::SetArguments); break; + case clblast::Precision::kHalf: clblast::Tuner(argc, argv, 0, clblast::XaxpyGetTunerDefaults, clblast::XaxpyGetTunerSettings, clblast::XaxpyTestValidArguments, clblast::XaxpySetConstraints, clblast::XaxpySetArguments); break; + case clblast::Precision::kSingle: clblast::Tuner(argc, argv, 0, clblast::XaxpyGetTunerDefaults, clblast::XaxpyGetTunerSettings, clblast::XaxpyTestValidArguments, clblast::XaxpySetConstraints, clblast::XaxpySetArguments); break; + case clblast::Precision::kDouble: clblast::Tuner(argc, argv, 0, clblast::XaxpyGetTunerDefaults, clblast::XaxpyGetTunerSettings, clblast::XaxpyTestValidArguments, clblast::XaxpySetConstraints, clblast::XaxpySetArguments); break; + case clblast::Precision::kComplexSingle: clblast::Tuner(argc, argv, 0, clblast::XaxpyGetTunerDefaults, clblast::XaxpyGetTunerSettings, clblast::XaxpyTestValidArguments, clblast::XaxpySetConstraints, clblast::XaxpySetArguments); break; + case clblast::Precision::kComplexDouble: clblast::Tuner(argc, argv, 0, clblast::XaxpyGetTunerDefaults, clblast::XaxpyGetTunerSettings, clblast::XaxpyTestValidArguments, clblast::XaxpySetConstraints, clblast::XaxpySetArguments); break; } return 0; } diff --git a/src/tuning/kernels/xaxpy.hpp b/src/tuning/kernels/xaxpy.hpp index 266a671b..24550ed9 100644 --- a/src/tuning/kernels/xaxpy.hpp +++ b/src/tuning/kernels/xaxpy.hpp @@ -21,7 +21,7 @@ namespace clblast { // ================================================================================================= // Settings for this kernel (default command-line arguments) -TunerDefaults GetTunerDefaults(const int) { +TunerDefaults XaxpyGetTunerDefaults(const int) { auto settings = TunerDefaults(); settings.options = {kArgN, kArgAlpha}; settings.default_n = 4096*1024; @@ -30,7 +30,7 @@ TunerDefaults GetTunerDefaults(const int) { // Settings for this kernel (general) template -TunerSettings GetTunerSettings(const int, const Arguments &args) { +TunerSettings XaxpyGetTunerSettings(const int, const Arguments &args) { auto settings = TunerSettings(); // Identification of the kernel @@ -75,16 +75,16 @@ TunerSettings GetTunerSettings(const int, const Arguments &args) { // Tests for valid arguments template -void TestValidArguments(const int, const Arguments &args) { +void XaxpyTestValidArguments(const int, const Arguments &args) { if (!IsMultiple(args.n, 64)) { throw std::runtime_error("'XaxpyFastest' requires 'n' to be a multiple of WGS*WPT*VW"); } } -std::vector SetConstraints(const int) { return {}; } +std::vector XaxpySetConstraints(const int) { return {}; } // Sets the kernel's arguments template -void SetArguments(const int, Kernel &kernel, const Arguments &args, std::vector>& buffers) { +void XaxpySetArguments(const int, Kernel &kernel, const Arguments &args, std::vector>& buffers) { kernel.SetArgument(0, static_cast(args.n)); kernel.SetArgument(1, GetRealArg(args.alpha)); kernel.SetArgument(2, buffers[0]()); // 0 == X vector diff --git a/src/tuning/kernels/xdot.cpp b/src/tuning/kernels/xdot.cpp index 10126392..6d10c4d8 100644 --- a/src/tuning/kernels/xdot.cpp +++ b/src/tuning/kernels/xdot.cpp @@ -24,11 +24,11 @@ template void StartVariation(int argc, char *argv[]) { const auto command_line_args = clblast::RetrieveCommandLineArguments(argc, argv); switch(clblast::GetPrecision(command_line_args)) { - case clblast::Precision::kHalf: clblast::Tuner(argc, argv, V, clblast::GetTunerDefaults, clblast::GetTunerSettings, clblast::TestValidArguments, clblast::SetConstraints, clblast::SetArguments); break; - case clblast::Precision::kSingle: clblast::Tuner(argc, argv, V, clblast::GetTunerDefaults, clblast::GetTunerSettings, clblast::TestValidArguments, clblast::SetConstraints, clblast::SetArguments); break; - case clblast::Precision::kDouble: clblast::Tuner(argc, argv, V, clblast::GetTunerDefaults, clblast::GetTunerSettings, clblast::TestValidArguments, clblast::SetConstraints, clblast::SetArguments); break; - case clblast::Precision::kComplexSingle: clblast::Tuner(argc, argv, V, clblast::GetTunerDefaults, clblast::GetTunerSettings, clblast::TestValidArguments, clblast::SetConstraints, clblast::SetArguments); break; - case clblast::Precision::kComplexDouble: clblast::Tuner(argc, argv, V, clblast::GetTunerDefaults, clblast::GetTunerSettings, clblast::TestValidArguments, clblast::SetConstraints, clblast::SetArguments); break; + case clblast::Precision::kHalf: clblast::Tuner(argc, argv, V, clblast::XdotGetTunerDefaults, clblast::XdotGetTunerSettings, clblast::XdotTestValidArguments, clblast::XdotSetConstraints, clblast::XdotSetArguments); break; + case clblast::Precision::kSingle: clblast::Tuner(argc, argv, V, clblast::XdotGetTunerDefaults, clblast::XdotGetTunerSettings, clblast::XdotTestValidArguments, clblast::XdotSetConstraints, clblast::XdotSetArguments); break; + case clblast::Precision::kDouble: clblast::Tuner(argc, argv, V, clblast::XdotGetTunerDefaults, clblast::XdotGetTunerSettings, clblast::XdotTestValidArguments, clblast::XdotSetConstraints, clblast::XdotSetArguments); break; + case clblast::Precision::kComplexSingle: clblast::Tuner(argc, argv, V, clblast::XdotGetTunerDefaults, clblast::XdotGetTunerSettings, clblast::XdotTestValidArguments, clblast::XdotSetConstraints, clblast::XdotSetArguments); break; + case clblast::Precision::kComplexDouble: clblast::Tuner(argc, argv, V, clblast::XdotGetTunerDefaults, clblast::XdotGetTunerSettings, clblast::XdotTestValidArguments, clblast::XdotSetConstraints, clblast::XdotSetArguments); break; } } diff --git a/src/tuning/kernels/xdot.hpp b/src/tuning/kernels/xdot.hpp index 456baea4..15673c79 100644 --- a/src/tuning/kernels/xdot.hpp +++ b/src/tuning/kernels/xdot.hpp @@ -22,7 +22,7 @@ namespace clblast { // ================================================================================================= // Settings for this kernel (default command-line arguments) -TunerDefaults GetTunerDefaults(const int) { +TunerDefaults XdotGetTunerDefaults(const int) { auto settings = TunerDefaults(); settings.options = {kArgN}; settings.default_n = 2*1024*1024; @@ -31,7 +31,7 @@ TunerDefaults GetTunerDefaults(const int) { // Settings for this kernel (general) template -TunerSettings GetTunerSettings(const int V, const Arguments &args) { +TunerSettings XdotGetTunerSettings(const int V, const Arguments &args) { auto settings = TunerSettings(); // Identification of the kernel @@ -74,12 +74,12 @@ TunerSettings GetTunerSettings(const int V, const Arguments &args) { // Tests for valid arguments template -void TestValidArguments(const int, const Arguments &) { } -std::vector SetConstraints(const int) { return {}; } +void XdotTestValidArguments(const int, const Arguments &) { } +std::vector XdotSetConstraints(const int) { return {}; } // Sets the kernel's arguments template -void SetArguments(const int V, Kernel &kernel, const Arguments &args, std::vector>& buffers) { +void XdotSetArguments(const int V, Kernel &kernel, const Arguments &args, std::vector>& buffers) { if (V == 1) { kernel.SetArgument(0, static_cast(args.n)); kernel.SetArgument(1, buffers[0]()); // 0 == X vector diff --git a/src/tuning/kernels/xgemm.cpp b/src/tuning/kernels/xgemm.cpp index f388c76c..d365ce6d 100644 --- a/src/tuning/kernels/xgemm.cpp +++ b/src/tuning/kernels/xgemm.cpp @@ -23,11 +23,11 @@ template void StartVariation(int argc, char *argv[]) { const auto command_line_args = clblast::RetrieveCommandLineArguments(argc, argv); switch(clblast::GetPrecision(command_line_args)) { - case clblast::Precision::kHalf: clblast::Tuner(argc, argv, V, clblast::GetTunerDefaults, clblast::GetTunerSettings, clblast::TestValidArguments, clblast::SetConstraints, clblast::SetArguments); break; - case clblast::Precision::kSingle: clblast::Tuner(argc, argv, V, clblast::GetTunerDefaults, clblast::GetTunerSettings, clblast::TestValidArguments, clblast::SetConstraints, clblast::SetArguments); break; - case clblast::Precision::kDouble: clblast::Tuner(argc, argv, V, clblast::GetTunerDefaults, clblast::GetTunerSettings, clblast::TestValidArguments, clblast::SetConstraints, clblast::SetArguments); break; - case clblast::Precision::kComplexSingle: clblast::Tuner(argc, argv, V, clblast::GetTunerDefaults, clblast::GetTunerSettings, clblast::TestValidArguments, clblast::SetConstraints, clblast::SetArguments); break; - case clblast::Precision::kComplexDouble: clblast::Tuner(argc, argv, V, clblast::GetTunerDefaults, clblast::GetTunerSettings, clblast::TestValidArguments, clblast::SetConstraints, clblast::SetArguments); break; + case clblast::Precision::kHalf: clblast::Tuner(argc, argv, V, clblast::XgemmGetTunerDefaults, clblast::XgemmGetTunerSettings, clblast::XgemmTestValidArguments, clblast::XgemmSetConstraints, clblast::XgemmSetArguments); break; + case clblast::Precision::kSingle: clblast::Tuner(argc, argv, V, clblast::XgemmGetTunerDefaults, clblast::XgemmGetTunerSettings, clblast::XgemmTestValidArguments, clblast::XgemmSetConstraints, clblast::XgemmSetArguments); break; + case clblast::Precision::kDouble: clblast::Tuner(argc, argv, V, clblast::XgemmGetTunerDefaults, clblast::XgemmGetTunerSettings, clblast::XgemmTestValidArguments, clblast::XgemmSetConstraints, clblast::XgemmSetArguments); break; + case clblast::Precision::kComplexSingle: clblast::Tuner(argc, argv, V, clblast::XgemmGetTunerDefaults, clblast::XgemmGetTunerSettings, clblast::XgemmTestValidArguments, clblast::XgemmSetConstraints, clblast::XgemmSetArguments); break; + case clblast::Precision::kComplexDouble: clblast::Tuner(argc, argv, V, clblast::XgemmGetTunerDefaults, clblast::XgemmGetTunerSettings, clblast::XgemmTestValidArguments, clblast::XgemmSetConstraints, clblast::XgemmSetArguments); break; } } diff --git a/src/tuning/kernels/xgemm.hpp b/src/tuning/kernels/xgemm.hpp index 09ebe91d..66e197e1 100644 --- a/src/tuning/kernels/xgemm.hpp +++ b/src/tuning/kernels/xgemm.hpp @@ -23,7 +23,7 @@ namespace clblast { // ================================================================================================= // Settings for this kernel (default command-line arguments) -TunerDefaults GetTunerDefaults(const int V) { +TunerDefaults XgemmGetTunerDefaults(const int V) { auto settings = TunerDefaults(); settings.options = {kArgM, kArgN, kArgK, kArgAlpha, kArgBeta, kArgFraction, kArgHeuristicSelection, kArgPsoSwarmSize, @@ -38,7 +38,7 @@ TunerDefaults GetTunerDefaults(const int V) { // Settings for this kernel (general) template -TunerSettings GetTunerSettings(const int V, const Arguments &args) { +TunerSettings XgemmGetTunerSettings(const int V, const Arguments &args) { auto settings = TunerSettings(); // Identification of the kernel @@ -118,8 +118,8 @@ TunerSettings GetTunerSettings(const int V, const Arguments &args) { // Tests for valid arguments template -void TestValidArguments(const int, const Arguments &) { } -std::vector SetConstraints(const int V) { +void XgemmTestValidArguments(const int, const Arguments &) { } +std::vector XgemmSetConstraints(const int V) { auto constraints = std::vector(); auto MultipleOfX = [] (std::vector v) { return IsMultiple(v[0], v[1]); }; auto MultipleOfXMulY = [] (std::vector v) { return IsMultiple(v[0], v[1]*v[2]); }; @@ -148,7 +148,7 @@ std::vector SetConstraints(const int V) { // Sets the kernel's arguments template -void SetArguments(const int, Kernel &kernel, const Arguments &args, std::vector>& buffers) { +void XgemmSetArguments(const int, Kernel &kernel, const Arguments &args, std::vector>& buffers) { kernel.SetArgument(0, static_cast(args.m)); kernel.SetArgument(1, static_cast(args.n)); kernel.SetArgument(2, static_cast(args.k)); diff --git a/src/tuning/kernels/xgemm_direct.cpp b/src/tuning/kernels/xgemm_direct.cpp index b059ad62..7298a6c3 100644 --- a/src/tuning/kernels/xgemm_direct.cpp +++ b/src/tuning/kernels/xgemm_direct.cpp @@ -23,11 +23,11 @@ template void StartVariation(int argc, char *argv[]) { const auto command_line_args = clblast::RetrieveCommandLineArguments(argc, argv); switch(clblast::GetPrecision(command_line_args)) { - case clblast::Precision::kHalf: clblast::Tuner(argc, argv, V, clblast::GetTunerDefaults, clblast::GetTunerSettings, clblast::TestValidArguments, clblast::SetConstraints, clblast::SetArguments); break; - case clblast::Precision::kSingle: clblast::Tuner(argc, argv, V, clblast::GetTunerDefaults, clblast::GetTunerSettings, clblast::TestValidArguments, clblast::SetConstraints, clblast::SetArguments); break; - case clblast::Precision::kDouble: clblast::Tuner(argc, argv, V, clblast::GetTunerDefaults, clblast::GetTunerSettings, clblast::TestValidArguments, clblast::SetConstraints, clblast::SetArguments); break; - case clblast::Precision::kComplexSingle: clblast::Tuner(argc, argv, V, clblast::GetTunerDefaults, clblast::GetTunerSettings, clblast::TestValidArguments, clblast::SetConstraints, clblast::SetArguments); break; - case clblast::Precision::kComplexDouble: clblast::Tuner(argc, argv, V, clblast::GetTunerDefaults, clblast::GetTunerSettings, clblast::TestValidArguments, clblast::SetConstraints, clblast::SetArguments); break; + case clblast::Precision::kHalf: clblast::Tuner(argc, argv, V, clblast::XgemmDirectGetTunerDefaults, clblast::XgemmDirectGetTunerSettings, clblast::XgemmDirectTestValidArguments, clblast::XgemmDirectSetConstraints, clblast::XgemmDirectSetArguments); break; + case clblast::Precision::kSingle: clblast::Tuner(argc, argv, V, clblast::XgemmDirectGetTunerDefaults, clblast::XgemmDirectGetTunerSettings, clblast::XgemmDirectTestValidArguments, clblast::XgemmDirectSetConstraints, clblast::XgemmDirectSetArguments); break; + case clblast::Precision::kDouble: clblast::Tuner(argc, argv, V, clblast::XgemmDirectGetTunerDefaults, clblast::XgemmDirectGetTunerSettings, clblast::XgemmDirectTestValidArguments, clblast::XgemmDirectSetConstraints, clblast::XgemmDirectSetArguments); break; + case clblast::Precision::kComplexSingle: clblast::Tuner(argc, argv, V, clblast::XgemmDirectGetTunerDefaults, clblast::XgemmDirectGetTunerSettings, clblast::XgemmDirectTestValidArguments, clblast::XgemmDirectSetConstraints, clblast::XgemmDirectSetArguments); break; + case clblast::Precision::kComplexDouble: clblast::Tuner(argc, argv, V, clblast::XgemmDirectGetTunerDefaults, clblast::XgemmDirectGetTunerSettings, clblast::XgemmDirectTestValidArguments, clblast::XgemmDirectSetConstraints, clblast::XgemmDirectSetArguments); break; } } diff --git a/src/tuning/kernels/xgemm_direct.hpp b/src/tuning/kernels/xgemm_direct.hpp index 7cc9f654..ecb10bc6 100644 --- a/src/tuning/kernels/xgemm_direct.hpp +++ b/src/tuning/kernels/xgemm_direct.hpp @@ -23,7 +23,7 @@ namespace clblast { // ================================================================================================= // Settings for this kernel (default command-line arguments) -TunerDefaults GetTunerDefaults(const int V) { +TunerDefaults XgemmDirectGetTunerDefaults(const int V) { auto settings = TunerDefaults(); settings.options = {kArgM, kArgN, kArgK, kArgAlpha, kArgBeta, kArgFraction, kArgHeuristicSelection, kArgPsoSwarmSize, @@ -38,7 +38,7 @@ TunerDefaults GetTunerDefaults(const int V) { // Settings for this kernel (general) template -TunerSettings GetTunerSettings(const int V, const Arguments &args) { +TunerSettings XgemmDirectGetTunerSettings(const int V, const Arguments &args) { auto settings = TunerSettings(); // Identification of the kernel @@ -109,8 +109,8 @@ TunerSettings GetTunerSettings(const int V, const Arguments &args) { // Tests for valid arguments template -void TestValidArguments(const int, const Arguments &) { } -std::vector SetConstraints(const int V) { +void XgemmDirectTestValidArguments(const int, const Arguments &) { } +std::vector XgemmDirectSetConstraints(const int V) { auto constraints = std::vector(); auto MultipleOfX = [] (std::vector v) { return IsMultiple(v[0], v[1]); }; auto MultipleOfXMulY = [] (std::vector v) { return IsMultiple(v[0], v[1]*v[2]); }; @@ -138,7 +138,7 @@ std::vector SetConstraints(const int V) { // Sets the kernel's arguments template -void SetArguments(const int, Kernel &kernel, const Arguments &args, std::vector>& buffers) { +void XgemmDirectSetArguments(const int, Kernel &kernel, const Arguments &args, std::vector>& buffers) { kernel.SetArgument(0, static_cast(args.m)); kernel.SetArgument(1, static_cast(args.n)); kernel.SetArgument(2, static_cast(args.k)); diff --git a/src/tuning/kernels/xgemv.cpp b/src/tuning/kernels/xgemv.cpp index 165c5628..9e45d73f 100644 --- a/src/tuning/kernels/xgemv.cpp +++ b/src/tuning/kernels/xgemv.cpp @@ -23,11 +23,11 @@ template void StartVariation(int argc, char *argv[]) { const auto command_line_args = clblast::RetrieveCommandLineArguments(argc, argv); switch(clblast::GetPrecision(command_line_args)) { - case clblast::Precision::kHalf: clblast::Tuner(argc, argv, V, clblast::GetTunerDefaults, clblast::GetTunerSettings, clblast::TestValidArguments, clblast::SetConstraints, clblast::SetArguments); break; - case clblast::Precision::kSingle: clblast::Tuner(argc, argv, V, clblast::GetTunerDefaults, clblast::GetTunerSettings, clblast::TestValidArguments, clblast::SetConstraints, clblast::SetArguments); break; - case clblast::Precision::kDouble: clblast::Tuner(argc, argv, V, clblast::GetTunerDefaults, clblast::GetTunerSettings, clblast::TestValidArguments, clblast::SetConstraints, clblast::SetArguments); break; - case clblast::Precision::kComplexSingle: clblast::Tuner(argc, argv, V, clblast::GetTunerDefaults, clblast::GetTunerSettings, clblast::TestValidArguments, clblast::SetConstraints, clblast::SetArguments); break; - case clblast::Precision::kComplexDouble: clblast::Tuner(argc, argv, V, clblast::GetTunerDefaults, clblast::GetTunerSettings, clblast::TestValidArguments, clblast::SetConstraints, clblast::SetArguments); break; + case clblast::Precision::kHalf: clblast::Tuner(argc, argv, V, clblast::XgemvGetTunerDefaults, clblast::XgemvGetTunerSettings, clblast::XgemvTestValidArguments, clblast::XgemvSetConstraints, clblast::XgemvSetArguments); break; + case clblast::Precision::kSingle: clblast::Tuner(argc, argv, V, clblast::XgemvGetTunerDefaults, clblast::XgemvGetTunerSettings, clblast::XgemvTestValidArguments, clblast::XgemvSetConstraints, clblast::XgemvSetArguments); break; + case clblast::Precision::kDouble: clblast::Tuner(argc, argv, V, clblast::XgemvGetTunerDefaults, clblast::XgemvGetTunerSettings, clblast::XgemvTestValidArguments, clblast::XgemvSetConstraints, clblast::XgemvSetArguments); break; + case clblast::Precision::kComplexSingle: clblast::Tuner(argc, argv, V, clblast::XgemvGetTunerDefaults, clblast::XgemvGetTunerSettings, clblast::XgemvTestValidArguments, clblast::XgemvSetConstraints, clblast::XgemvSetArguments); break; + case clblast::Precision::kComplexDouble: clblast::Tuner(argc, argv, V, clblast::XgemvGetTunerDefaults, clblast::XgemvGetTunerSettings, clblast::XgemvTestValidArguments, clblast::XgemvSetConstraints, clblast::XgemvSetArguments); break; } } diff --git a/src/tuning/kernels/xgemv.hpp b/src/tuning/kernels/xgemv.hpp index 87186195..e44efe32 100644 --- a/src/tuning/kernels/xgemv.hpp +++ b/src/tuning/kernels/xgemv.hpp @@ -24,7 +24,7 @@ namespace clblast { // ================================================================================================= // Settings for this kernel (default command-line arguments) -TunerDefaults GetTunerDefaults(const int) { +TunerDefaults XgemvGetTunerDefaults(const int) { auto settings = TunerDefaults(); settings.options = {kArgM, kArgN, kArgAlpha, kArgBeta}; settings.default_m = 2048; @@ -35,7 +35,7 @@ TunerDefaults GetTunerDefaults(const int) { // Settings for this kernel (general) template -TunerSettings GetTunerSettings(const int V, const Arguments &args) { +TunerSettings XgemvGetTunerSettings(const int V, const Arguments &args) { auto settings = TunerSettings(); // Identification of the kernel @@ -96,8 +96,8 @@ TunerSettings GetTunerSettings(const int V, const Arguments &args) { // Tests for valid arguments template -void TestValidArguments(const int, const Arguments &) { } -std::vector SetConstraints(const int V) { +void XgemvTestValidArguments(const int, const Arguments &) { } +std::vector XgemvSetConstraints(const int V) { auto constraints = std::vector(); if (V==2 || V==3) { auto MultipleOfX = [] (std::vector v) { return IsMultiple(v[0], v[1]); }; @@ -112,7 +112,7 @@ std::vector SetConstraints(const int V) { // Sets the kernel's arguments template -void SetArguments(const int V, Kernel &kernel, const Arguments &args, std::vector>& buffers) { +void XgemvSetArguments(const int V, Kernel &kernel, const Arguments &args, std::vector>& buffers) { auto a_rotated = (V==3) ? 1 : 0; kernel.SetArgument(0, static_cast(args.m)); kernel.SetArgument(1, static_cast(args.n)); diff --git a/src/tuning/kernels/xger.cpp b/src/tuning/kernels/xger.cpp index 8a90f340..6dfc9ffa 100644 --- a/src/tuning/kernels/xger.cpp +++ b/src/tuning/kernels/xger.cpp @@ -22,11 +22,11 @@ using double2 = clblast::double2; int main(int argc, char *argv[]) { const auto command_line_args = clblast::RetrieveCommandLineArguments(argc, argv); switch(clblast::GetPrecision(command_line_args)) { - case clblast::Precision::kHalf: clblast::Tuner(argc, argv, 0, clblast::GetTunerDefaults, clblast::GetTunerSettings, clblast::TestValidArguments, clblast::SetConstraints, clblast::SetArguments); break; - case clblast::Precision::kSingle: clblast::Tuner(argc, argv, 0, clblast::GetTunerDefaults, clblast::GetTunerSettings, clblast::TestValidArguments, clblast::SetConstraints, clblast::SetArguments); break; - case clblast::Precision::kDouble: clblast::Tuner(argc, argv, 0, clblast::GetTunerDefaults, clblast::GetTunerSettings, clblast::TestValidArguments, clblast::SetConstraints, clblast::SetArguments); break; - case clblast::Precision::kComplexSingle: clblast::Tuner(argc, argv, 0, clblast::GetTunerDefaults, clblast::GetTunerSettings, clblast::TestValidArguments, clblast::SetConstraints, clblast::SetArguments); break; - case clblast::Precision::kComplexDouble: clblast::Tuner(argc, argv, 0, clblast::GetTunerDefaults, clblast::GetTunerSettings, clblast::TestValidArguments, clblast::SetConstraints, clblast::SetArguments); break; + case clblast::Precision::kHalf: clblast::Tuner(argc, argv, 0, clblast::XgerGetTunerDefaults, clblast::XgerGetTunerSettings, clblast::XgerTestValidArguments, clblast::XgerSetConstraints, clblast::XgerSetArguments); break; + case clblast::Precision::kSingle: clblast::Tuner(argc, argv, 0, clblast::XgerGetTunerDefaults, clblast::XgerGetTunerSettings, clblast::XgerTestValidArguments, clblast::XgerSetConstraints, clblast::XgerSetArguments); break; + case clblast::Precision::kDouble: clblast::Tuner(argc, argv, 0, clblast::XgerGetTunerDefaults, clblast::XgerGetTunerSettings, clblast::XgerTestValidArguments, clblast::XgerSetConstraints, clblast::XgerSetArguments); break; + case clblast::Precision::kComplexSingle: clblast::Tuner(argc, argv, 0, clblast::XgerGetTunerDefaults, clblast::XgerGetTunerSettings, clblast::XgerTestValidArguments, clblast::XgerSetConstraints, clblast::XgerSetArguments); break; + case clblast::Precision::kComplexDouble: clblast::Tuner(argc, argv, 0, clblast::XgerGetTunerDefaults, clblast::XgerGetTunerSettings, clblast::XgerTestValidArguments, clblast::XgerSetConstraints, clblast::XgerSetArguments); break; } return 0; } diff --git a/src/tuning/kernels/xger.hpp b/src/tuning/kernels/xger.hpp index 01d85c9e..afd2f36e 100644 --- a/src/tuning/kernels/xger.hpp +++ b/src/tuning/kernels/xger.hpp @@ -21,7 +21,7 @@ namespace clblast { // ================================================================================================= // Settings for this kernel (default command-line arguments) -TunerDefaults GetTunerDefaults(const int) { +TunerDefaults XgerGetTunerDefaults(const int) { auto settings = TunerDefaults(); settings.options = {kArgM, kArgN, kArgAlpha}; settings.default_m = 1024; @@ -31,7 +31,7 @@ TunerDefaults GetTunerDefaults(const int) { // Settings for this kernel (general) template -TunerSettings GetTunerSettings(const int, const Arguments &args) { +TunerSettings XgerGetTunerSettings(const int, const Arguments &args) { auto settings = TunerSettings(); // Identification of the kernel @@ -77,12 +77,12 @@ TunerSettings GetTunerSettings(const int, const Arguments &args) { // Tests for valid arguments template -void TestValidArguments(const int, const Arguments &) { } -std::vector SetConstraints(const int) { return {}; } +void XgerTestValidArguments(const int, const Arguments &) { } +std::vector XgerSetConstraints(const int) { return {}; } // Sets the kernel's arguments template -void SetArguments(const int, Kernel &kernel, const Arguments &args, std::vector>& buffers) { +void XgerSetArguments(const int, Kernel &kernel, const Arguments &args, std::vector>& buffers) { kernel.SetArgument(0, static_cast(args.m)); kernel.SetArgument(1, static_cast(args.n)); kernel.SetArgument(2, GetRealArg(args.alpha)); -- cgit v1.2.3