From e3545215a54c096e1c889124a9076cfb2f42df17 Mon Sep 17 00:00:00 2001
From: Cedric Nugteren
Date: Sun, 28 Feb 2016 14:16:48 +0100
Subject: Added support for xHER, xHPR, xSYR, and xSPR routines

---
 include/internal/routines/level2/xher.h | 61 +++++++++++++++++++++++++++++++++
 include/internal/routines/level2/xhpr.h | 45 ++++++++++++++++++++++++
 include/internal/routines/level2/xspr.h | 45 ++++++++++++++++++++++++
 include/internal/routines/level2/xsyr.h | 45 ++++++++++++++++++++++++
 4 files changed, 196 insertions(+)
 create mode 100644 include/internal/routines/level2/xher.h
 create mode 100644 include/internal/routines/level2/xhpr.h
 create mode 100644 include/internal/routines/level2/xspr.h
 create mode 100644 include/internal/routines/level2/xsyr.h

(limited to 'include/internal')

diff --git a/include/internal/routines/level2/xher.h b/include/internal/routines/level2/xher.h
new file mode 100644
index 00000000..6322265b
--- /dev/null
+++ b/include/internal/routines/level2/xher.h
@@ -0,0 +1,61 @@
+
+// =================================================================================================
+// This file is part of the CLBlast project. The project is licensed under Apache Version 2.0. This
+// project loosely follows the Google C++ styleguide and uses a tab-size of two spaces and a max-
+// width of 100 characters per line.
+//
+// Author(s):
+//   Cedric Nugteren
+//
+// This file implements the Xher routine. The precision is implemented using a template argument.
+// +// ================================================================================================= + +#ifndef CLBLAST_ROUTINES_XHER_H_ +#define CLBLAST_ROUTINES_XHER_H_ + +#include "internal/routine.h" + +namespace clblast { +// ================================================================================================= + +// See comment at top of file for a description of the class +template +class Xher: public Routine { + public: + + // Members and methods from the base class + using Routine::db_; + using Routine::source_string_; + using Routine::queue_; + using Routine::GetProgramFromCache; + using Routine::TestVectorX; + using Routine::TestMatrixA; + using Routine::TestMatrixAP; + using Routine::RunKernel; + using Routine::ErrorIn; + + // Constructor + Xher(Queue &queue, Event &event, const std::string &name = "HER"); + + // Translates alpha of type 'U' into type 'T' + T GetAlpha(const U alpha); + + // Templated-precision implementation of the routine + StatusCode DoHer(const Layout layout, const Triangle triangle, + const size_t n, + const U alpha, + const Buffer &x_buffer, const size_t x_offset, const size_t x_inc, + const Buffer &a_buffer, const size_t a_offset, const size_t a_ld, + const bool packed = false); + + private: + // Static variable to get the precision + const static Precision precision_; +}; + +// ================================================================================================= +} // namespace clblast + +// CLBLAST_ROUTINES_XHER_H_ +#endif diff --git a/include/internal/routines/level2/xhpr.h b/include/internal/routines/level2/xhpr.h new file mode 100644 index 00000000..a0c3cb92 --- /dev/null +++ b/include/internal/routines/level2/xhpr.h @@ -0,0 +1,45 @@ + +// ================================================================================================= +// This file is part of the CLBlast project. The project is licensed under Apache Version 2.0. 
This +// project loosely follows the Google C++ styleguide and uses a tab-size of two spaces and a max- +// width of 100 characters per line. +// +// Author(s): +// Cedric Nugteren +// +// This file implements the Xhpr routine. The precision is implemented using a template argument. +// +// ================================================================================================= + +#ifndef CLBLAST_ROUTINES_XHPR_H_ +#define CLBLAST_ROUTINES_XHPR_H_ + +#include "internal/routines/level2/xher.h" + +namespace clblast { +// ================================================================================================= + +// See comment at top of file for a description of the class +template +class Xhpr: public Xher { + public: + + // Uses the regular Xher routine + using Xher::DoHer; + + // Constructor + Xhpr(Queue &queue, Event &event, const std::string &name = "HPR"); + + // Templated-precision implementation of the routine + StatusCode DoHpr(const Layout layout, const Triangle triangle, + const size_t n, + const U alpha, + const Buffer &x_buffer, const size_t x_offset, const size_t x_inc, + const Buffer &ap_buffer, const size_t ap_offset); +}; + +// ================================================================================================= +} // namespace clblast + +// CLBLAST_ROUTINES_XHPR_H_ +#endif diff --git a/include/internal/routines/level2/xspr.h b/include/internal/routines/level2/xspr.h new file mode 100644 index 00000000..5b01d2cb --- /dev/null +++ b/include/internal/routines/level2/xspr.h @@ -0,0 +1,45 @@ + +// ================================================================================================= +// This file is part of the CLBlast project. The project is licensed under Apache Version 2.0. This +// project loosely follows the Google C++ styleguide and uses a tab-size of two spaces and a max- +// width of 100 characters per line. +// +// Author(s): +// Cedric Nugteren +// +// This file implements the Xspr routine. 
The precision is implemented using a template argument. +// +// ================================================================================================= + +#ifndef CLBLAST_ROUTINES_XSPR_H_ +#define CLBLAST_ROUTINES_XSPR_H_ + +#include "internal/routines/level2/xher.h" + +namespace clblast { +// ================================================================================================= + +// See comment at top of file for a description of the class +template +class Xspr: public Xher { + public: + + // Uses the regular Xher routine + using Xher::DoHer; + + // Constructor + Xspr(Queue &queue, Event &event, const std::string &name = "SPR"); + + // Templated-precision implementation of the routine + StatusCode DoSpr(const Layout layout, const Triangle triangle, + const size_t n, + const T alpha, + const Buffer &x_buffer, const size_t x_offset, const size_t x_inc, + const Buffer &ap_buffer, const size_t ap_offset); +}; + +// ================================================================================================= +} // namespace clblast + +// CLBLAST_ROUTINES_XSPR_H_ +#endif diff --git a/include/internal/routines/level2/xsyr.h b/include/internal/routines/level2/xsyr.h new file mode 100644 index 00000000..9704a881 --- /dev/null +++ b/include/internal/routines/level2/xsyr.h @@ -0,0 +1,45 @@ + +// ================================================================================================= +// This file is part of the CLBlast project. The project is licensed under Apache Version 2.0. This +// project loosely follows the Google C++ styleguide and uses a tab-size of two spaces and a max- +// width of 100 characters per line. +// +// Author(s): +// Cedric Nugteren +// +// This file implements the Xsyr routine. The precision is implemented using a template argument. 
+// +// ================================================================================================= + +#ifndef CLBLAST_ROUTINES_XSYR_H_ +#define CLBLAST_ROUTINES_XSYR_H_ + +#include "internal/routines/level2/xher.h" + +namespace clblast { +// ================================================================================================= + +// See comment at top of file for a description of the class +template +class Xsyr: public Xher { + public: + + // Uses the regular Xher routine + using Xher::DoHer; + + // Constructor + Xsyr(Queue &queue, Event &event, const std::string &name = "SYR"); + + // Templated-precision implementation of the routine + StatusCode DoSyr(const Layout layout, const Triangle triangle, + const size_t n, + const T alpha, + const Buffer &x_buffer, const size_t x_offset, const size_t x_inc, + const Buffer &a_buffer, const size_t a_offset, const size_t a_ld); +}; + +// ================================================================================================= +} // namespace clblast + +// CLBLAST_ROUTINES_XSYR_H_ +#endif -- cgit v1.2.3