From 306bf67660da4f1adacaedf9066925240abf4ea9 Mon Sep 17 00:00:00 2001
From: Cedric Nugteren
Date: Sun, 6 Mar 2016 15:48:11 +0100
Subject: Added preliminary support for xHPR2 and xSPR2 routines

---
 include/internal/routines/level2/xhpr2.h | 46 ++++++++++++++++++++++++++++++++
 include/internal/routines/level2/xspr2.h | 46 ++++++++++++++++++++++++++++++++
 2 files changed, 92 insertions(+)
 create mode 100644 include/internal/routines/level2/xhpr2.h
 create mode 100644 include/internal/routines/level2/xspr2.h

(limited to 'include')

diff --git a/include/internal/routines/level2/xhpr2.h b/include/internal/routines/level2/xhpr2.h
new file mode 100644
index 00000000..fd243d33
--- /dev/null
+++ b/include/internal/routines/level2/xhpr2.h
@@ -0,0 +1,46 @@
+
+// =================================================================================================
+// This file is part of the CLBlast project. The project is licensed under Apache Version 2.0. This
+// project loosely follows the Google C++ styleguide and uses a tab-size of two spaces and a max-
+// width of 100 characters per line.
+//
+// Author(s):
+//   Cedric Nugteren
+//
+// This file implements the Xhpr2 routine. The precision is implemented using a template argument.
+//
+// =================================================================================================
+
+#ifndef CLBLAST_ROUTINES_XHPR2_H_
+#define CLBLAST_ROUTINES_XHPR2_H_
+
+#include "internal/routines/level2/xher2.h"
+
+namespace clblast {
+// =================================================================================================
+
+// Xhpr2 routine class, derived from Xher2<T>; the precision is the template argument T
+template <typename T>
+class Xhpr2: public Xher2<T> {
+ public:
+
+  // Uses the regular Xher2 routine: exposes the base-class Xher2<T>::DoHer2 in this class
+  using Xher2<T>::DoHer2;
+
+  // Constructor: takes a queue and an event by reference; 'name' defaults to "HPR2"
+  Xhpr2(Queue &queue, Event &event, const std::string &name = "HPR2");
+
+  // Templated-precision implementation: x and y have an offset and increment, ap only an offset
+  StatusCode DoHpr2(const Layout layout, const Triangle triangle,
+                    const size_t n,
+                    const T alpha,
+                    const Buffer<T> &x_buffer, const size_t x_offset, const size_t x_inc,
+                    const Buffer<T> &y_buffer, const size_t y_offset, const size_t y_inc,
+                    const Buffer<T> &ap_buffer, const size_t ap_offset);
+};
+
+// =================================================================================================
+} // namespace clblast
+
+// CLBLAST_ROUTINES_XHPR2_H_
+#endif
diff --git a/include/internal/routines/level2/xspr2.h b/include/internal/routines/level2/xspr2.h
new file mode 100644
index 00000000..3d5f4992
--- /dev/null
+++ b/include/internal/routines/level2/xspr2.h
@@ -0,0 +1,46 @@
+
+// =================================================================================================
+// This file is part of the CLBlast project. The project is licensed under Apache Version 2.0. This
+// project loosely follows the Google C++ styleguide and uses a tab-size of two spaces and a max-
+// width of 100 characters per line.
+//
+// Author(s):
+//   Cedric Nugteren
+//
+// This file implements the Xspr2 routine. The precision is implemented using a template argument.
+//
+// =================================================================================================
+
+#ifndef CLBLAST_ROUTINES_XSPR2_H_
+#define CLBLAST_ROUTINES_XSPR2_H_
+
+#include "internal/routines/level2/xher2.h"
+
+namespace clblast {
+// =================================================================================================
+
+// Xspr2 routine class, derived from Xher2<T>; the precision is the template argument T
+template <typename T>
+class Xspr2: public Xher2<T> {
+ public:
+
+  // Uses the regular Xher2 routine: exposes the base-class Xher2<T>::DoHer2 in this class
+  using Xher2<T>::DoHer2;
+
+  // Constructor: takes a queue and an event by reference; 'name' defaults to "SPR2"
+  Xspr2(Queue &queue, Event &event, const std::string &name = "SPR2");
+
+  // Templated-precision implementation: x and y have an offset and increment, ap only an offset
+  StatusCode DoSpr2(const Layout layout, const Triangle triangle,
+                    const size_t n,
+                    const T alpha,
+                    const Buffer<T> &x_buffer, const size_t x_offset, const size_t x_inc,
+                    const Buffer<T> &y_buffer, const size_t y_offset, const size_t y_inc,
+                    const Buffer<T> &ap_buffer, const size_t ap_offset);
+};
+
+// =================================================================================================
+} // namespace clblast
+
+// CLBLAST_ROUTINES_XSPR2_H_
+#endif
-- 
cgit v1.2.3