diff options
author | cnugteren <web@cedricnugteren.nl> | 2016-04-20 22:12:51 -0600 |
---|---|---|
committer | cnugteren <web@cedricnugteren.nl> | 2016-04-20 22:12:51 -0600 |
commit | 16a048f1ac8102ad4bcce9cf9fc320f791323e45 (patch) | |
tree | bd7df539c92b92cb8841ff27fd83c4e14e5958bc /include/internal | |
parent | 894983fc3c7c57ffc48c21523641694cde318eca (diff) |
Added support for the iSAMAX/iDAMAX/iCAMAX/iZAMAX routines
Diffstat (limited to 'include/internal')
-rw-r--r-- | include/internal/routines/level1/xamax.h | 56 | ||||
-rw-r--r-- | include/internal/utilities.h | 2 |
2 files changed, 58 insertions, 0 deletions
diff --git a/include/internal/routines/level1/xamax.h b/include/internal/routines/level1/xamax.h
new file mode 100644
index 00000000..b815e8d2
--- /dev/null
+++ b/include/internal/routines/level1/xamax.h
@@ -0,0 +1,56 @@
+
+// =================================================================================================
+// This file is part of the CLBlast project. The project is licensed under Apache Version 2.0. This
+// project loosely follows the Google C++ styleguide and uses a tab-size of two spaces and a max-
+// width of 100 characters per line.
+//
+// Author(s):
+//   Cedric Nugteren <www.cedricnugteren.nl>
+//
+// This file implements the Xamax routine. The precision is implemented using a template argument.
+//
+// =================================================================================================
+
+#ifndef CLBLAST_ROUTINES_XAMAX_H_
+#define CLBLAST_ROUTINES_XAMAX_H_
+
+#include "internal/routine.h"
+
+namespace clblast {
+// =================================================================================================
+
+// See comment at top of file for a description of the class
+template <typename T>
+class Xamax: public Routine<T> {
+ public:
+
+  // Members and methods from the base class
+  using Routine<T>::db_;
+  using Routine<T>::source_string_;
+  using Routine<T>::queue_;
+  using Routine<T>::event_;
+  using Routine<T>::context_;
+  using Routine<T>::GetProgramFromCache;
+  using Routine<T>::TestVectorX;
+  using Routine<T>::TestVectorDot;
+  using Routine<T>::RunKernel;
+  using Routine<T>::ErrorIn;
+
+  // Constructor
+  Xamax(Queue &queue, EventPointer event, const std::string &name = "AMAX");
+
+  // Templated-precision implementation of the routine
+  StatusCode DoAmax(const size_t n,
+                    const Buffer<T> &imax_buffer, const size_t imax_offset,
+                    const Buffer<T> &x_buffer, const size_t x_offset, const size_t x_inc);
+
+ private:
+  // Static variable to get the precision
+  const static Precision precision_;
+};
+
+// =================================================================================================
+} // namespace clblast
+
+// CLBLAST_ROUTINES_XAMAX_H_
+#endif
diff --git a/include/internal/utilities.h b/include/internal/utilities.h
index 8ffdc3af..75b3d27d 100644
--- a/include/internal/utilities.h
+++ b/include/internal/utilities.h
@@ -66,6 +66,7 @@ constexpr auto kArgAPOffset = "offap";
 constexpr auto kArgDotOffset = "offdot";
 constexpr auto kArgNrm2Offset = "offnrm2";
 constexpr auto kArgAsumOffset = "offasum";
+constexpr auto kArgImaxOffset = "offimax";
 constexpr auto kArgAlpha = "alpha";
 constexpr auto kArgBeta = "beta";
 
@@ -121,6 +122,7 @@ struct Arguments {
   size_t dot_offset = 0;
   size_t nrm2_offset = 0;
   size_t asum_offset = 0;
+  size_t imax_offset = 0;
   T alpha = T{1.0};
   T beta = T{1.0};
   size_t x_size = 1;