summaryrefslogtreecommitdiff
path: root/include
diff options
context:
space:
mode:
authorcnugteren <web@cedricnugteren.nl>2016-04-20 22:12:51 -0600
committercnugteren <web@cedricnugteren.nl>2016-04-20 22:12:51 -0600
commit16a048f1ac8102ad4bcce9cf9fc320f791323e45 (patch)
treebd7df539c92b92cb8841ff27fd83c4e14e5958bc /include
parent894983fc3c7c57ffc48c21523641694cde318eca (diff)
Added support for the iSAMAX/iDAMAX/iCAMAX/iZAMAX routines
Diffstat (limited to 'include')
-rw-r--r--include/internal/routines/level1/xamax.h56
-rw-r--r--include/internal/utilities.h2
2 files changed, 58 insertions, 0 deletions
diff --git a/include/internal/routines/level1/xamax.h b/include/internal/routines/level1/xamax.h
new file mode 100644
index 00000000..b815e8d2
--- /dev/null
+++ b/include/internal/routines/level1/xamax.h
@@ -0,0 +1,56 @@
+
+// =================================================================================================
+// This file is part of the CLBlast project. The project is licensed under Apache Version 2.0. This
+// project loosely follows the Google C++ styleguide and uses a tab-size of two spaces and a max-
+// width of 100 characters per line.
+//
+// Author(s):
+// Cedric Nugteren <www.cedricnugteren.nl>
+//
+// This file declares the Xamax routine class. The precision is set through a template argument.
+//
+// =================================================================================================
+
+#ifndef CLBLAST_ROUTINES_XAMAX_H_
+#define CLBLAST_ROUTINES_XAMAX_H_
+
+#include "internal/routine.h"
+
+namespace clblast {
+// =================================================================================================
+
+// Routine class for the iSAMAX/iDAMAX/iCAMAX/iZAMAX BLAS routines; T selects the precision
+template <typename T>
+class Xamax: public Routine<T> {
+ public:
+
+ // Names from the dependent base class Routine<T>; unqualified use needs these using-declarations
+ using Routine<T>::db_;
+ using Routine<T>::source_string_;
+ using Routine<T>::queue_;
+ using Routine<T>::event_;
+ using Routine<T>::context_;
+ using Routine<T>::GetProgramFromCache;
+ using Routine<T>::TestVectorX;
+ using Routine<T>::TestVectorDot;
+ using Routine<T>::RunKernel;
+ using Routine<T>::ErrorIn;
+
+ // Constructor: takes a queue, an event pointer and a name (which defaults to "AMAX")
+ Xamax(Queue &queue, EventPointer event, const std::string &name = "AMAX");
+
+ // Templated-precision implementation. NOTE(review): imax_buffer is Buffer<T>, not an index type?
+ StatusCode DoAmax(const size_t n,
+ const Buffer<T> &imax_buffer, const size_t imax_offset,
+ const Buffer<T> &x_buffer, const size_t x_offset, const size_t x_inc);
+
+ private:
+ // Static constant used to get the precision; only declared here, no definition in this header
+ const static Precision precision_;
+};
+
+// =================================================================================================
+} // namespace clblast
+
+// CLBLAST_ROUTINES_XAMAX_H_
+#endif
diff --git a/include/internal/utilities.h b/include/internal/utilities.h
index 8ffdc3af..75b3d27d 100644
--- a/include/internal/utilities.h
+++ b/include/internal/utilities.h
@@ -66,6 +66,7 @@ constexpr auto kArgAPOffset = "offap";
constexpr auto kArgDotOffset = "offdot";
constexpr auto kArgNrm2Offset = "offnrm2";
constexpr auto kArgAsumOffset = "offasum";
+constexpr auto kArgImaxOffset = "offimax";
constexpr auto kArgAlpha = "alpha";
constexpr auto kArgBeta = "beta";
@@ -121,6 +122,7 @@ struct Arguments {
size_t dot_offset = 0;
size_t nrm2_offset = 0;
size_t asum_offset = 0;
+ size_t imax_offset = 0;
T alpha = T{1.0};
T beta = T{1.0};
size_t x_size = 1;