summaryrefslogtreecommitdiff
path: root/test/correctness/testblas.cc
diff options
context:
space:
mode:
authorCNugteren <web@cedricnugteren.nl>2015-06-28 15:52:57 +0200
committerCNugteren <web@cedricnugteren.nl>2015-06-28 15:52:57 +0200
commite5c0edbfd7dcfe96af6cca6c25ca8b346871b014 (patch)
tree3b2cd30c04434a914de9faa5af7ee40609c75656 /test/correctness/testblas.cc
parentcf1892d22ca9647dc8bb1025253e65152fef2466 (diff)
Re-organized the test infrastructure to avoid code duplication
Diffstat (limited to 'test/correctness/testblas.cc')
-rw-r--r--test/correctness/testblas.cc185
1 files changed, 185 insertions, 0 deletions
diff --git a/test/correctness/testblas.cc b/test/correctness/testblas.cc
new file mode 100644
index 00000000..019d93ee
--- /dev/null
+++ b/test/correctness/testblas.cc
@@ -0,0 +1,185 @@
+
+// =================================================================================================
+// This file is part of the CLBlast project. The project is licensed under the MIT license. This
+// project loosely follows the Google C++ styleguide and uses a tab-size of two spaces and a max-
+// width of 100 characters per line.
+//
+// Author(s):
+// Cedric Nugteren <www.cedricnugteren.nl>
+//
+// This file implements the TestBlas class (see the header for information about the class).
+//
+// =================================================================================================
+
+#include <algorithm>
+
+#include "correctness/testblas.h"
+
+namespace clblast {
+// =================================================================================================
+
+// The transpose-options to test with (data-type dependent)
+template <> const std::vector<Transpose> TestBlas<float>::kTransposes = {Transpose::kNo, Transpose::kYes};
+template <> const std::vector<Transpose> TestBlas<double>::kTransposes = {Transpose::kNo, Transpose::kYes};
+template <> const std::vector<Transpose> TestBlas<float2>::kTransposes = {Transpose::kNo, Transpose::kYes, Transpose::kConjugate};
+template <> const std::vector<Transpose> TestBlas<double2>::kTransposes = {Transpose::kNo, Transpose::kYes, Transpose::kConjugate};
+
+// =================================================================================================
+
+// Constructor, initializes the base class tester and input data
+template <typename T>
+TestBlas<T>::TestBlas(int argc, char *argv[], const bool silent,
+ const std::string &name, const std::vector<std::string> &options,
+ const Routine run_routine, const Routine run_reference,
+ const ResultGet get_result, const ResultIndex get_index,
+ const ResultIterator get_id1, const ResultIterator get_id2):
+ Tester<T>{argc, argv, silent, name, options},
+ run_routine_(run_routine),
+ run_reference_(run_reference),
+ get_result_(get_result),
+ get_index_(get_index),
+ get_id1_(get_id1),
+ get_id2_(get_id2) {
+
+ // Computes the maximum sizes. This allows for a single set of input/output buffers.
+ auto max_vec = *std::max_element(kVectorDims.begin(), kVectorDims.end());
+ auto max_inc = *std::max_element(kIncrements.begin(), kIncrements.end());
+ auto max_mat = *std::max_element(kMatrixDims.begin(), kMatrixDims.end());
+ auto max_ld = *std::max_element(kMatrixDims.begin(), kMatrixDims.end());
+ auto max_matvec = *std::max_element(kMatrixVectorDims.begin(), kMatrixVectorDims.end());
+ auto max_offset = *std::max_element(kOffsets.begin(), kOffsets.end());
+
+ // Creates test input data
+ x_source_.resize(std::max(max_vec, max_matvec)*max_inc + max_offset);
+ y_source_.resize(std::max(max_vec, max_matvec)*max_inc + max_offset);
+ a_source_.resize(std::max(max_mat, max_matvec)*std::max(max_ld, max_matvec) + max_offset);
+ b_source_.resize(std::max(max_mat, max_matvec)*std::max(max_ld, max_matvec) + max_offset);
+ c_source_.resize(std::max(max_mat, max_matvec)*std::max(max_ld, max_matvec) + max_offset);
+ PopulateVector(x_source_);
+ PopulateVector(y_source_);
+ PopulateVector(a_source_);
+ PopulateVector(b_source_);
+ PopulateVector(c_source_);
+}
+
+// ===============================================================================================
+
+// Tests the routine for a wide variety of parameters
+template <typename T>
+void TestBlas<T>::TestRegular(std::vector<Arguments<T>> &test_vector, const std::string &name) {
+ if (!PrecisionSupported()) { return; }
+ TestStart("regular behaviour", name);
+
+ // Iterates over all the to-be-tested combinations of arguments
+ for (auto &args: test_vector) {
+
+ // Runs the reference clBLAS code
+ auto x_vec1 = Buffer(context_, CL_MEM_READ_WRITE, args.x_size*sizeof(T));
+ auto y_vec1 = Buffer(context_, CL_MEM_READ_WRITE, args.y_size*sizeof(T));
+ auto a_mat1 = Buffer(context_, CL_MEM_READ_WRITE, args.a_size*sizeof(T));
+ auto b_mat1 = Buffer(context_, CL_MEM_READ_WRITE, args.b_size*sizeof(T));
+ auto c_mat1 = Buffer(context_, CL_MEM_READ_WRITE, args.c_size*sizeof(T));
+ x_vec1.WriteBuffer(queue_, args.x_size*sizeof(T), x_source_);
+ y_vec1.WriteBuffer(queue_, args.y_size*sizeof(T), y_source_);
+ a_mat1.WriteBuffer(queue_, args.a_size*sizeof(T), a_source_);
+ b_mat1.WriteBuffer(queue_, args.b_size*sizeof(T), b_source_);
+ c_mat1.WriteBuffer(queue_, args.c_size*sizeof(T), c_source_);
+ auto buffers1 = Buffers{x_vec1, y_vec1, a_mat1, b_mat1, c_mat1};
+ auto status1 = run_reference_(args, buffers1, queue_);
+
+ // Runs the CLBlast code
+ auto x_vec2 = Buffer(context_, CL_MEM_READ_WRITE, args.x_size*sizeof(T));
+ auto y_vec2 = Buffer(context_, CL_MEM_READ_WRITE, args.y_size*sizeof(T));
+ auto a_mat2 = Buffer(context_, CL_MEM_READ_WRITE, args.a_size*sizeof(T));
+ auto b_mat2 = Buffer(context_, CL_MEM_READ_WRITE, args.b_size*sizeof(T));
+ auto c_mat2 = Buffer(context_, CL_MEM_READ_WRITE, args.c_size*sizeof(T));
+ x_vec2.WriteBuffer(queue_, args.x_size*sizeof(T), x_source_);
+ y_vec2.WriteBuffer(queue_, args.y_size*sizeof(T), y_source_);
+ a_mat2.WriteBuffer(queue_, args.a_size*sizeof(T), a_source_);
+ b_mat2.WriteBuffer(queue_, args.b_size*sizeof(T), b_source_);
+ c_mat2.WriteBuffer(queue_, args.c_size*sizeof(T), c_source_);
+ auto buffers2 = Buffers{x_vec2, y_vec2, a_mat2, b_mat2, c_mat2};
+ auto status2 = run_routine_(args, buffers2, queue_);
+
+ // Tests for equality of the two status codes
+ if (status1 != StatusCode::kSuccess || status2 != StatusCode::kSuccess) {
+ TestErrorCodes(status1, status2, args);
+ continue;
+ }
+
+ // Downloads the results
+ auto result1 = get_result_(args, buffers1, queue_);
+ auto result2 = get_result_(args, buffers2, queue_);
+
+ // Checks for differences in the output
+ auto errors = size_t{0};
+ for (auto id1=size_t{0}; id1<get_id1_(args); ++id1) {
+ for (auto id2=size_t{0}; id2<get_id2_(args); ++id2) {
+ auto index = get_index_(args, id1, id2);
+ if (!TestSimilarity(result1[index], result2[index])) {
+ errors++;
+ }
+ }
+ }
+
+ // Tests the error count (should be zero)
+ TestErrorCount(errors, get_id1_(args)*get_id2_(args), args);
+ }
+ TestEnd();
+}
+
+// =================================================================================================
+
+// Tests the routine for cases with invalid OpenCL memory buffer sizes. Tests only on return-types,
+// does not test for results (if any).
+template <typename T>
+void TestBlas<T>::TestInvalid(std::vector<Arguments<T>> &test_vector, const std::string &name) {
+ if (!PrecisionSupported()) { return; }
+ TestStart("invalid buffer sizes", name);
+
+ // Iterates over all the to-be-tested combinations of arguments
+ for (auto &args: test_vector) {
+
+ // Creates the OpenCL buffers. Note: we are not using the C++ version since we explicitly
+ // want to be able to create invalid buffers (no error checking here).
+ auto x1 = clCreateBuffer(context_(), CL_MEM_READ_WRITE, args.x_size*sizeof(T), nullptr,nullptr);
+ auto y1 = clCreateBuffer(context_(), CL_MEM_READ_WRITE, args.y_size*sizeof(T), nullptr,nullptr);
+ auto a1 = clCreateBuffer(context_(), CL_MEM_READ_WRITE, args.a_size*sizeof(T), nullptr,nullptr);
+ auto b1 = clCreateBuffer(context_(), CL_MEM_READ_WRITE, args.b_size*sizeof(T), nullptr,nullptr);
+ auto c1 = clCreateBuffer(context_(), CL_MEM_READ_WRITE, args.c_size*sizeof(T), nullptr,nullptr);
+ auto x_vec1 = Buffer(x1);
+ auto y_vec1 = Buffer(y1);
+ auto a_mat1 = Buffer(a1);
+ auto b_mat1 = Buffer(b1);
+ auto c_mat1 = Buffer(c1);
+ auto x2 = clCreateBuffer(context_(), CL_MEM_READ_WRITE, args.x_size*sizeof(T), nullptr,nullptr);
+ auto y2 = clCreateBuffer(context_(), CL_MEM_READ_WRITE, args.y_size*sizeof(T), nullptr,nullptr);
+ auto a2 = clCreateBuffer(context_(), CL_MEM_READ_WRITE, args.a_size*sizeof(T), nullptr,nullptr);
+ auto b2 = clCreateBuffer(context_(), CL_MEM_READ_WRITE, args.b_size*sizeof(T), nullptr,nullptr);
+ auto c2 = clCreateBuffer(context_(), CL_MEM_READ_WRITE, args.c_size*sizeof(T), nullptr,nullptr);
+ auto x_vec2 = Buffer(x2);
+ auto y_vec2 = Buffer(y2);
+ auto a_mat2 = Buffer(a2);
+ auto b_mat2 = Buffer(b2);
+ auto c_mat2 = Buffer(c2);
+
+ // Runs the two routines
+ auto status1 = run_reference_(args, Buffers{x_vec1, y_vec1, a_mat1, b_mat1, c_mat1}, queue_);
+ auto status2 = run_routine_(args, Buffers{x_vec2, y_vec2, a_mat2, b_mat2, c_mat2}, queue_);
+
+ // Tests for equality of the two status codes
+ TestErrorCodes(status1, status2, args);
+ }
+ TestEnd();
+}
+
+// =================================================================================================
+
+// Compiles the templated class
+template class TestBlas<float>;
+template class TestBlas<double>;
+template class TestBlas<float2>;
+template class TestBlas<double2>;
+
+// =================================================================================================
+} // namespace clblast