summary | refs | log | tree | commit | diff
path: root/src/kernels
diff options
context:
space:
mode:
author Cedric Nugteren <web@cedricnugteren.nl> 2017-12-30 21:17:31 +0100
committer Cedric Nugteren <web@cedricnugteren.nl> 2017-12-30 21:17:31 +0100
commit 7ce415b9276e1d99f145741487f36a9034e5e035 (patch)
tree bd41be7ad7eb868ae459b9644fbe751fccb28974 /src/kernels
parent 407ed52cec41445f02e85cb45d08f590960216bb (diff)
Fixed ifdef's into ifndef's
Diffstat (limited to 'src/kernels')
-rw-r--r-- src/kernels/level3/invert_diagonal_blocks_part1.opencl 14
-rw-r--r-- src/kernels/level3/invert_diagonal_blocks_part2.opencl 4
2 files changed, 9 insertions, 9 deletions
diff --git a/src/kernels/level3/invert_diagonal_blocks_part1.opencl b/src/kernels/level3/invert_diagonal_blocks_part1.opencl
index 8c210c9e..8da019e9 100644
--- a/src/kernels/level3/invert_diagonal_blocks_part1.opencl
+++ b/src/kernels/level3/invert_diagonal_blocks_part1.opencl
@@ -112,7 +112,7 @@ void InvertDiagonalBlock(int n, __global const real* restrict src, const int src
// Local memory to store the inverted block of INTERNAL_BLOCK_SIZE by INTERNAL_BLOCK_SIZE
__local real lm[INTERNAL_BLOCK_SIZE][INTERNAL_BLOCK_SIZE];
-#ifdef DISABLE_PART1
+#ifndef DISABLE_PART1
// Loads the source lower triangle into local memory. Any values in the upper triangle or
// outside of the matrix are set to zero
#pragma unroll
@@ -133,7 +133,7 @@ void InvertDiagonalBlock(int n, __global const real* restrict src, const int src
}
barrier(CLK_LOCAL_MEM_FENCE);
#endif
-#ifdef DISABLE_PART2
+#ifndef DISABLE_PART2
// Inverts the diagonal
real inverted_diagonal;
SetToOne(inverted_diagonal);
@@ -148,7 +148,7 @@ void InvertDiagonalBlock(int n, __global const real* restrict src, const int src
lm[thread_index][thread_index] = inverted_diagonal;
barrier(CLK_LOCAL_MEM_FENCE);
#endif
-#ifdef DISABLE_PART3
+#ifndef DISABLE_PART3
// Upper-triangular
if (is_upper) {
@@ -231,7 +231,7 @@ INLINE_FUNC void TripleMatMul(const int size, const bool upper, const int part,
for (int _j = 0; _j < 16; _j += 1) {
SetToZero(cpm[_j]);
}
-#ifdef DISABLE_PART4
+#ifndef DISABLE_PART4
// Computes NT x 16 block of C, each thread computes one 1 x 16 row
for (int k = 0; k < current_size; k += 16) {
@@ -277,7 +277,7 @@ INLINE_FUNC void TripleMatMul(const int size, const bool upper, const int part,
barrier(CLK_LOCAL_MEM_FENCE);
}
#endif
-#ifdef DISABLE_PART5
+#ifndef DISABLE_PART5
// Stores NT x 16 results: each thread writes one 16 x 1 row
#pragma unroll
for (int _i = 0; _i < 16; _i += 1) {
@@ -295,7 +295,7 @@ INLINE_FUNC void TripleMatMulPart1(const int size, const bool upper, LOCAL_PTR r
__global const real* src, const int a_offset, const int lda,
__global real* dest, int current_size, int num_pages, const int block_size) {
-#ifdef DISABLE_PART6
+#ifndef DISABLE_PART6
// Emulates a 3D grid: NX * (NY * num_pages)
const int page = get_group_id(1) % num_pages;
@@ -332,7 +332,7 @@ INLINE_FUNC void TripleMatMulPart1(const int size, const bool upper, LOCAL_PTR r
INLINE_FUNC void TripleMatMulPart2(const int size, const bool upper, LOCAL_PTR real* blm, const int n,
__global real* dest, int current_size, int num_pages, const int block_size) {
-#ifdef DISABLE_PART7
+#ifndef DISABLE_PART7
// Emulates a 3D grid: NX * (NY * num_pages)
const int page = get_group_id(1) % num_pages;
diff --git a/src/kernels/level3/invert_diagonal_blocks_part2.opencl b/src/kernels/level3/invert_diagonal_blocks_part2.opencl
index 37210f77..22d8e5d7 100644
--- a/src/kernels/level3/invert_diagonal_blocks_part2.opencl
+++ b/src/kernels/level3/invert_diagonal_blocks_part2.opencl
@@ -18,7 +18,7 @@ R"(
// =================================================================================================
#if defined(ROUTINE_INVERT)
-#ifdef DISABLE_PART8
+#ifndef DISABLE_PART8
// B21 = A21 * B11
__kernel __attribute__((reqd_work_group_size(1 * TMMWGSX, TMMWGSY, 1)))
void TripleMatMul16Part1Lower(int n, __global const real* restrict src, const int a_offset, const int lda,
@@ -72,7 +72,7 @@ void TripleMatMul64Part2Lower(int n, __global real* restrict dest, int current_s
#endif
// =================================================================================================
-#ifdef DISABLE_PART9
+#ifndef DISABLE_PART9
// B12 = A12 * B22
__kernel __attribute__((reqd_work_group_size(1 * TMMWGSX, TMMWGSY, 1)))
void TripleMatMul16Part1Upper(int n, __global const real* restrict src, const int a_offset, const int lda,