diff options
author | Cedric Nugteren <web@cedricnugteren.nl> | 2017-12-30 21:17:31 +0100 |
---|---|---|
committer | Cedric Nugteren <web@cedricnugteren.nl> | 2017-12-30 21:17:31 +0100 |
commit | 7ce415b9276e1d99f145741487f36a9034e5e035 (patch) | |
tree | bd41be7ad7eb868ae459b9644fbe751fccb28974 /src/kernels | |
parent | 407ed52cec41445f02e85cb45d08f590960216bb (diff) |
Fixed ifdef's into ifndef's
Diffstat (limited to 'src/kernels')
-rw-r--r-- | src/kernels/level3/invert_diagonal_blocks_part1.opencl | 14 | ||||
-rw-r--r-- | src/kernels/level3/invert_diagonal_blocks_part2.opencl | 4 |
2 files changed, 9 insertions, 9 deletions
diff --git a/src/kernels/level3/invert_diagonal_blocks_part1.opencl b/src/kernels/level3/invert_diagonal_blocks_part1.opencl index 8c210c9e..8da019e9 100644 --- a/src/kernels/level3/invert_diagonal_blocks_part1.opencl +++ b/src/kernels/level3/invert_diagonal_blocks_part1.opencl @@ -112,7 +112,7 @@ void InvertDiagonalBlock(int n, __global const real* restrict src, const int src // Local memory to store the inverted block of INTERNAL_BLOCK_SIZE by INTERNAL_BLOCK_SIZE __local real lm[INTERNAL_BLOCK_SIZE][INTERNAL_BLOCK_SIZE]; -#ifdef DISABLE_PART1 +#ifndef DISABLE_PART1 // Loads the source lower triangle into local memory. Any values in the upper triangle or // outside of the matrix are set to zero #pragma unroll @@ -133,7 +133,7 @@ void InvertDiagonalBlock(int n, __global const real* restrict src, const int src } barrier(CLK_LOCAL_MEM_FENCE); #endif -#ifdef DISABLE_PART2 +#ifndef DISABLE_PART2 // Inverts the diagonal real inverted_diagonal; SetToOne(inverted_diagonal); @@ -148,7 +148,7 @@ void InvertDiagonalBlock(int n, __global const real* restrict src, const int src lm[thread_index][thread_index] = inverted_diagonal; barrier(CLK_LOCAL_MEM_FENCE); #endif -#ifdef DISABLE_PART3 +#ifndef DISABLE_PART3 // Upper-triangular if (is_upper) { @@ -231,7 +231,7 @@ INLINE_FUNC void TripleMatMul(const int size, const bool upper, const int part, for (int _j = 0; _j < 16; _j += 1) { SetToZero(cpm[_j]); } -#ifdef DISABLE_PART4 +#ifndef DISABLE_PART4 // Computes NT x 16 block of C, each thread computes one 1 x 16 row for (int k = 0; k < current_size; k += 16) { @@ -277,7 +277,7 @@ INLINE_FUNC void TripleMatMul(const int size, const bool upper, const int part, barrier(CLK_LOCAL_MEM_FENCE); } #endif -#ifdef DISABLE_PART5 +#ifndef DISABLE_PART5 // Stores NT x 16 results: each thread writes one 16 x 1 row #pragma unroll for (int _i = 0; _i < 16; _i += 1) { @@ -295,7 +295,7 @@ INLINE_FUNC void TripleMatMulPart1(const int size, const bool upper, LOCAL_PTR r __global const real* src, const int a_offset, const int lda, __global real* dest, int current_size, int num_pages, const int block_size) { -#ifdef DISABLE_PART6 +#ifndef DISABLE_PART6 // Emulates a 3D grid: NX * (NY * num_pages) const int page = get_group_id(1) % num_pages; @@ -332,7 +332,7 @@ INLINE_FUNC void TripleMatMulPart1(const int size, const bool upper, LOCAL_PTR r INLINE_FUNC void TripleMatMulPart2(const int size, const bool upper, LOCAL_PTR real* blm, const int n, __global real* dest, int current_size, int num_pages, const int block_size) { -#ifdef DISABLE_PART7 +#ifndef DISABLE_PART7 // Emulates a 3D grid: NX * (NY * num_pages) const int page = get_group_id(1) % num_pages; diff --git a/src/kernels/level3/invert_diagonal_blocks_part2.opencl b/src/kernels/level3/invert_diagonal_blocks_part2.opencl index 37210f77..22d8e5d7 100644 --- a/src/kernels/level3/invert_diagonal_blocks_part2.opencl +++ b/src/kernels/level3/invert_diagonal_blocks_part2.opencl @@ -18,7 +18,7 @@ R"( // ================================================================================================= #if defined(ROUTINE_INVERT) -#ifdef DISABLE_PART8 +#ifndef DISABLE_PART8 // B21 = A21 * B11 __kernel __attribute__((reqd_work_group_size(1 * TMMWGSX, TMMWGSY, 1))) void TripleMatMul16Part1Lower(int n, __global const real* restrict src, const int a_offset, const int lda, @@ -72,7 +72,7 @@ void TripleMatMul64Part2Lower(int n, __global real* restrict dest, int current_s #endif // ================================================================================================= -#ifdef DISABLE_PART9 +#ifndef DISABLE_PART9 // B12 = A12 * B22 __kernel __attribute__((reqd_work_group_size(1 * TMMWGSX, TMMWGSY, 1))) void TripleMatMul16Part1Upper(int n, __global const real* restrict src, const int a_offset, const int lda, |