summary | refs | log | tree | commit | diff
path: root/src/kernels/level3/xgemm_part1.opencl
diff options
context:
space:
mode:
author Tyler Sorensen <tylersorensen3221@hotmail.com> 2018-07-16 20:12:30 -0400
committer Tyler Sorensen <tylersorensen3221@hotmail.com> 2018-07-16 20:12:30 -0400
commit 0772d63498c8eeddc380902ba6010a1a861763cc (patch)
tree 3466f0a85d300853191744bf0fa7f12a78faaec1 /src/kernels/level3/xgemm_part1.opencl
parent f4e5b1c14ce9b0ac3b769908912fb3422a0ea8e2 (diff)
moved a two-line macro to a single line
Diffstat (limited to 'src/kernels/level3/xgemm_part1.opencl')
-rw-r--r-- src/kernels/level3/xgemm_part1.opencl 3
1 file changed, 1 insertion, 2 deletions
diff --git a/src/kernels/level3/xgemm_part1.opencl b/src/kernels/level3/xgemm_part1.opencl
index 32386312..3cfc5dfb 100644
--- a/src/kernels/level3/xgemm_part1.opencl
+++ b/src/kernels/level3/xgemm_part1.opencl
@@ -133,8 +133,7 @@ R"(
#endif
// NVIDIA warps as subgroups using inline PTX (https://docs.nvidia.com/cuda/inline-ptx-assembly/index.html)
-#if USE_SUBGROUP_SHUFFLING == 1 && (SUBGROUP_SHUFFLING_NVIDIA_PRE_VOLTA || \
- SUBGROUP_SHUFFLING_NVIDIA_POST_VOLTA)
+#if USE_SUBGROUP_SHUFFLING == 1 && (SUBGROUP_SHUFFLING_NVIDIA_PRE_VOLTA || SUBGROUP_SHUFFLING_NVIDIA_POST_VOLTA)
#define SUBGROUP_SIZE 32 // Assumes subgroup size is always 32 on NVIDIA GPUs
#endif