diff options
author | Cedric Nugteren <web@cedricnugteren.nl> | 2017-01-18 21:29:59 +0100 |
---|---|---|
committer | Cedric Nugteren <web@cedricnugteren.nl> | 2017-01-18 21:29:59 +0100 |
commit | df9a77d74d87fb8832264e9e9a37336001873151 (patch) | |
tree | 516e113140164daa0d918803dee64b94b685afb6 /src/kernels/level3/level3.opencl | |
parent | 4b3ffd998904f5c848edc5917308f5942fa71da3 (diff) |
Added first version of the TRSM routine based on the diagonal invert kernel
Diffstat (limited to 'src/kernels/level3/level3.opencl')
-rw-r--r-- | src/kernels/level3/level3.opencl | 16 |
1 files changed, 16 insertions, 0 deletions
diff --git a/src/kernels/level3/level3.opencl b/src/kernels/level3/level3.opencl index bf14ab12..0f5a8607 100644 --- a/src/kernels/level3/level3.opencl +++ b/src/kernels/level3/level3.opencl @@ -74,6 +74,22 @@ R"( #endif // ================================================================================================= +#if defined(ROUTINE_INVERT) || defined(ROUTINE_TRSM) + +__kernel __attribute__((reqd_work_group_size(8, 8, 1))) +void FillMatrix(const int n, const int ld, const int offset, + __global real* restrict dest, const real_arg arg_value) { + const real value = GetRealArg(arg_value); + const int id_one = get_global_id(0); + const int id_two = get_global_id(1); + if (id_one < ld && id_two < n) { + dest[id_two*ld + id_one + offset] = value; + } +} + +#endif + +// ================================================================================================= // End of the C++11 raw string literal )" |