summary | refs | log | tree | commit | diff
diff options
context:
space:
mode:
author: Cedric Nugteren <web@cedricnugteren.nl> 2017-11-08 21:20:07 +0100
committer: Cedric Nugteren <web@cedricnugteren.nl> 2017-11-08 21:20:07 +0100
commit: d24138808b42368a4dfe67fc9bdef546b6c358e8 (patch)
tree: 584aa01ff1f9c8fd225b5ec075d0a9e01178b016
parent: b18cc9d3f18accf88c9551c98c51b99add57b96c (diff)
Fixed an FP16 issue in the homatcopy test; added a comment about improper testing of integer-returning functions for FP16
-rw-r--r-- README.md 4
-rw-r--r-- test/routines/levelx/xomatcopy.hpp 2
2 files changed, 5 insertions, 1 deletion
diff --git a/README.md b/README.md
index 8a0fe17a..44163e7e 100644
--- a/README.md
+++ b/README.md
@@ -368,6 +368,10 @@ Known performance related issues:
* Performance issues on ARM Mali GPUs due to missing compiler support for loop unrolling and array-to-register promotion.
+Other known issues:
+
+* Routines returning an integer are currently not properly tested for half-precision FP16: IHAMAX/IHAMIN/IHMAX/IHMIN
+
Contributing
-------------
diff --git a/test/routines/levelx/xomatcopy.hpp b/test/routines/levelx/xomatcopy.hpp
index 70bda452..477d6da6 100644
--- a/test/routines/levelx/xomatcopy.hpp
+++ b/test/routines/levelx/xomatcopy.hpp
@@ -65,7 +65,7 @@ StatusCode RunReference<half>(const Arguments<half> &args, BuffersHost<half> &bu
args2.layout = args.layout; args2.a_transpose = args.a_transpose;
args2.alpha = HalfToFloat(args.alpha);
auto status = RunReference(args2, buffers2);
- FloatToHalfBuffer(buffers_host.b_mat, b_buffer2);
+ FloatToHalfBuffer(buffers_host.b_mat, buffers2.b_mat);
return status;
}