From 52ccaf5b25e14c9ce032315e5e96b1f27886d481 Mon Sep 17 00:00:00 2001
From: Cedric Nugteren
Date: Thu, 16 Jun 2016 18:07:46 +0200
Subject: Added XOMATCOPY routines to perform out-of-place matrix scaling, copying, and/or transposing

---
 src/tuning/copy_pad.cc | 4 +++-
 1 file changed, 3 insertions(+), 1 deletion(-)

(limited to 'src/tuning/copy_pad.cc')

diff --git a/src/tuning/copy_pad.cc b/src/tuning/copy_pad.cc
index ec392471..7088b3bf 100644
--- a/src/tuning/copy_pad.cc
+++ b/src/tuning/copy_pad.cc
@@ -37,7 +37,7 @@ class TunePad {
   }
 
   // The list of arguments relevant for this routine
-  static std::vector<std::string> GetOptions() { return {kArgM, kArgN}; }
+  static std::vector<std::string> GetOptions() { return {kArgM, kArgN, kArgAlpha}; }
 
   // Tests for valid arguments
   static void TestValidArguments(const Arguments<T> &) { }
@@ -86,6 +86,7 @@ class TunePad {
                            std::vector<T> &, std::vector<T> &,
                            std::vector<T> &a_mat, std::vector<T> &b_mat, std::vector<T> &,
                            std::vector<T> &) {
+    auto alpha_buffer = std::vector<T>{args.alpha};
     tuner.AddArgumentScalar(static_cast<int>(args.m));
     tuner.AddArgumentScalar(static_cast<int>(args.n));
     tuner.AddArgumentScalar(static_cast<int>(args.m));
@@ -96,6 +97,7 @@ class TunePad {
     tuner.AddArgumentScalar(static_cast<int>(args.m));
     tuner.AddArgumentScalar(0);
     tuner.AddArgumentOutput(b_mat);
+    tuner.AddArgumentInput(alpha_buffer);
     tuner.AddArgumentScalar(0);
   }
 
-- 
cgit v1.2.3