1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
|
/* ************************************************************************
* Copyright 2013 Advanced Micro Devices, Inc.
*
* Licensed under the Apache License, Version 2.0 (the "License");
* you may not use this file except in compliance with the License.
* You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
* ************************************************************************/
#include <sstream>
#include "symv.h"
using namespace clMath;
/*
 * Constructs a SymvStep by forwarding the CLBLAS_SYMV function identifier
 * and the supplied device to the Step base constructor. No other work is
 * done here.
 */
SymvStep::SymvStep(cl_device_id device)
    : Step(CLBLAS_SYMV, device)
{
}
/*
 * Constructs a SymvStep by forwarding the given list node to the Step base
 * constructor. No other work is done here.
 */
SymvStep::SymvStep(ListNode *node)
    : Step(node)
{
}
/*
 * Declares the constants, scalar variables, matrix, vectors and buffers
 * used by this SYMV step, hands them over through assignKargs(), and builds
 * the naiveCall_ and compareCall_ strings.
 *
 * masterStep - when NULL, the buffers are named "bufA", "bufX" and "bufY";
 *              otherwise the names are taken from the master step's buffers
 *              looked up with step_.args.A, step_.args.B and step_.args.C.
 */
void
SymvStep::declareVars(Step *masterStep)
{
    StepKargs stepArgs;
    memset(&stepArgs, 0, sizeof(stepArgs));

    std::string elemType = dtypeToString(kargs().dtype);

    // Sizes, leading dimension, increments and offsets. The registration
    // order below is kept exactly as it is; K simply aliases N.
    stepArgs.N = addConst("N", "cl_uint", kargs().N);
    stepArgs.K = stepArgs.N;
    stepArgs.lda = addConst("lda", "cl_uint", kargs().lda.matrix);
    stepArgs.ldb = addConst("incx", "cl_int", kargs().ldb.vector);
    stepArgs.ldc = addConst("incy", "cl_int", kargs().ldc.vector);
    stepArgs.offsetN = addConst("offsetN", "cl_uint", kargs().offsetN);
    stepArgs.offA = addConst("offA", "cl_uint", kargs().offA);
    stepArgs.offBX = addConst("offx", "cl_uint", kargs().offBX);
    stepArgs.offCY = addConst("offy", "cl_uint", kargs().offCY);

    // Scalar multipliers, declared with the element type of the step.
    stepArgs.alpha = addVar("alpha", elemType,
        multiplierToString(kargs().dtype, kargs().alpha));
    stepArgs.beta = addVar("beta", elemType,
        multiplierToString(kargs().dtype, kargs().beta));

    // N x N matrix A and the two vectors of length N.
    MatrixVariable *matA = addMatrix("A", elemType + "*", stepArgs.N,
        stepArgs.N, stepArgs.lda, stepArgs.offA);
    VectorVariable *vecX = addVector("X", elemType + "*", stepArgs.N,
        stepArgs.ldb, stepArgs.offBX);
    VectorVariable *vecY = addVector("Y", elemType + "*", stepArgs.N,
        stepArgs.ldc, stepArgs.offCY);

    // naiveY has the same geometry as Y and is marked as a copy of it; it
    // is the vector passed to the naive call built below.
    VectorVariable *refY = addVector("naiveY", elemType + "*", stepArgs.N,
        stepArgs.ldc, stepArgs.offCY);
    refY->setCopy(vecY);

    std::string nameA, nameX, nameY;
    if (masterStep != NULL) {
        nameA = masterStep->getBuffer((BufferID)(long)step_.args.A)->name();
        nameX = masterStep->getBuffer((BufferID)(long)step_.args.B)->name();
        nameY = masterStep->getBuffer((BufferID)(long)step_.args.C)->name();
    }
    else {
        nameA = "bufA";
        nameX = "bufX";
        nameY = "bufY";
    }

    // A and X are read-only; Y is read-write.
    stepArgs.A = addBuffer(BUFFER_A, nameA, "cl_mem", CL_MEM_READ_ONLY, matA);
    stepArgs.B = addBuffer(BUFFER_B, nameX, "cl_mem", CL_MEM_READ_ONLY, vecX);
    stepArgs.C = addBuffer(BUFFER_C, nameY, "cl_mem", CL_MEM_READ_WRITE, vecY);

    assignKargs(stepArgs);

    // Text of the naive call, which receives naiveY rather than Y.
    std::stringstream naiveText;
    naiveText << getBlasFunctionName() << "(order, uplo, "
              << stepArgs.N->name() << ", "
              << stepArgs.alpha->name() << ", " << matA->matrixPointer() << ", "
              << stepArgs.lda->name() << ", " << vecX->vectorPointer() << ", "
              << stepArgs.ldb->name() << ", " << stepArgs.beta->name() << ", "
              << refY->vectorPointer() << ", " << stepArgs.ldc->name() << ")";
    naiveCall_ = naiveText.str();

    // Text of the call that compares Y against naiveY.
    std::stringstream compareText;
    compareText << "compareVectors(" << stepArgs.N->name() << ", "
                << vecY->vectorPointer() << ", " << refY->vectorPointer()
                << ", " << stepArgs.ldc->name() << ")";
    compareCall_ = compareText.str();
}
void
SymvStep::fixLD()
{
CLBlasKargs args;
args = kargs();
if (args.lda.matrix < args.N) {
args.lda.matrix = args.N;
}
if (args.ldb.vector == 0) {
args.ldb.vector = 1;
}
if (args.ldc.vector == 0) {
args.ldc.vector = 1;
}
args.K = args.N; //store original N
setKargs(args);
}
|