summaryrefslogtreecommitdiff
path: root/external/clBLAS/src/library/tools/ktest/steps/symv.cpp
blob: bfe223029c9299f820a261da852956a418603083 (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
/* ************************************************************************
 * Copyright 2013 Advanced Micro Devices, Inc.
 *
 * Licensed under the Apache License, Version 2.0 (the "License");
 * you may not use this file except in compliance with the License.
 * You may obtain a copy of the License at
 *
 * http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 * ************************************************************************/


#include <sstream>

#include "symv.h"

using namespace clMath;

SymvStep::SymvStep(cl_device_id device) :
    Step(CLBLAS_SYMV, device)
{
}

SymvStep::SymvStep(ListNode *node) :
    Step(node)
{
}

void
SymvStep::declareVars(Step *masterStep)
{
    StepKargs args;
    MatrixVariable *A;
    VectorVariable *X, *Y, *naiveY;

    memset(&args, 0, sizeof(args));
    std::string type = dtypeToString(kargs().dtype);

    args.N = addConst("N", "cl_uint", kargs().N);
    args.K = args.N;

    args.lda = addConst("lda", "cl_uint", kargs().lda.matrix);
    args.ldb = addConst("incx", "cl_int", kargs().ldb.vector);
    args.ldc = addConst("incy", "cl_int", kargs().ldc.vector);

    args.offsetN = addConst("offsetN", "cl_uint", kargs().offsetN);

    args.offA = addConst("offA", "cl_uint", kargs().offA);
    args.offBX = addConst("offx", "cl_uint", kargs().offBX);
    args.offCY = addConst("offy", "cl_uint", kargs().offCY);

    args.alpha = addVar("alpha", type,
        multiplierToString(kargs().dtype, kargs().alpha));
    args.beta = addVar("beta", type,
        multiplierToString(kargs().dtype, kargs().beta));

    A = addMatrix("A", type + "*", args.N, args.N, args.lda, args.offA);
    X = addVector("X", type + "*", args.N, args.ldb, args.offBX);
    Y = addVector("Y", type + "*", args.N, args.ldc, args.offCY);
    naiveY = addVector("naiveY", type + "*", args.N, args.ldc, args.offCY);
    naiveY->setCopy(Y);

    std::string bufAName, bufBName, bufCName;
    if (NULL == masterStep) {
        bufAName = "bufA";
        bufBName = "bufX";
        bufCName = "bufY";
    }
    else {
        bufAName = masterStep->getBuffer((BufferID)(long)step_.args.A)->name();
        bufBName = masterStep->getBuffer((BufferID)(long)step_.args.B)->name();
        bufCName = masterStep->getBuffer((BufferID)(long)step_.args.C)->name();
    }
    args.A = addBuffer(BUFFER_A, bufAName, "cl_mem", CL_MEM_READ_ONLY, A);
    args.B = addBuffer(BUFFER_B, bufBName, "cl_mem", CL_MEM_READ_ONLY, X);
    args.C = addBuffer(BUFFER_C, bufCName, "cl_mem", CL_MEM_READ_WRITE, Y);

    assignKargs(args);

    std::stringstream ss;
    ss << getBlasFunctionName() << "(order, uplo, "
       << args.N->name() << ", "
       << args.alpha->name() << ", " << A->matrixPointer() << ", "
       << args.lda->name() << ", " << X->vectorPointer() << ", "
       << args.ldb->name() << ", " << args.beta->name() << ", "
       << naiveY->vectorPointer() << ", " << args.ldc->name() << ")";
    naiveCall_ = ss.str();

    ss.str("");
    ss << "compareVectors(" << args.N->name() << ", " << Y->vectorPointer()
       << ", " << naiveY->vectorPointer() << ", " << args.ldc->name() << ")";
    compareCall_ = ss.str();
}

void
SymvStep::fixLD()
{
    CLBlasKargs args;

    args = kargs();

    if (args.lda.matrix < args.N) {
        args.lda.matrix = args.N;
    }

    if (args.ldb.vector == 0) {
        args.ldb.vector = 1;
    }
    if (args.ldc.vector == 0) {
        args.ldc.vector = 1;
    }
    args.K = args.N; //store original N

    setKargs(args);
}