-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathKernelHelper.cpp
260 lines (210 loc) · 6.62 KB
/
KernelHelper.cpp
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
/*
* Created on: May 27, 2013
* Author: Mirko Myllykoski (mirko.myllykoski@gmail.com)
*/
#include <fstream>
#include <streambuf>
#include "common.h"
#include "DeviceInformation.h"
#include "KernelHelper.h"
using namespace pscrCL;
// Prefixes for the error and debug messages printed by this file. They extend
// errorMsgBegin / debugMsgBegin (declared outside this file) with the " / "
// separator that precedes the "Class::method: ..." part of each message.
const std::string errorLocation = errorMsgBegin + " / ";
const std::string debugLocation = debugMsgBegin + " / ";
/*
 * Creates a kernel helper for the given context, device and mode. The helper
 * starts in the "not compiled" state.
 *
 * Throws OpenCLError when the mode requests double precision and
 * DeviceInformation reports that the device does not support it.
 */
KernelHelper::KernelHelper(
        cl::Context &_context,
        cl::Device &_device,
        const PscrCLMode &_mode) :
        context(_context), device(_device), mode(_mode) {

    compiled = false;

    // The device is queried only when double precision is actually requested
    const bool doubleRequested = mode.precDouble();
    if(doubleRequested) {
        const bool doubleSupported =
            DeviceInformation::hasDoublePrecisionSupport(device);

        if(!doubleSupported) {
            std::cerr << errorLocation <<
                "KernelHelper::KernelHelper: OpenCL device does not "
                "have a double precision support." << std::endl;
            throw OpenCLError();
        }
    }
}
bool KernelHelper::isCompiled() const {
return compiled;
}
/*
 * Builds an OpenCL program from _sources for the device of this helper and
 * registers every kernel of the program under its function name.
 *
 * The compiler arguments are composed of
 *   - the DOUBLE and COMPLEX defines derived from the mode,
 *   - -cl-std=CL1.2,
 *   - -cl-single-precision-constant (only when mode.precFloat() holds),
 *   - _optionalArgs, and
 *   - the arguments returned by _optimizer.getCompilerArgs(_optValues).
 *
 * Kernels are registered with std::map::insert, so a kernel whose name is
 * already registered keeps its existing entry.
 *
 * Throws OpenCLError when the program object cannot be created or built,
 * when the kernels cannot be created, or when a kernel name cannot be
 * queried. The compiled flag is set only after everything succeeded.
 */
void KernelHelper::compileSource(
        const Optimizer& _optimizer,
        const OptValues& _optValues,
        const std::string& _optionalArgs,
        const cl::Program::Sources& _sources) {

#if FULL_DEBUG
    std::cout << debugLocation <<
        "KernelHelper::compileSource: Compiling cl-source files..." <<
        std::endl;
    Timer timer;
    timer.begin();
#endif

    cl_int err;

    // Creates a new opencl program-object
    cl::Program program = cl::Program(context, _sources, &err);
    if(err != CL_SUCCESS) {
        std::cerr << errorLocation <<
            "Cannot create program object." << std::endl;
        throw OpenCLError(err);
    }

    // Builds opencl program
    std::vector<cl::Device> tmpDevices;
    tmpDevices.push_back(device);

    // The explicit " " after _optionalArgs keeps its last option from fusing
    // with the first optimizer option when the caller did not supply a
    // trailing space.
    std::string compilerArgs =
        "-D DOUBLE=" + toString(mode.precDouble() ? 1 : 0) + " " +
        "-D COMPLEX=" + toString(mode.numComplex() ? 1 : 0) + " " +
        "-cl-std=CL1.2 " +
        (mode.precFloat() ? "-cl-single-precision-constant " : "") +
        _optionalArgs + " " +
        _optimizer.getCompilerArgs(_optValues);

#if FULL_DEBUG
    std::cout << debugLocation <<
        "KernelHelper::compileSource: Compiler arguments: " <<
        compilerArgs << std::endl;
#endif

    err = program.build(tmpDevices, compilerArgs.c_str());

    // NOTE(review): -9999 is not a named OpenCL error code; presumably a
    // vendor-specific build failure for which the arguments are worth
    // seeing -- confirm.
    if(err == -9999)
        std::cout << toString(compilerArgs) << std::endl;

    // The build log is always fetched in a FULL_DEBUG build and otherwise
    // only after a failed build.
#if FULL_DEBUG
    const bool fetchBuildLog = true;
#else
    const bool fetchBuildLog = (err != CL_SUCCESS);
#endif

    if(fetchBuildLog) {
        std::string log;
        program.getBuildInfo(device, CL_PROGRAM_BUILD_LOG, &log);

        if(err != CL_SUCCESS) {
            std::cerr << errorLocation <<
                "KernelHelper::compileSource: OpenCL compiler output:" <<
                std::endl << log << std::endl <<
                errorLocation << "Cannot build program-object. " <<
                CLErrorMessage(err) << std::endl;
            throw OpenCLError(err);
        }

        // Reached only in a FULL_DEBUG build after a successful build
        std::cout << debugLocation <<
            "KernelHelper::compileSource: OpenCL compiler output:" <<
            std::endl << log;
    }

    std::vector<cl::Kernel> kernelVector;
    err = program.createKernels(&kernelVector);
    if(err != CL_SUCCESS) {
        std::cerr << errorLocation <<
            "KernelHelper::compileSource: Cannot create kernels. " <<
            CLErrorMessage(err) << std::endl;
        throw OpenCLError(err);
    }

    // Registers each kernel under its function name
    std::vector<cl::Kernel>::const_iterator it;
    for(it = kernelVector.begin(); it != kernelVector.end(); ++it) {
        std::string kernelName = "<unknown>";
        err = it->getInfo(CL_KERNEL_FUNCTION_NAME, &kernelName);
        if(err != CL_SUCCESS) {
            std::cerr << errorLocation <<
                "KernelHelper::compileSource: Cannot get kernel name. " <<
                CLErrorMessage(err) << std::endl;
            throw OpenCLError(err);
        }

#if FULL_DEBUG
        std::cout << debugLocation <<
            "KernelHelper::compileSource: Adding kernel " << kernelName <<
            "." << std::endl;
#endif

        kernels.insert(std::pair<std::string, cl::Kernel>(kernelName, *it));
    }

#if FULL_DEBUG
    timer.end();
    std::cout << debugLocation <<
        "KernelHelper::compileSource: Compile time: " << timer.getTime() <<
        "s." << std::endl;
#endif

    compiled = true;
}
/*
 * Enqueues the kernel named _kernel into _queue.
 *
 * The launch uses a zero offset, a global range of
 * (_groups.d1 * _localSize, _groups.d2, _groups.d3) and a local range of
 * (_localSize, 1, 1). The kernel name and _info are handed to the queue
 * together with the kernel object.
 *
 * Throws UnknownError when the source code has not been compiled (getKernel
 * throws the same error for an unknown name) and OpenCLError when the queue
 * reports a failure. In a FULL_DEBUG build the call additionally waits for
 * the queue to finish.
 */
void KernelHelper::enqueueKernel(
        CommandQueue& _queue,
        const std::string& _kernel,
        const GroupCount& _groups,
        int _localSize,
        const CLKernelLaunchInfo& _info) {

    const bool ready = isCompiled();
    if(!ready) {
        std::cerr << errorLocation <<
            "KernelHelper::enqueueKernel: Cannot queue kernel. The source " <<
            "code has not been compiled." << std::endl;
        throw UnknownError();
    }

#if FULL_DEBUG
    std::cout << debugLocation <<
        "KernelHelper::enqueueKernel: Queuing kernel " << _kernel << ", " <<
        "groups: " << toString(_groups) << ", " <<
        "work group size: " << _localSize;
    if(_info != "") {
        std::cout << ", info = " << _info;
    }
    std::cout << "." << std::endl;
#endif

    // Launch geometry: only the first dimension is scaled by the local size
    cl::Kernel& launchKernel = getKernel(_kernel);
    const cl::NDRange launchOffset(0,0,0);
    const cl::NDRange globalRange(
        _groups.d1*_localSize, _groups.d2, _groups.d3);
    const cl::NDRange localRange(_localSize, 1, 1);

    cl_int status = _queue.enqueueNDRangeKernel(
        _kernel,
        launchKernel,
        launchOffset,
        globalRange,
        localRange,
        0, 0, _info);

    if(status != CL_SUCCESS) {
        std::cerr << errorLocation <<
            "KernelHelper::enqueueKernel: Cannot queue " << _kernel << ". " <<
            CLErrorMessage(status) << std::endl;
        throw OpenCLError(status);
    }

#if FULL_DEBUG
    std::cout << debugLocation <<
        "KernelHelper::enqueueKernel: Finishing..." << std::endl;

    status = _queue.finish();
    if(status != CL_SUCCESS) {
        std::cerr << errorLocation <<
            "KernelHelper::enqueueKernel: Cannot finish " << _kernel << ". " <<
            CLErrorMessage(status) << std::endl;
        throw OpenCLError(status);
    }
#endif
}
/*
 * Registers the kernel currently known as _oldName under _newName and
 * removes the old name.
 *
 * Renaming a kernel to its own name leaves the map unchanged.
 *
 * Throws UnknownError when
 *   - the source code has not been compiled,
 *   - no kernel is registered under _oldName, or
 *   - _newName is already used by another kernel. std::map::insert does not
 *     replace an existing entry, so without this check the renamed kernel
 *     would be erased and silently lost.
 * The kernel map is not modified when an error is thrown.
 */
void KernelHelper::renameKernel(
        const std::string &_oldName,
        const std::string &_newName) {

    if(!isCompiled()) {
        std::cerr << errorLocation <<
            "KernelHelper::renameKernel: Cannot find " << _oldName <<
            ". The source code has not been compiled." << std::endl;
        throw UnknownError();
    }

    std::map<std::string, cl::Kernel>::iterator kernelIt =
        kernels.find(_oldName);
    if(kernelIt == kernels.end()) {
        std::cerr << errorLocation <<
            "KernelHelper::renameKernel: Cannot find kernel " << _oldName <<
            ". Invalid kernel name." << std::endl;
        throw UnknownError();
    }

    // Checked before anything is erased so that a collision cannot drop
    // the kernel that is being renamed
    const bool sameName = (_oldName == _newName);
    if(!sameName && kernels.find(_newName) != kernels.end()) {
        std::cerr << errorLocation <<
            "KernelHelper::renameKernel: Cannot rename kernel " << _oldName <<
            " to " << _newName << ". The name is already in use." <<
            std::endl;
        throw UnknownError();
    }

#if FULL_DEBUG
    std::cout << debugLocation <<
        "KernelHelper::renameKernel: Renaming kernel " <<
        _oldName << " ==> " << _newName << "." << std::endl;
#endif

    if(sameName)
        return;

    // The kernel is copied first because erase() invalidates the iterator
    cl::Kernel kernel = kernelIt->second;
    kernels.erase(kernelIt);
    kernels.insert(std::pair<std::string, cl::Kernel>(_newName, kernel));
}
/*
 * Returns a reference to the kernel registered under the name _kernel.
 *
 * Throws UnknownError when the source code has not been compiled or when no
 * kernel is registered under the given name.
 */
cl::Kernel& KernelHelper::getKernel(const std::string _kernel) {

    const bool ready = isCompiled();
    if(!ready) {
        std::cerr << errorLocation <<
            "KernelHelper::getKernel: Cannot find " << _kernel <<
            ". The source code has not been compiled." << std::endl;
        throw UnknownError();
    }

    const std::map<std::string, cl::Kernel>::iterator match =
        kernels.find(_kernel);

    // Successful lookup
    if(match != kernels.end())
        return match->second;

    // Unknown kernel name
    std::cerr << errorMsgBegin <<
        " / KernelHelper::getKernel: Cannot find kernel " << _kernel <<
        ". Invalid kernel name." << std::endl;
    throw UnknownError();
}