1 |
#include "EXTERN.h" |
2 |
#include "perl.h" |
3 |
#include "XSUB.h" |
4 |
|
5 |
#include <CL/opencl.h> |
6 |
|
7 |
typedef cl_platform_id OpenCL__Platform; |
8 |
typedef cl_device_id OpenCL__Device; |
9 |
typedef cl_context OpenCL__Context; |
10 |
typedef cl_command_queue OpenCL__Queue; |
11 |
typedef cl_mem OpenCL__Memory; |
12 |
typedef cl_mem OpenCL__Buffer; |
13 |
typedef cl_mem OpenCL__Image; |
14 |
typedef cl_mem OpenCL__Image2D; |
15 |
typedef cl_mem OpenCL__Image3D; |
16 |
typedef cl_mem OpenCL__Memory_ornull; |
17 |
typedef cl_mem OpenCL__Buffer_ornull; |
18 |
typedef cl_mem OpenCL__Image_ornull; |
19 |
typedef cl_mem OpenCL__Image2D_ornull; |
20 |
typedef cl_mem OpenCL__Image3D_ornull; |
21 |
typedef cl_sampler OpenCL__Sampler; |
22 |
typedef cl_program OpenCL__Program; |
23 |
typedef cl_kernel OpenCL__Kernel; |
24 |
typedef cl_event OpenCL__Event; |
25 |
|
26 |
typedef struct |
27 |
{ |
28 |
IV iv; |
29 |
const char *name; |
30 |
#define const_iv(name) { (IV)CL_ ## name, # name }, |
31 |
} ivstr; |
32 |
|
33 |
static const char * |
34 |
iv2str (IV value, const ivstr *base, int count, const char *fallback) |
35 |
{ |
36 |
int i; |
37 |
static char strbuf [32]; |
38 |
|
39 |
for (i = count; i--; ) |
40 |
if (base [i].iv == value) |
41 |
return base [i].name; |
42 |
|
43 |
snprintf (strbuf, sizeof (strbuf), fallback, (int)value); |
44 |
|
45 |
return strbuf; |
46 |
} |
47 |
|
48 |
static const char * |
49 |
enum2str (cl_uint value) |
50 |
{ |
51 |
static const ivstr enumstr[] = { |
52 |
#include "enumstr.h" |
53 |
}; |
54 |
|
55 |
return iv2str (value, enumstr, sizeof (enumstr) / sizeof (enumstr [0]), "ENUM(0x%04x)"); |
56 |
} |
57 |
|
58 |
static const char * |
59 |
err2str (cl_int err) |
60 |
{ |
61 |
static const ivstr errstr[] = { |
62 |
#include "errstr.h" |
63 |
}; |
64 |
|
65 |
return iv2str (err, errstr, sizeof (errstr) / sizeof (errstr [0]), "ERROR(%d)"); |
66 |
} |
67 |
|
68 |
/* Croak with "cl<name>: <error name>" for the OpenCL status res.
 * Expands to a single expression without a trailing semicolon, so that
 * "if (x) FAIL (...); else ..." parses as intended. */
#define FAIL(name,res) \
  croak ("cl" # name ": %s", err2str (res))

/* Call cl<name> with the parenthesised argument list args and croak via FAIL
 * when it returns a non-zero status. */
#define NEED_SUCCESS(name,args) \
  do { \
    cl_int res = cl ## name args; \
    \
    if (res) \
      FAIL (name, res); \
  } while (0)

/* Wrap ptr in a new mortal reference blessed into class. */
#define NEW_MORTAL_OBJ(class,ptr) sv_setref_pv (sv_newmortal (), class, ptr)
/* Same as NEW_MORTAL_OBJ, and push the result on the Perl stack. */
#define XPUSH_NEW_OBJ(class,ptr) XPUSHs (NEW_MORTAL_OBJ (class, ptr))
81 |
|
82 |
/*TODO: event wait lists are not implemented yet - both arguments are ignored
 * and an empty wait list (count 0, null pointer) is always declared. */
#define EVENT_LIST(items,count) cl_uint event_list_count = 0; cl_event *event_list_ptr = 0

/* Body of the info XSUBs.  Expects "this" (the object) and "name" (the
 * parameter to query) in scope.  Queries the size of the value, then fetches
 * it into a new mortal byte string and pushes that on the Perl stack.
 * One extra byte is always requested and a NUL is stored after the data, so
 * the scalar has a valid, NUL-terminated buffer even for a size of 0. */
#define INFO(class) \
{ \
  size_t size; \
  SV *sv; \
 \
  NEED_SUCCESS (Get ## class ## Info, (this, name, 0, 0, &size)); \
  sv = sv_2mortal (newSV (size + 1)); \
  SvUPGRADE (sv, SVt_PV); \
  SvPOK_only (sv); \
  SvCUR_set (sv, size); \
  SvPVX (sv)[size] = 0; \
  NEED_SUCCESS (Get ## class ## Info, (this, name, size, SvPVX (sv), 0)); \
  XPUSHs (sv); \
}
98 |
|
99 |
static void * |
100 |
SvPTROBJ (const char *func, const char *svname, SV *sv, const char *pkg) |
101 |
{ |
102 |
if (SvROK (sv) && sv_derived_from (sv, pkg)) |
103 |
return (void *)SvIV (SvRV (sv)); |
104 |
|
105 |
croak ("%s: %s is not of type %s", func, svname, pkg); |
106 |
} |
107 |
|
108 |
/* Return a scratch buffer of at least size bytes.
 * The buffer is a single static allocation shared by all callers: it is
 * reused while large enough and replaced (previous contents lost) when a
 * bigger one is needed, so a returned pointer is only valid until the next
 * call.  Returns a null pointer when the request cannot be satisfied; in
 * that case the cached length is reset so a later call allocates again
 * instead of handing out a stale or null buffer. */
static void *
tmpbuf (size_t size)
{
  static void *buf;
  static size_t len;

  if (len < size)
    {
      free (buf);
      buf = 0;
      len = 0;

      /* the rounding below adds up to 4095 bytes - refuse sizes that would wrap */
      if (size > (size_t)-1 - 4096)
        return 0;

      len = ((size + 31) & ~(size_t)4095) + 4096 - 32;
      buf = malloc (len);

      if (!buf)
        len = 0;
    }

  return buf;
}
123 |
|
124 |
MODULE = OpenCL PACKAGE = OpenCL |
125 |
|
126 |
PROTOTYPES: ENABLE |
127 |
|
128 |
BOOT:
{
        /* install every table entry as a constant sub in package OpenCL */
        HV *stash = gv_stashpv ("OpenCL", 1);
        static const ivstr const_iv[] = {
          { sizeof (cl_char  ), "SIZEOF_CHAR"  },
          { sizeof (cl_uchar ), "SIZEOF_UCHAR" },
          { sizeof (cl_short ), "SIZEOF_SHORT" },
          { sizeof (cl_ushort), "SIZEOF_USHORT"},
          { sizeof (cl_int   ), "SIZEOF_INT"   },
          { sizeof (cl_uint  ), "SIZEOF_UINT"  },
          { sizeof (cl_long  ), "SIZEOF_LONG"  },
          { sizeof (cl_ulong ), "SIZEOF_ULONG" },
          { sizeof (cl_half  ), "SIZEOF_HALF"  },
          { sizeof (cl_float ), "SIZEOF_FLOAT" },
#include "constiv.h"
        };
        size_t remaining = sizeof (const_iv) / sizeof (const_iv [0]);
        /* walk the table from its last entry down to its first */
        while (remaining--)
          newCONSTSUB (stash, (char *)const_iv [remaining].name, newSViv (const_iv [remaining].iv));
}

const char *
err2str (cl_int err)

const char *
enum2str (cl_uint value)
153 |
|
154 |
void
platforms ()
        PPCODE:
        {
          /* return one OpenCL::Platform object per platform id reported by
           * clGetPlatformIDs: first ask for the count, then fetch the ids
           * into the shared scratch buffer */
          cl_uint n_platforms;
          cl_platform_id *ids;
          int idx;

          NEED_SUCCESS (GetPlatformIDs, (0, 0, &n_platforms));
          ids = tmpbuf (sizeof (*ids) * n_platforms);
          NEED_SUCCESS (GetPlatformIDs, (n_platforms, ids, 0));

          EXTEND (SP, n_platforms);

          idx = 0;
          while (idx < n_platforms)
            {
              PUSHs (NEW_MORTAL_OBJ ("OpenCL::Platform", ids [idx]));
              ++idx;
            }
        }
170 |
|
171 |
void
context_from_type_simple (cl_device_type type = CL_DEVICE_TYPE_DEFAULT)
        PPCODE:
        {
          /* create a context for the given device type, without properties
           * or notification callback, and return it as OpenCL::Context */
          cl_int status;
          cl_context new_ctx;

          new_ctx = clCreateContextFromType (0, type, 0, 0, &status);

          if (status)
            FAIL (CreateContextFromType, status);

          XPUSH_NEW_OBJ ("OpenCL::Context", new_ctx);
        }
183 |
|
184 |
void
wait_for_events (...)
        CODE:
        {
          /* EVENT_LIST declares event_list_count and event_list_ptr, which
           * are handed to clWaitForEvents; a non-zero status croaks */
          EVENT_LIST (0, items);

          NEED_SUCCESS (WaitForEvents, (event_list_count, event_list_ptr));
        }
191 |
|
192 |
PROTOTYPES: DISABLE |
193 |
|
194 |
MODULE = OpenCL PACKAGE = OpenCL::Platform |
195 |
|
196 |
void
info (OpenCL::Platform this, cl_platform_info name)
        PPCODE:
        /* INFO pushes the raw bytes clGetPlatformInfo reports for name */
        INFO (Platform)
200 |
|
201 |
void
devices (OpenCL::Platform this, cl_device_type type = CL_DEVICE_TYPE_ALL)
        PPCODE:
        {
          /* return one OpenCL::Device object per device of the requested
           * type on this platform: first ask for the count, then fetch the
           * ids into the shared scratch buffer */
          cl_uint n_devices;
          cl_device_id *ids;
          int idx;

          NEED_SUCCESS (GetDeviceIDs, (this, type, 0, 0, &n_devices));
          ids = tmpbuf (sizeof (*ids) * n_devices);
          NEED_SUCCESS (GetDeviceIDs, (this, type, n_devices, ids, 0));

          EXTEND (SP, n_devices);

          idx = 0;
          while (idx < n_devices)
            {
              PUSHs (NEW_MORTAL_OBJ ("OpenCL::Device", ids [idx]));
              ++idx;
            }
        }
217 |
|
218 |
void
context_from_type_simple (OpenCL::Platform this, cl_device_type type = CL_DEVICE_TYPE_DEFAULT)
        PPCODE:
        {
          /* like the package-level variant, but restricted to this platform
           * through a CL_CONTEXT_PLATFORM property */
          cl_context_properties props[] = { CL_CONTEXT_PLATFORM, (cl_context_properties)this, 0 };
          cl_int status;
          cl_context new_ctx;

          new_ctx = clCreateContextFromType (props, type, 0, 0, &status);

          if (status)
            FAIL (CreateContextFromType, status);

          XPUSH_NEW_OBJ ("OpenCL::Context", new_ctx);
        }
231 |
|
232 |
MODULE = OpenCL PACKAGE = OpenCL::Device |
233 |
|
234 |
void
info (OpenCL::Device this, cl_device_info name)
        PPCODE:
        /* INFO pushes the raw bytes clGetDeviceInfo reports for name */
        INFO (Device)
238 |
|
239 |
void
context_simple (OpenCL::Device this)
        PPCODE:
        {
          /* create a context containing just this device, without
           * properties or notification callback */
          cl_int status;
          cl_context new_ctx;

          new_ctx = clCreateContext (0, 1, &this, 0, 0, &status);

          if (status)
            FAIL (CreateContext, status);

          XPUSH_NEW_OBJ ("OpenCL::Context", new_ctx);
        }
251 |
|
252 |
MODULE = OpenCL PACKAGE = OpenCL::Context |
253 |
|
254 |
void
DESTROY (OpenCL::Context context)
        CODE:
        /* release the context handle; the status is not checked */
        clReleaseContext (context);

void
info (OpenCL::Context this, cl_context_info name)
        PPCODE:
        /* INFO pushes the raw bytes clGetContextInfo reports for name */
        INFO (Context)
263 |
|
264 |
void
command_queue_simple (OpenCL::Context this, OpenCL::Device device)
        PPCODE:
        {
          /* create a command queue for device with no queue properties */
          cl_int status;
          cl_command_queue new_queue;

          new_queue = clCreateCommandQueue (this, device, 0, &status);

          if (status)
            FAIL (CreateCommandQueue, status);

          XPUSH_NEW_OBJ ("OpenCL::Queue", new_queue);
        }
276 |
|
277 |
void
buffer (OpenCL::Context this, cl_mem_flags flags, size_t len)
        PPCODE:
        {
          /* create a buffer of len bytes without host data */
          cl_int status;
          cl_mem new_buf;

          /* no host data is passed, so the host-pointer flags make no sense here */
          if ((flags & CL_MEM_USE_HOST_PTR) || (flags & CL_MEM_COPY_HOST_PTR))
            croak ("clCreateBuffer: cannot use/copy host ptr when no data is given, use $context->buffer_sv instead?");

          new_buf = clCreateBuffer (this, flags, len, 0, &status);

          if (status)
            FAIL (CreateBuffer, status);

          XPUSH_NEW_OBJ ("OpenCL::Buffer", new_buf);
        }
294 |
|
295 |
void
buffer_sv (OpenCL::Context this, cl_mem_flags flags, SV *data)
        PPCODE:
        {
          /* create a buffer from the bytes of data; its size is the byte
           * length of the string */
          STRLEN n_bytes;
          char *bytes = SvPVbyte (data, n_bytes);
          cl_int status;
          cl_mem new_buf;

          /* host data is passed, so one of the host-pointer flags is required */
          if (!(flags & CL_MEM_USE_HOST_PTR) && !(flags & CL_MEM_COPY_HOST_PTR))
            croak ("clCreateBuffer: have to specify use or copy host ptr when buffer data is given, use $context->buffer instead?");

          new_buf = clCreateBuffer (this, flags, n_bytes, bytes, &status);

          if (status)
            FAIL (CreateBuffer, status);

          XPUSH_NEW_OBJ ("OpenCL::Buffer", new_buf);
        }
314 |
|
315 |
void
image2d (OpenCL::Context this, cl_mem_flags flags, cl_channel_order channel_order, cl_channel_type channel_type, size_t width, size_t height, SV *data)
        PPCODE:
        {
          /* create a 2D image from the bytes of data; the row pitch is the
           * data length divided by the number of rows */
          STRLEN len;
          char *ptr = SvPVbyte (data, len);
          const cl_image_format format = { channel_order, channel_type };
          /* a height of 0 must not divide by zero - pass 0 and let OpenCL
           * report the invalid image size */
          size_t row_pitch = height ? len / height : 0;
          cl_int res;
          cl_mem mem = clCreateImage2D (this, flags, &format, width, height, row_pitch, ptr, &res);

          if (res)
            FAIL (CreateImage2D, res);

          XPUSH_NEW_OBJ ("OpenCL::Image2D", mem);
        }
330 |
|
331 |
void
image3d (OpenCL::Context this, cl_mem_flags flags, cl_channel_order channel_order, cl_channel_type channel_type, size_t width, size_t height, size_t depth, size_t slice_pitch, SV *data)
        PPCODE:
        {
          /* create a 3D image from the bytes of data */
          STRLEN len;
          char *ptr = SvPVbyte (data, len);
          const cl_image_format format = { channel_order, channel_type };
          /* one slice holds height rows, so the row pitch is the slice pitch
           * divided by the height; when either is 0 pass 0, which avoids a
           * division by zero and leaves the choice to OpenCL */
          size_t row_pitch = height && slice_pitch ? slice_pitch / height : 0;
          cl_int res;
          cl_mem mem = clCreateImage3D (this, flags, &format, width, height,
                                        depth, row_pitch, slice_pitch, ptr, &res);

          if (res)
            FAIL (CreateImage3D, res);

          XPUSH_NEW_OBJ ("OpenCL::Image3D", mem);
        }
347 |
|
348 |
void
supported_image_formats (OpenCL::Context this, cl_mem_flags flags, cl_mem_object_type image_type)
        PPCODE:
        {
          /* return one [channel_order, channel_data_type] array reference
           * per image format supported for flags and image_type */
          cl_uint count;
          cl_image_format *list;
          int i;

          NEED_SUCCESS (GetSupportedImageFormats, (this, flags, image_type, 0, 0, &count));
          /* use the shared scratch buffer, as platforms and devices do, so
           * nothing is leaked - neither on return nor when the call below croaks */
          list = tmpbuf (sizeof (*list) * count);
          NEED_SUCCESS (GetSupportedImageFormats, (this, flags, image_type, count, list, 0));

          EXTEND (SP, count);
          for (i = 0; i < count; ++i)
            {
              AV *av = newAV ();
              /* storing index 1 first sizes the array for both elements */
              av_store (av, 1, newSVuv (list [i].image_channel_data_type));
              av_store (av, 0, newSVuv (list [i].image_channel_order));
              PUSHs (sv_2mortal (newRV_noinc ((SV *)av)));
            }
        }
369 |
|
370 |
void
sampler (OpenCL::Context this, cl_bool normalized_coords, cl_addressing_mode addressing_mode, cl_filter_mode filter_mode)
        PPCODE:
        {
          /* create a sampler object with the given settings */
          cl_int status;
          cl_sampler new_sampler;

          new_sampler = clCreateSampler (this, normalized_coords, addressing_mode, filter_mode, &status);

          if (status)
            FAIL (CreateSampler, status);

          XPUSH_NEW_OBJ ("OpenCL::Sampler", new_sampler);
        }
382 |
|
383 |
void
program_with_source (OpenCL::Context this, SV *program)
        PPCODE:
        {
          /* create a program object from a single source string, passed
           * with its explicit byte length */
          STRLEN src_len;
          const char *src = SvPVbyte (program, src_len);
          /* clCreateProgramWithSource wants size_t lengths, so copy the STRLEN */
          size_t cl_len = src_len;
          cl_int status;
          cl_program new_prog;

          new_prog = clCreateProgramWithSource (this, 1, &src, &cl_len, &status);

          if (status)
            FAIL (CreateProgramWithSource, status);

          XPUSH_NEW_OBJ ("OpenCL::Program", new_prog);
        }
401 |
|
402 |
MODULE = OpenCL PACKAGE = OpenCL::Queue |
403 |
|
404 |
void
DESTROY (OpenCL::Queue this)
        CODE:
        /* release the command queue handle; the status is not checked */
        clReleaseCommandQueue (this);

void
info (OpenCL::Queue this, cl_command_queue_info name)
        PPCODE:
        /* INFO pushes the raw bytes clGetCommandQueueInfo reports for name */
        INFO (CommandQueue)
413 |
|
414 |
void
enqueue_read_buffer (OpenCL::Queue this, OpenCL::Buffer mem, cl_bool blocking, size_t offset, size_t len, SV *data, ...)
        PPCODE:
        {
          /* read len bytes at offset from mem into the scalar data */
          cl_event ev = 0;
          /* only ask for an event when the caller wants a return value */
          cl_event *ev_out = GIMME_V != G_VOID ? &ev : 0;
          EVENT_LIST (6, items - 6);

          /* turn data into a byte string of exactly len bytes to read into */
          SvUPGRADE (data, SVt_PV);
          SvGROW (data, len);
          SvPOK_only (data);
          SvCUR_set (data, len);

          NEED_SUCCESS (EnqueueReadBuffer, (this, mem, blocking, offset, len, SvPVX (data), event_list_count, event_list_ptr, ev_out));

          if (ev)
            XPUSH_NEW_OBJ ("OpenCL::Event", ev);
        }
430 |
|
431 |
void
enqueue_write_buffer (OpenCL::Queue this, OpenCL::Buffer mem, cl_bool blocking, size_t offset, SV *data, ...)
        PPCODE:
        {
          /* write the bytes of data into mem, starting at offset; returns
           * an OpenCL::Event unless called in void context */
          cl_event ev = 0;
          STRLEN len;
          char *ptr = SvPVbyte (data, len);
          EVENT_LIST (5, items - 5);

          /* this is the write direction: clEnqueueWriteBuffer, not ...ReadBuffer */
          NEED_SUCCESS (EnqueueWriteBuffer, (this, mem, blocking, offset, len, ptr, event_list_count, event_list_ptr, GIMME_V != G_VOID ? &ev : 0));

          if (ev)
            XPUSH_NEW_OBJ ("OpenCL::Event", ev);
        }
445 |
|
446 |
void
enqueue_copy_buffer (OpenCL::Queue this, OpenCL::Buffer src, OpenCL::Buffer dst, size_t src_offset, size_t dst_offset, size_t len, ...)
        PPCODE:
        {
          /* copy len bytes from src at src_offset to dst at dst_offset */
          cl_event ev = 0;
          /* only ask for an event when the caller wants a return value */
          cl_event *ev_out = GIMME_V != G_VOID ? &ev : 0;
          EVENT_LIST (6, items - 6);

          NEED_SUCCESS (EnqueueCopyBuffer, (this, src, dst, src_offset, dst_offset, len, event_list_count, event_list_ptr, ev_out));

          if (ev)
            XPUSH_NEW_OBJ ("OpenCL::Event", ev);
        }
458 |
|
459 |
/*TODO http://www.khronos.org/registry/cl/sdk/1.1/docs/man/xhtml/clEnqueueReadBufferRect.html */ |
460 |
/*TODO http://www.khronos.org/registry/cl/sdk/1.1/docs/man/xhtml/clEnqueueWriteBufferRect.html */ |
461 |
|
462 |
void
enqueue_read_image (OpenCL::Queue this, OpenCL::Image src, cl_bool blocking, size_t src_x, size_t src_y, size_t src_z, size_t width, size_t height, size_t depth, size_t row_pitch, size_t slice_pitch, SV *data, ...)
        PPCODE:
        {
          /* read a region of the image src into the scalar data; returns an
           * OpenCL::Event unless called in void context */
          cl_event ev = 0;
          const size_t src_origin[3] = { src_x, src_y, src_z };
          const size_t region[3] = { width, height, depth };
          size_t host_row_pitch = row_pitch;
          size_t len;
          /* there are 12 fixed arguments before the optional event list */
          EVENT_LIST (12, items - 12);

          /* a row pitch of 0 asks OpenCL for tightly packed rows, so the
           * bytes per row must come from the image's element size */
          if (!host_row_pitch)
            {
              size_t element_size;

              NEED_SUCCESS (GetImageInfo, (src, CL_IMAGE_ELEMENT_SIZE, sizeof (element_size), &element_size, 0));
              host_row_pitch = element_size * width;
            }

          /* bytes written: one slice is height rows, several slices are
           * slice_pitch apart (or packed back to back when it is 0) */
          len = host_row_pitch * height;

          if (depth > 1)
            len = (slice_pitch ? slice_pitch : len) * depth;

          /* turn data into a NUL-terminated byte string of len bytes */
          SvUPGRADE (data, SVt_PV);
          SvGROW (data, len + 1);
          SvPOK_only (data);
          SvCUR_set (data, len);
          SvPVX (data)[len] = 0;
          NEED_SUCCESS (EnqueueReadImage, (this, src, blocking, src_origin, region, row_pitch, slice_pitch, SvPVX (data), event_list_count, event_list_ptr, GIMME_V != G_VOID ? &ev : 0));

          if (ev)
            XPUSH_NEW_OBJ ("OpenCL::Event", ev);
        }
481 |
|
482 |
void
enqueue_write_image (OpenCL::Queue this, OpenCL::Image dst, cl_bool blocking, size_t dst_x, size_t dst_y, size_t dst_z, size_t width, size_t height, size_t depth, size_t row_pitch, SV *data, ...)
        PPCODE:
        {
          /* write the bytes of data into a region of the image dst; returns
           * an OpenCL::Event unless called in void context */
          cl_event ev = 0;
          const size_t dst_origin[3] = { dst_x, dst_y, dst_z };
          const size_t region[3] = { width, height, depth };
          STRLEN len;
          char *ptr = SvPVbyte (data, len);
          /* the data holds its slices back to back, so the slice pitch is
           * row_pitch * height; a single slice takes a slice pitch of 0 */
          size_t slice_pitch = depth > 1 ? row_pitch * height : 0;
          EVENT_LIST (11, items - 11);

          /* with a known row pitch, refuse data that is too short - OpenCL
           * would otherwise read past the end of the string */
          if (row_pitch && len < row_pitch * height * (depth ? depth : 1))
            croak ("clEnqueueWriteImage: data string is shorter than what would be transferred");

          NEED_SUCCESS (EnqueueWriteImage, (this, dst, blocking, dst_origin, region, row_pitch, slice_pitch, ptr, event_list_count, event_list_ptr, GIMME_V != G_VOID ? &ev : 0));

          if (ev)
            XPUSH_NEW_OBJ ("OpenCL::Event", ev);
        }
499 |
|
500 |
void
enqueue_copy_buffer_rect (OpenCL::Queue this, OpenCL::Buffer src, OpenCL::Buffer dst, size_t src_x, size_t src_y, size_t src_z, size_t dst_x, size_t dst_y, size_t dst_z, size_t width, size_t height, size_t depth, size_t src_row_pitch, size_t src_slice_pitch, size_t dst_row_pitch, size_t dst_slice_pitch, ...)
        PPCODE:
        {
          /* copy a rectangular region from src to dst */
          cl_event ev = 0;
          /* only ask for an event when the caller wants a return value */
          cl_event *ev_out = GIMME_V != G_VOID ? &ev : 0;
          const size_t from[3] = { src_x, src_y, src_z };
          const size_t to[3] = { dst_x, dst_y, dst_z };
          const size_t extent[3] = { width, height, depth };
          EVENT_LIST (16, items - 16);

          NEED_SUCCESS (EnqueueCopyBufferRect, (this, src, dst, from, to, extent, src_row_pitch, src_slice_pitch, dst_row_pitch, dst_slice_pitch, event_list_count, event_list_ptr, ev_out));

          if (ev)
            XPUSH_NEW_OBJ ("OpenCL::Event", ev);
        }
515 |
|
516 |
void
enqueue_copy_buffer_to_image (OpenCL::Queue this, OpenCL::Buffer src, OpenCL::Image dst, size_t src_offset, size_t dst_x, size_t dst_y, size_t dst_z, size_t width, size_t height, size_t depth, ...)
        PPCODE:
        {
          /* copy from the buffer src at src_offset into a region of the image dst */
          cl_event ev = 0;
          /* only ask for an event when the caller wants a return value */
          cl_event *ev_out = GIMME_V != G_VOID ? &ev : 0;
          const size_t to[3] = { dst_x, dst_y, dst_z };
          const size_t extent[3] = { width, height, depth };
          EVENT_LIST (10, items - 10);

          NEED_SUCCESS (EnqueueCopyBufferToImage, (this, src, dst, src_offset, to, extent, event_list_count, event_list_ptr, ev_out));

          if (ev)
            XPUSH_NEW_OBJ ("OpenCL::Event", ev);
        }
530 |
|
531 |
void
enqueue_copy_image (OpenCL::Queue this, OpenCL::Image src, OpenCL::Image dst, size_t src_x, size_t src_y, size_t src_z, size_t dst_x, size_t dst_y, size_t dst_z, size_t width, size_t height, size_t depth, ...)
        PPCODE:
        {
          /* copy a region from the image src to the image dst; both are
           * images, as clEnqueueCopyImage requires.  Returns an
           * OpenCL::Event unless called in void context */
          cl_event ev = 0;
          const size_t src_origin[3] = { src_x, src_y, src_z };
          const size_t dst_origin[3] = { dst_x, dst_y, dst_z };
          const size_t region[3] = { width, height, depth };
          EVENT_LIST (12, items - 12);

          NEED_SUCCESS (EnqueueCopyImage, (this, src, dst, src_origin, dst_origin, region, event_list_count, event_list_ptr, GIMME_V != G_VOID ? &ev : 0));

          if (ev)
            XPUSH_NEW_OBJ ("OpenCL::Event", ev);
        }
546 |
|
547 |
void
enqueue_copy_image_to_buffer (OpenCL::Queue this, OpenCL::Image src, OpenCL::Buffer dst, size_t src_x, size_t src_y, size_t src_z, size_t width, size_t height, size_t depth, size_t dst_offset, ...)
        PPCODE:
        {
          /* copy a region of the image src into the buffer dst at dst_offset */
          cl_event ev = 0;
          /* only ask for an event when the caller wants a return value */
          cl_event *ev_out = GIMME_V != G_VOID ? &ev : 0;
          const size_t from[3] = { src_x, src_y, src_z };
          const size_t extent[3] = { width, height, depth };
          EVENT_LIST (10, items - 10);

          NEED_SUCCESS (EnqueueCopyImageToBuffer, (this, src, dst, from, extent, dst_offset, event_list_count, event_list_ptr, ev_out));

          if (ev)
            XPUSH_NEW_OBJ ("OpenCL::Event", ev);
        }
561 |
|
562 |
void
enqueue_task (OpenCL::Queue this, OpenCL::Kernel kernel, ...)
        PPCODE:
        {
          /* enqueue kernel via clEnqueueTask */
          cl_event ev = 0;
          /* only ask for an event when the caller wants a return value */
          cl_event *ev_out = GIMME_V != G_VOID ? &ev : 0;
          EVENT_LIST (2, items - 2);

          NEED_SUCCESS (EnqueueTask, (this, kernel, event_list_count, event_list_ptr, ev_out));

          if (ev)
            XPUSH_NEW_OBJ ("OpenCL::Event", ev);
        }
574 |
|
575 |
void
enqueue_nd_range_kernel (OpenCL::Queue this, OpenCL::Kernel kernel, SV *global_work_offset, SV *global_work_size, SV *local_work_size = &PL_sv_undef, ...)
        PPCODE:
        {
          /* enqueue kernel over an N-dimensional range.  global_work_size
           * must be an array reference and fixes the number of dimensions;
           * global_work_offset and local_work_size are undef or array
           * references with the same number of elements.  Returns an
           * OpenCL::Event unless called in void context */
          cl_event ev = 0;
          size_t *gwo = 0, *gws, *lws = 0;
          int gws_len;
          size_t *lists;
          int i;
          /* there are 5 named arguments before the optional event list,
           * the last of which may be omitted */
          EVENT_LIST (5, items > 5 ? items - 5 : 0);

          if (!SvROK (global_work_size) || SvTYPE (SvRV (global_work_size)) != SVt_PVAV)
            croak ("clEnqueueNDRangeKernel: global_work_size must be an array reference");

          gws_len = AvFILLp (SvRV (global_work_size)) + 1;

          /* one scratch allocation holds all three arrays: sizes, offsets, local sizes */
          lists = tmpbuf (sizeof (size_t) * 3 * gws_len);

          gws = lists + gws_len * 0;
          for (i = 0; i < gws_len; ++i)
            gws [i] = SvIV (AvARRAY (SvRV (global_work_size))[i]);

          if (SvOK (global_work_offset))
            {
              if (!SvROK (global_work_offset) || SvTYPE (SvRV (global_work_offset)) != SVt_PVAV)
                croak ("clEnqueueNDRangeKernel: global_work_offset must be undef or an array reference");

              /* check the offset array itself, so the loop below stays inside it */
              if (AvFILLp (SvRV (global_work_offset)) + 1 != gws_len)
                croak ("clEnqueueNDRangeKernel: global_work_offset must be undef or an array of same size as global_work_size");

              gwo = lists + gws_len * 1;
              for (i = 0; i < gws_len; ++i)
                gwo [i] = SvIV (AvARRAY (SvRV (global_work_offset))[i]);
            }

          if (SvOK (local_work_size))
            {
              if (!SvROK (local_work_size) || SvTYPE (SvRV (local_work_size)) != SVt_PVAV)
                croak ("clEnqueueNDRangeKernel: local_work_size must be undef or an array reference");

              if (AvFILLp (SvRV (local_work_size)) + 1 != gws_len)
                croak ("clEnqueueNDRangeKernel: local_work_size must be undef or an array of same size as global_work_size");

              lws = lists + gws_len * 2;
              for (i = 0; i < gws_len; ++i)
                lws [i] = SvIV (AvARRAY (SvRV (local_work_size))[i]);
            }

          NEED_SUCCESS (EnqueueNDRangeKernel, (this, kernel, gws_len, gwo, gws, lws, event_list_count, event_list_ptr, GIMME_V != G_VOID ? &ev : 0));

          if (ev)
            XPUSH_NEW_OBJ ("OpenCL::Event", ev);
        }
628 |
|
629 |
void
enqueue_marker (OpenCL::Queue this)
        PPCODE:
        {
          /* enqueue a marker and return its event as OpenCL::Event */
          cl_event marker_ev;

          NEED_SUCCESS (EnqueueMarker, (this, &marker_ev));

          XPUSH_NEW_OBJ ("OpenCL::Event", marker_ev);
        }

void
enqueue_wait_for_events (OpenCL::Queue this, ...)
        CODE:
        {
          /* EVENT_LIST declares event_list_count and event_list_ptr, which
           * are handed to clEnqueueWaitForEvents; a non-zero status croaks */
          EVENT_LIST (1, items - 1);

          NEED_SUCCESS (EnqueueWaitForEvents, (this, event_list_count, event_list_ptr));
        }
645 |
|
646 |
void
enqueue_barrier (OpenCL::Queue this)
        CODE:
        {
          /* croaks when clEnqueueBarrier reports an error */
          NEED_SUCCESS (EnqueueBarrier, (this));
        }

void
flush (OpenCL::Queue this)
        CODE:
        {
          /* croaks when clFlush reports an error */
          NEED_SUCCESS (Flush, (this));
        }

void
finish (OpenCL::Queue this)
        CODE:
        {
          /* croaks when clFinish reports an error */
          NEED_SUCCESS (Finish, (this));
        }
660 |
|
661 |
MODULE = OpenCL PACKAGE = OpenCL::Memory |
662 |
|
663 |
void
DESTROY (OpenCL::Memory this)
        CODE:
        /* release the memory object handle; the status is not checked */
        clReleaseMemObject (this);

void
info (OpenCL::Memory this, cl_mem_info name)
        PPCODE:
        /* INFO pushes the raw bytes clGetMemObjectInfo reports for name */
        INFO (MemObject)
672 |
|
673 |
MODULE = OpenCL PACKAGE = OpenCL::Sampler |
674 |
|
675 |
void
DESTROY (OpenCL::Sampler this)
        CODE:
        /* release the sampler handle; the status is not checked */
        clReleaseSampler (this);

void
info (OpenCL::Sampler this, cl_sampler_info name)
        PPCODE:
        /* INFO pushes the raw bytes clGetSamplerInfo reports for name */
        INFO (Sampler)
684 |
|
685 |
MODULE = OpenCL PACKAGE = OpenCL::Program |
686 |
|
687 |
void
DESTROY (OpenCL::Program this)
        CODE:
        /* release the program handle; the status is not checked */
        clReleaseProgram (this);

void
info (OpenCL::Program this, cl_program_info name)
        PPCODE:
        /* INFO pushes the raw bytes clGetProgramInfo reports for name */
        INFO (Program)
696 |
|
697 |
void
build (OpenCL::Program this, OpenCL::Device device, SV *options = &PL_sv_undef)
        CODE:
        {
          /* build the program for device.  Undefined (or omitted) options
           * are passed to clBuildProgram as a null pointer instead of being
           * stringified; a non-zero status croaks */
          const char *opts = SvOK (options) ? SvPVbyte_nolen (options) : 0;

          NEED_SUCCESS (BuildProgram, (this, 1, &device, opts, 0, 0));
        }
701 |
|
702 |
void
build_info (OpenCL::Program this, OpenCL::Device device, cl_program_build_info name)
        PPCODE:
        {
          /* return the raw bytes clGetProgramBuildInfo reports for name on
           * device: first ask for the size, then fetch the value */
          size_t size;
          SV *sv;

          NEED_SUCCESS (GetProgramBuildInfo, (this, device, name, 0, 0, &size));
          /* one extra byte plus an explicit NUL after the data, so the
           * scalar has a valid, NUL-terminated buffer even for a size of 0 */
          sv = sv_2mortal (newSV (size + 1));
          SvUPGRADE (sv, SVt_PV);
          SvPOK_only (sv);
          SvCUR_set (sv, size);
          SvPVX (sv)[size] = 0;
          NEED_SUCCESS (GetProgramBuildInfo, (this, device, name, size, SvPVX (sv), 0));
          XPUSHs (sv);
        }
717 |
|
718 |
void
kernel (OpenCL::Program program, SV *function)
        PPCODE:
        {
          /* create a kernel object for the named function of program */
          const char *function_name = SvPVbyte_nolen (function);
          cl_int status;
          cl_kernel new_kernel;

          new_kernel = clCreateKernel (program, function_name, &status);

          if (status)
            FAIL (CreateKernel, status);

          XPUSH_NEW_OBJ ("OpenCL::Kernel", new_kernel);
        }
730 |
|
731 |
MODULE = OpenCL PACKAGE = OpenCL::Kernel |
732 |
|
733 |
void
DESTROY (OpenCL::Kernel this)
        CODE:
        /* release the kernel handle; the status is not checked */
        clReleaseKernel (this);

void
info (OpenCL::Kernel this, cl_kernel_info name)
        PPCODE:
        /* INFO pushes the raw bytes clGetKernelInfo reports for name */
        INFO (Kernel)
742 |
|
743 |
void
set_char (OpenCL::Kernel this, cl_uint idx, cl_char value)
        CODE:
        /* all set_* methods pass value, with the size of its C type, to
         * clSetKernelArg for argument idx and croak on a non-zero status */
        NEED_SUCCESS (SetKernelArg, (this, idx, sizeof (value), &value));

void
set_uchar (OpenCL::Kernel this, cl_uint idx, cl_uchar value)
        CODE:
        NEED_SUCCESS (SetKernelArg, (this, idx, sizeof (value), &value));

void
set_short (OpenCL::Kernel this, cl_uint idx, cl_short value)
        CODE:
        NEED_SUCCESS (SetKernelArg, (this, idx, sizeof (value), &value));

void
set_ushort (OpenCL::Kernel this, cl_uint idx, cl_ushort value)
        CODE:
        NEED_SUCCESS (SetKernelArg, (this, idx, sizeof (value), &value));

void
set_int (OpenCL::Kernel this, cl_uint idx, cl_int value)
        CODE:
        NEED_SUCCESS (SetKernelArg, (this, idx, sizeof (value), &value));

void
set_uint (OpenCL::Kernel this, cl_uint idx, cl_uint value)
        CODE:
        NEED_SUCCESS (SetKernelArg, (this, idx, sizeof (value), &value));

void
set_long (OpenCL::Kernel this, cl_uint idx, cl_long value)
        CODE:
        NEED_SUCCESS (SetKernelArg, (this, idx, sizeof (value), &value));

void
set_ulong (OpenCL::Kernel this, cl_uint idx, cl_ulong value)
        CODE:
        NEED_SUCCESS (SetKernelArg, (this, idx, sizeof (value), &value));

void
set_half (OpenCL::Kernel this, cl_uint idx, cl_half value)
        CODE:
        NEED_SUCCESS (SetKernelArg, (this, idx, sizeof (value), &value));

void
set_float (OpenCL::Kernel this, cl_uint idx, cl_float value)
        CODE:
        NEED_SUCCESS (SetKernelArg, (this, idx, sizeof (value), &value));

void
set_memory (OpenCL::Kernel this, cl_uint idx, OpenCL::Memory_ornull value)
        CODE:
        /* the object setters pass the handle itself as the argument value */
        NEED_SUCCESS (SetKernelArg, (this, idx, sizeof (value), &value));

void
set_buffer (OpenCL::Kernel this, cl_uint idx, OpenCL::Buffer_ornull value)
        CODE:
        NEED_SUCCESS (SetKernelArg, (this, idx, sizeof (value), &value));

void
set_image2d (OpenCL::Kernel this, cl_uint idx, OpenCL::Image2D_ornull value)
        CODE:
        NEED_SUCCESS (SetKernelArg, (this, idx, sizeof (value), &value));

void
set_image3d (OpenCL::Kernel this, cl_uint idx, OpenCL::Image3D_ornull value)
        CODE:
        NEED_SUCCESS (SetKernelArg, (this, idx, sizeof (value), &value));

void
set_sampler (OpenCL::Kernel this, cl_uint idx, OpenCL::Sampler value)
        CODE:
        NEED_SUCCESS (SetKernelArg, (this, idx, sizeof (value), &value));

void
set_event (OpenCL::Kernel this, cl_uint idx, OpenCL::Event value)
        CODE:
        NEED_SUCCESS (SetKernelArg, (this, idx, sizeof (value), &value));
822 |
|
823 |
MODULE = OpenCL PACKAGE = OpenCL::Event |
824 |
|
825 |
void
DESTROY (OpenCL::Event this)
        CODE:
        /* release the event handle; the status is not checked */
        clReleaseEvent (this);

void
info (OpenCL::Event this, cl_event_info name)
        PPCODE:
        /* INFO pushes the raw bytes clGetEventInfo reports for name */
        INFO (Event)
834 |
|
835 |
void
wait (OpenCL::Event this)
        CODE:
        /* wait for this single event; croaks when clWaitForEvents reports
         * an error instead of silently returning */
        NEED_SUCCESS (WaitForEvents, (1, &this));
839 |
|