ViewVC Help
View File | Revision Log | Show Annotations | Download File
/cvs/OpenCL/OpenCL.xs
Revision: 1.43
Committed: Sat Apr 21 22:16:09 2012 UTC (12 years ago) by root
Branch: MAIN
Changes since 1.42: +7 -10 lines
Log Message:
*** empty log message ***

File Contents

# Content
1 #include "EXTERN.h"
2 #include "perl.h"
3 #include "XSUB.h"
4
5 #ifdef I_DLFCN
6 #include <dlfcn.h>
7 #endif
8
9 // how stupid is that, the 1.2 header files define CL_VERSION_1_1,
10 // but then fail to define the api functions unless you ALSO define
11 // this. This breaks 100% of the opencl 1.1 apps, for what reason?
12 // after all, the functions are deprecated, not removed.
13 // in addition, you cannot test for this in any future-proof way.
14 // each time a new opencl version comes out, you need to make a new
15 // release.
16 #define CL_USE_DEPRECATED_OPENCL_1_1_APIS
17 #define CL_USE_DEPRECATED_OPENCL_1_2_APIS /* just guessing, you stupid idiots */
18
19 #ifdef __APPLE__
20 #include <OpenCL/opencl.h>
21 #else
22 #include <CL/opencl.h>
23 #endif
24
25 #if 0 // testing
26 #undef CL_USE_DEPRECATED_OPENCL_1_1_APIS
27 #undef CL_VERSION_1_2
28 #endif
29
/* C-side type names for the Perl classes used in the XSUB signatures below */
/* (presumably xsubpp maps "OpenCL::Foo" to "OpenCL__Foo" - confirm against the typemap). */
/* Several names alias the same OpenCL handle type, e.g. all memory/image classes are cl_mem. */
30 typedef cl_platform_id OpenCL__Platform;
31 typedef cl_device_id OpenCL__Device;
32 typedef cl_context OpenCL__Context;
33 typedef cl_command_queue OpenCL__Queue;
34 typedef cl_mem OpenCL__Memory;
35 typedef cl_mem OpenCL__Buffer;
36 typedef cl_mem OpenCL__BufferObj;
37 typedef cl_mem OpenCL__Image;
38 typedef cl_mem OpenCL__Image2D;
39 typedef cl_mem OpenCL__Image3D;
40 typedef cl_mem OpenCL__Memory_ornull;
41 typedef cl_mem OpenCL__Buffer_ornull;
42 typedef cl_mem OpenCL__Image_ornull;
43 typedef cl_mem OpenCL__Image2D_ornull;
44 typedef cl_mem OpenCL__Image3D_ornull;
45 typedef cl_sampler OpenCL__Sampler;
46 typedef cl_program OpenCL__Program;
47 typedef cl_kernel OpenCL__Kernel;
48 typedef cl_event OpenCL__Event;
49 typedef cl_event OpenCL__UserEvent;
50
/* Placeholder type for parameters (the "notify" arguments below) that are accepted but not used by any visible XSUB body. */
51 typedef SV *FUTURE;
52
53 /*****************************************************************************/
54
/*
 * Resolve an OpenGL/GLX entry point at run time.
 *
 * name must include a leading underscore: every lookup is tried first
 * without it (name + 1) and then with it.
 * All of these horrors would be unnecessary if somebody wrote a proper
 * OpenGL module for perl. doh.
 *
 * The symbol is searched in the already loaded objects first; if that
 * fails, the first libGL candidate that can be dlopen'ed is searched (its
 * handle is cached for later calls).  Returns 0 when nothing was found or
 * when dlfcn/RTLD_DEFAULT are unavailable at compile time.
 */
static void *
glsym (const char *name)
{
#if defined I_DLFCN && defined RTLD_DEFAULT
  static const char *candidates[] = {
    "libGL.so.1",
    "libGL.so.3",
    "libGL.so.4.0",
    "libGL.so",
    "/usr/lib/libGL.so",
    "/usr/X11R6/lib/libGL.1.dylib"
  };
  static void *libgl; /* cached dlopen handle, 0 until a candidate loaded */
  const char *bare = name + 1;
  void *sym;
  int n;

  /* process-wide lookup first */
  sym = dlsym (RTLD_DEFAULT, bare);
  if (sym)
    return sym;

  sym = dlsym (RTLD_DEFAULT, name);
  if (sym)
    return sym;

  /* stop at the first library that loads */
  for (n = 0; !libgl && n < sizeof (candidates) / sizeof (candidates [0]); ++n)
    libgl = dlopen (candidates [n], RTLD_LAZY);

  if (!libgl)
    return 0;

  sym = dlsym (libgl, bare);

  return sym ? sym : dlsym (libgl, name);
#else
  return 0;
#endif
}
97
98 /*****************************************************************************/
99
/*
 * Return a scratch buffer of at least size bytes.
 *
 * Buffers live in a ring of `buffers` (three) slots that are handed out in
 * rotation: a pointer stays usable across the next two tmpbuf calls, the
 * third later call hands out the same slot again (possibly reallocated).
 * The caller must not free the result.
 *
 * Returns 0 when the request is so large that rounding it up would
 * overflow size_t, or when malloc fails.  A slot that was never grown also
 * yields 0 for a zero-sized request.
 */
static void *
tmpbuf (size_t size)
{
  enum { buffers = 3 };
  static int idx;
  static void *buf [buffers];
  static size_t len [buffers];

  idx = (idx + 1) % buffers;

  if (len [idx] < size)
    {
      size_t want;

      /* the rounding below adds up to 4095 bytes - refuse sizes where that would wrap */
      if (size > (size_t)-1 - 4096)
        return 0;

      want = ((size + 31) & ~(size_t)4095) + 4096 - 32;

      free (buf [idx]);
      buf [idx] = malloc (want);
      /* never record a capacity for a buffer we failed to get */
      len [idx] = buf [idx] ? want : 0;
    }

  return buf [idx];
}
120
121 /*****************************************************************************/
122
123 typedef struct
124 {
125 IV iv;
126 const char *name;
127 #define const_iv(name) { (IV)CL_ ## name, # name },
128 } ivstr;
129
130 static const char *
131 iv2str (IV value, const ivstr *base, int count, const char *fallback)
132 {
133 int i;
134 static char strbuf [32];
135
136 for (i = count; i--; )
137 if (base [i].iv == value)
138 return base [i].name;
139
140 snprintf (strbuf, sizeof (strbuf), fallback, (int)value);
141
142 return strbuf;
143 }
144
145 static const char *
146 enum2str (cl_uint value)
147 {
148 static const ivstr enumstr[] = {
149 #include "enumstr.h"
150 };
151
152 return iv2str (value, enumstr, sizeof (enumstr) / sizeof (enumstr [0]), "ENUM(0x%04x)");
153 }
154
155 static const char *
156 err2str (cl_int err)
157 {
158 static const ivstr errstr[] = {
159 #include "errstr.h"
160 };
161
162 return iv2str (err, errstr, sizeof (errstr) / sizeof (errstr [0]), "ERROR(%d)");
163 }
164
165 /*****************************************************************************/
166
/* Status of the most recent OpenCL call made through the macros below; also returned by the errno XSUB. */
167 static cl_int res;
168
/* Croak with "cl<name>: <error text>", where the text is err2str (res). */
/* Note: the expansion already ends in a semicolon. */
169 #define FAIL(name) \
170 croak ("cl" # name ": %s", err2str (res));
171
/* Call cl<name> with the parenthesised argument list args, store the return value in res */
/* and FAIL when it is non-zero. Usable as a single statement. */
172 #define NEED_SUCCESS(name,args) \
173 do { \
174 res = cl ## name args; \
175 \
176 if (res) \
177 FAIL (name); \
178 } while (0)
179
/* Variant for calls that return a handle: assigns the call result to retdecl (which may be */
/* a declaration such as "cl_mem mem") and then FAILs when res is non-zero. The macro does not */
/* set res itself - the call is expected to receive &res in args. Expands to several statements */
/* (no do/while wrapper), so it must not be used as the body of an unbraced if/else. */
180 #define NEED_SUCCESS_ARG(retdecl, name, args) \
181 retdecl = cl ## name args; \
182 if (res) \
183 FAIL (name);
184
185 /*****************************************************************************/
186
/* Create a new mortal SV that is a reference blessed into class and holding ptr (via sv_setref_pv). */
187 #define NEW_MORTAL_OBJ(class,ptr) sv_setref_pv (sv_newmortal (), class, ptr)
/* Same, and push the result on the Perl stack, extending it if needed (XPUSHs). */
188 #define XPUSH_NEW_OBJ(class,ptr) XPUSHs (NEW_MORTAL_OBJ (class, ptr))
189
190 static void *
191 SvPTROBJ (const char *func, const char *svname, SV *sv, const char *pkg)
192 {
193 if (SvROK (sv) && sv_derived_from (sv, pkg))
194 return (void *)SvIV (SvRV (sv));
195
196 croak ("%s: %s is not of type %s", func, svname, pkg);
197 }
198
199 /*****************************************************************************/
200
201 static cl_context_properties *
202 SvCONTEXTPROPERTIES (const char *func, const char *svname, SV *sv, cl_context_properties *extra, int extracount)
203 {
204 if (!sv || !SvOK (sv))
205 if (extra)
206 sv = sv_2mortal (newRV_noinc ((SV *)newAV ())); // slow, but rarely used hopefully
207 else
208 return 0;
209
210 if (SvROK (sv) && SvTYPE (SvRV (sv)) == SVt_PVAV)
211 {
212 AV *av = (AV *)SvRV (sv);
213 int i, len = av_len (av) + 1;
214 cl_context_properties *p = tmpbuf (sizeof (cl_context_properties) * (len + extracount + 1));
215 cl_context_properties *l = p;
216
217 if (len & 1)
218 croak ("%s: %s is not a property list (must be even number of elements)", func, svname);
219
220 while (extracount--)
221 *l++ = *extra++;
222
223 for (i = 0; i < len; i += 2)
224 {
225 cl_context_properties t = SvIV (*av_fetch (av, i , 0));
226 SV *p_sv = *av_fetch (av, i + 1, 0);
227 cl_context_properties v = SvIV (p_sv); // code below can override
228
229 switch (t)
230 {
231 case CL_GLX_DISPLAY_KHR:
232 if (!SvOK (p_sv))
233 {
234 void *func = glsym ("_glXGetCurrentDisplay");
235 if (func)
236 v = (cl_context_properties)((void *(*)(void))func)();
237 }
238 break;
239
240 case CL_GL_CONTEXT_KHR:
241 if (!SvOK (p_sv))
242 {
243 void *func = glsym ("_glXGetCurrentContext");
244 if (func)
245 v = (cl_context_properties)((void *(*)(void))func)();
246 }
247 break;
248
249 default:
250 /* unknown property, treat as int */
251 break;
252 }
253
254 *l++ = t;
255 *l++ = v;
256 }
257
258 *l = 0;
259
260 return p;
261 }
262
263 croak ("%s: %s is not a property list (either undef or [type => value, ...])", func, svname);
264 }
265
266 /*****************************************************************************/
267
268 static size_t
269 img_row_pitch (cl_mem img)
270 {
271 size_t res;
272 clGetImageInfo (img, CL_IMAGE_ROW_PITCH, sizeof (res), &res, 0);
273 return res;
274 }
275
276 static cl_event *
277 event_list (SV **items, cl_uint *rcount)
278 {
279 cl_uint count = *rcount;
280
281 if (!count)
282 return 0;
283
284 cl_event *list = tmpbuf (sizeof (cl_event) * count);
285 int i = 0;
286
287 do
288 {
289 --count;
290 if (SvOK (items [count]))
291 list [i++] = SvPTROBJ ("clEnqueue", "wait_events", items [count], "OpenCL::Event");
292 }
293 while (count);
294
295 *rcount = i;
296
297 return i ? list : 0;
298 }
299
/* Declare event_list_count and event_list_ptr in the current scope, built by event_list from the */
/* count Perl stack entries starting at ST (items). Expands to two declarations without a trailing semicolon. */
300 #define EVENT_LIST(items,count) \
301 cl_uint event_list_count = (count); \
302 cl_event *event_list_ptr = event_list (&ST (items), &event_list_count)
303
/* Body of the generic "info" XSUBs: asks clGet<class>Info for the size of item name of object self, */
/* then reads the raw bytes into a new mortal string SV of that length and pushes it. */
/* Expects self and name to be in scope; croaks via NEED_SUCCESS when either call fails. */
304 #define INFO(class) \
305 { \
306 size_t size; \
307 NEED_SUCCESS (Get ## class ## Info, (self, name, 0, 0, &size)); \
308 SV *sv = sv_2mortal (newSV (size)); \
309 SvUPGRADE (sv, SVt_PV); \
310 SvPOK_only (sv); \
311 SvCUR_set (sv, size); \
312 NEED_SUCCESS (Get ## class ## Info, (self, name, size, SvPVX (sv), 0)); \
313 XPUSHs (sv); \
314 }
315
316 MODULE = OpenCL PACKAGE = OpenCL
317
318 PROTOTYPES: ENABLE
319
BOOT:
{
        /* name/value table: the SIZEOF_* entries plus whatever constiv.h contributes */
        static const ivstr const_iv[] = {
          { sizeof (cl_char  ), "SIZEOF_CHAR"   },
          { sizeof (cl_uchar ), "SIZEOF_UCHAR"  },
          { sizeof (cl_short ), "SIZEOF_SHORT"  },
          { sizeof (cl_ushort), "SIZEOF_USHORT" },
          { sizeof (cl_int   ), "SIZEOF_INT"    },
          { sizeof (cl_uint  ), "SIZEOF_UINT"   },
          { sizeof (cl_long  ), "SIZEOF_LONG"   },
          { sizeof (cl_ulong ), "SIZEOF_ULONG"  },
          { sizeof (cl_half  ), "SIZEOF_HALF"   },
          { sizeof (cl_float ), "SIZEOF_FLOAT"  },
          { sizeof (cl_double), "SIZEOF_DOUBLE" },
#include "constiv.h"
        };
        HV *stash = gv_stashpv ("OpenCL", 1);
        int remaining = sizeof (const_iv) / sizeof (const_iv [0]);
        /* install every entry as a constant sub in package OpenCL, last entry first */
        while (remaining--)
          newCONSTSUB (stash, (char *)const_iv [remaining].name, newSViv (const_iv [remaining].iv));
}
340
# Return the current value of the file-level status variable res,
# i.e. the status stored by the most recent NEED_SUCCESS/NEED_SUCCESS_ARG call.
341 cl_int
342 errno ()
343 CODE:
344 RETVAL = res;
345 OUTPUT:
346 RETVAL
347
# Perl-visible wrapper around the C helper err2str (error code to name).
348 const char *
349 err2str (cl_int err)
350
# Perl-visible wrapper around the C helper enum2str (enum value to name).
351 const char *
352 enum2str (cl_uint value)
353
# Return a list of OpenCL::Platform objects, one per platform id
# reported by clGetPlatformIDs. Croaks when either query fails.
void
platforms ()
        PPCODE:
        cl_uint count, n;
        cl_platform_id *ids;

        /* first ask how many there are, then fetch them into scratch memory */
        NEED_SUCCESS (GetPlatformIDs, (0, 0, &count));
        ids = tmpbuf (sizeof (*ids) * count);
        NEED_SUCCESS (GetPlatformIDs, (count, ids, 0));

        EXTEND (SP, count);
        for (n = 0; n < count; ++n)
          PUSHs (NEW_MORTAL_OBJ ("OpenCL::Platform", ids [n]));
368
# Create a context via clCreateContextFromType and return it as an
# OpenCL::Context object. The notify argument is accepted but not used.
void
context_from_type (cl_context_properties *properties = 0, cl_device_type type = CL_DEVICE_TYPE_DEFAULT, FUTURE notify = 0)
        PPCODE:
        cl_context ctx;
        /* the call reports its status through &res, which the macro then checks */
        NEED_SUCCESS_ARG (ctx, CreateContextFromType, (properties, type, 0, 0, &res));
        XPUSH_NEW_OBJ ("OpenCL::Context", ctx);
374
375 #if 0
376
# Unimplemented stub; the surrounding "#if 0" keeps it out of the build.
377 void
378 context (cl_context_properties *properties = 0, FUTURE devices, FUTURE notify = 0)
379 PPCODE:
380 /* the pinnacle of art */
381
382 #endif
383
# Wait for all given events via clWaitForEvents. Undefined arguments are
# skipped, every other argument must be an OpenCL::Event object.
void
wait_for_events (...)
        CODE:
        /* collect every argument, starting at stack slot 0 */
        cl_uint event_count = items;
        cl_event *events = event_list (&ST (0), &event_count);
        NEED_SUCCESS (WaitForEvents, (event_count, events));
389
390 PROTOTYPES: DISABLE
391
392 MODULE = OpenCL PACKAGE = OpenCL::Platform
393
# Return the raw bytes clGetPlatformInfo reports for item name as one string (see the INFO macro).
394 void
395 info (OpenCL::Platform self, cl_platform_info name)
396 PPCODE:
397 INFO (Platform)
398
399 #BEGIN:platform
400
# String-valued platform attributes. Each alias passes its
# CL_PLATFORM_* selector in ix; the result is returned as a
# NUL-terminated string.
void
profile (OpenCL::Platform self)
        ALIAS:
        profile = CL_PLATFORM_PROFILE
        version = CL_PLATFORM_VERSION
        name = CL_PLATFORM_NAME
        vendor = CL_PLATFORM_VENDOR
        extensions = CL_PLATFORM_EXTENSIONS
        PPCODE:
        size_t bytes;
        char *text;

        NEED_SUCCESS (GetPlatformInfo, (self, ix, 0, 0, &bytes));
        text = tmpbuf (bytes);
        NEED_SUCCESS (GetPlatformInfo, (self, ix, bytes, text, 0));

        EXTEND (SP, 1);
        /* length 0 makes newSVpv use strlen */
        PUSHs (sv_2mortal (newSVpv (text, 0)));
417
418 #END:platform
419
# Return the devices of this platform that match type as a list of
# OpenCL::Device objects. Croaks when clGetDeviceIDs fails.
void
devices (OpenCL::Platform self, cl_device_type type = CL_DEVICE_TYPE_ALL)
        PPCODE:
        cl_uint count, n;
        cl_device_id *ids;

        NEED_SUCCESS (GetDeviceIDs, (self, type, 0, 0, &count));
        ids = tmpbuf (sizeof (*ids) * count);
        NEED_SUCCESS (GetDeviceIDs, (self, type, count, ids, 0));

        EXTEND (SP, count);
        for (n = 0; n < count; ++n)
          PUSHs (NEW_MORTAL_OBJ ("OpenCL::Device", ids [n]));
434
# Create a context for the devices in the array reference devices and
# return it as an OpenCL::Context object. Croaks when devices is not an
# array reference, when an element is not an OpenCL::Device object, or
# when clCreateContext fails. The notify argument is accepted but unused.
# NOTE(review): self is not referenced in the body, so the platform is not
# added to the properties here (unlike context_from_type) - confirm intended.
void
context (OpenCL::Platform self, cl_context_properties *properties = 0, SV *devices, FUTURE notify = 0)
        PPCODE:
        if (!SvROK (devices) || SvTYPE (SvRV (devices)) != SVt_PVAV)
          croak ("OpenCL::Platform::context argument 'device' must be an arrayref with device objects, in call");

        AV *av = (AV *)SvRV (devices);
        cl_uint num_devices = av_len (av) + 1;
        cl_device_id *device_list = tmpbuf (sizeof (cl_device_id) * num_devices);
        int i;

        for (i = num_devices; i--; )
          {
            /* av_fetch returns NULL for never-assigned slots; pass undef so SvPTROBJ croaks instead of crashing */
            SV **svp = av_fetch (av, i, 0);
            device_list [i] = SvPTROBJ ("clCreateContext", "devices", svp ? *svp : &PL_sv_undef, "OpenCL::Device");
          }

        NEED_SUCCESS_ARG (cl_context ctx, CreateContext, (properties, num_devices, device_list, 0, 0, &res));
        XPUSH_NEW_OBJ ("OpenCL::Context", ctx);
451
# Create a context from a device type on this platform. The pair
# (CL_CONTEXT_PLATFORM, self) is placed in front of the user supplied
# property list. The notify argument is accepted but unused.
void
context_from_type (OpenCL::Platform self, SV *properties = 0, cl_device_type type = CL_DEVICE_TYPE_DEFAULT, FUTURE notify = 0)
        PPCODE:
        cl_context ctx;
        cl_context_properties platform_pair[] = { CL_CONTEXT_PLATFORM, (cl_context_properties)self };
        cl_context_properties *props;

        props = SvCONTEXTPROPERTIES ("OpenCL::Platform::context_from_type", "properties", properties, platform_pair, 2);
        NEED_SUCCESS_ARG (ctx, CreateContextFromType, (props, type, 0, 0, &res));
        XPUSH_NEW_OBJ ("OpenCL::Context", ctx);
459
460 MODULE = OpenCL PACKAGE = OpenCL::Device
461
# Return the raw bytes clGetDeviceInfo reports for item name as one string (see the INFO macro).
462 void
463 info (OpenCL::Device self, cl_device_info name)
464 PPCODE:
465 INFO (Device)
466
467 #BEGIN:device
468
# Return CL_DEVICE_TYPE of the device as a signed integer.
void
type (OpenCL::Device self)
        PPCODE:
        cl_device_type dev_type;
        NEED_SUCCESS (GetDeviceInfo, (self, CL_DEVICE_TYPE, sizeof (dev_type), &dev_type, 0));
        EXTEND (SP, 1);
        PUSHs (sv_2mortal (newSViv (dev_type)));
477
# Device attributes read as cl_uint. Each alias passes its CL_DEVICE_*
# selector in ix; the value is returned as an unsigned integer.
void
vendor_id (OpenCL::Device self)
        ALIAS:
        vendor_id = CL_DEVICE_VENDOR_ID
        max_compute_units = CL_DEVICE_MAX_COMPUTE_UNITS
        max_work_item_dimensions = CL_DEVICE_MAX_WORK_ITEM_DIMENSIONS
        preferred_vector_width_char = CL_DEVICE_PREFERRED_VECTOR_WIDTH_CHAR
        preferred_vector_width_short = CL_DEVICE_PREFERRED_VECTOR_WIDTH_SHORT
        preferred_vector_width_int = CL_DEVICE_PREFERRED_VECTOR_WIDTH_INT
        preferred_vector_width_long = CL_DEVICE_PREFERRED_VECTOR_WIDTH_LONG
        preferred_vector_width_float = CL_DEVICE_PREFERRED_VECTOR_WIDTH_FLOAT
        preferred_vector_width_double = CL_DEVICE_PREFERRED_VECTOR_WIDTH_DOUBLE
        max_clock_frequency = CL_DEVICE_MAX_CLOCK_FREQUENCY
        max_read_image_args = CL_DEVICE_MAX_READ_IMAGE_ARGS
        max_write_image_args = CL_DEVICE_MAX_WRITE_IMAGE_ARGS
        image_support = CL_DEVICE_IMAGE_SUPPORT
        max_samplers = CL_DEVICE_MAX_SAMPLERS
        mem_base_addr_align = CL_DEVICE_MEM_BASE_ADDR_ALIGN
        min_data_type_align_size = CL_DEVICE_MIN_DATA_TYPE_ALIGN_SIZE
        global_mem_cacheline_size = CL_DEVICE_GLOBAL_MEM_CACHELINE_SIZE
        max_constant_args = CL_DEVICE_MAX_CONSTANT_ARGS
        preferred_vector_width_half = CL_DEVICE_PREFERRED_VECTOR_WIDTH_HALF
        native_vector_width_char = CL_DEVICE_NATIVE_VECTOR_WIDTH_CHAR
        native_vector_width_short = CL_DEVICE_NATIVE_VECTOR_WIDTH_SHORT
        native_vector_width_int = CL_DEVICE_NATIVE_VECTOR_WIDTH_INT
        native_vector_width_long = CL_DEVICE_NATIVE_VECTOR_WIDTH_LONG
        native_vector_width_float = CL_DEVICE_NATIVE_VECTOR_WIDTH_FLOAT
        native_vector_width_double = CL_DEVICE_NATIVE_VECTOR_WIDTH_DOUBLE
        native_vector_width_half = CL_DEVICE_NATIVE_VECTOR_WIDTH_HALF
        reference_count_ext = CL_DEVICE_REFERENCE_COUNT_EXT
        PPCODE:
        cl_uint result;
        NEED_SUCCESS (GetDeviceInfo, (self, ix, sizeof (result), &result, 0));
        EXTEND (SP, 1);
        PUSHs (sv_2mortal (newSVuv (result)));
514
# Device attributes read as size_t. Each alias passes its CL_DEVICE_*
# selector in ix; the value is returned as an unsigned integer.
void
max_work_group_size (OpenCL::Device self)
        ALIAS:
        max_work_group_size = CL_DEVICE_MAX_WORK_GROUP_SIZE
        image2d_max_width = CL_DEVICE_IMAGE2D_MAX_WIDTH
        image2d_max_height = CL_DEVICE_IMAGE2D_MAX_HEIGHT
        image3d_max_width = CL_DEVICE_IMAGE3D_MAX_WIDTH
        image3d_max_height = CL_DEVICE_IMAGE3D_MAX_HEIGHT
        image3d_max_depth = CL_DEVICE_IMAGE3D_MAX_DEPTH
        max_parameter_size = CL_DEVICE_MAX_PARAMETER_SIZE
        profiling_timer_resolution = CL_DEVICE_PROFILING_TIMER_RESOLUTION
        PPCODE:
        size_t result;
        NEED_SUCCESS (GetDeviceInfo, (self, ix, sizeof (result), &result, 0));
        EXTEND (SP, 1);
        PUSHs (sv_2mortal (newSVuv (result)));
532
# Return CL_DEVICE_MAX_WORK_ITEM_SIZES as a list of unsigned integers,
# one per size_t element reported by the device.
void
max_work_item_sizes (OpenCL::Device self)
        PPCODE:
        size_t bytes;
        size_t *sizes;
        int k, count;

        NEED_SUCCESS (GetDeviceInfo, (self, CL_DEVICE_MAX_WORK_ITEM_SIZES, 0, 0, &bytes));
        sizes = tmpbuf (bytes);
        NEED_SUCCESS (GetDeviceInfo, (self, CL_DEVICE_MAX_WORK_ITEM_SIZES, bytes, sizes, 0));

        count = bytes / sizeof (*sizes);
        EXTEND (SP, count);
        for (k = 0; k < count; ++k)
          PUSHs (sv_2mortal (newSVuv (sizes [k])));
544
# Return CL_DEVICE_ADDRESS_BITS as an unsigned integer.
# The OpenCL 1.0 tables list this item as cl_bitfield (64 bit), later
# versions as cl_uint (32 bit). The buffer is large enough for both and
# the number of bytes actually written decides how it is read, so no
# uninitialised bytes end up in the result.
void
address_bits (OpenCL::Device self)
        PPCODE:
        union { cl_uint u32; cl_bitfield u64; } raw;
        size_t written = 0;

        raw.u64 = 0;
        NEED_SUCCESS (GetDeviceInfo, (self, CL_DEVICE_ADDRESS_BITS, sizeof (raw), &raw, &written));

        EXTEND (SP, 1);
        PUSHs (sv_2mortal (newSVuv (written == sizeof (raw.u32) ? raw.u32 : raw.u64)));
553
# Device attributes read as cl_ulong. Each alias passes its CL_DEVICE_*
# selector in ix; the value is returned as an unsigned integer.
void
max_mem_alloc_size (OpenCL::Device self)
        ALIAS:
        max_mem_alloc_size = CL_DEVICE_MAX_MEM_ALLOC_SIZE
        global_mem_cache_size = CL_DEVICE_GLOBAL_MEM_CACHE_SIZE
        global_mem_size = CL_DEVICE_GLOBAL_MEM_SIZE
        max_constant_buffer_size = CL_DEVICE_MAX_CONSTANT_BUFFER_SIZE
        local_mem_size = CL_DEVICE_LOCAL_MEM_SIZE
        PPCODE:
        cl_ulong result;
        NEED_SUCCESS (GetDeviceInfo, (self, ix, sizeof (result), &result, 0));
        EXTEND (SP, 1);
        PUSHs (sv_2mortal (newSVuv (result)));
568
# Floating point capability attributes, read as cl_device_fp_config and
# returned as an unsigned integer. ix selects the CL_DEVICE_*_FP_CONFIG item.
void
single_fp_config (OpenCL::Device self)
        ALIAS:
        single_fp_config = CL_DEVICE_SINGLE_FP_CONFIG
        double_fp_config = CL_DEVICE_DOUBLE_FP_CONFIG
        half_fp_config = CL_DEVICE_HALF_FP_CONFIG
        PPCODE:
        cl_device_fp_config config;
        NEED_SUCCESS (GetDeviceInfo, (self, ix, sizeof (config), &config, 0));
        EXTEND (SP, 1);
        PUSHs (sv_2mortal (newSVuv (config)));
581
# Return CL_DEVICE_GLOBAL_MEM_CACHE_TYPE as an unsigned integer.
void
global_mem_cache_type (OpenCL::Device self)
        PPCODE:
        cl_device_mem_cache_type cache_type;
        NEED_SUCCESS (GetDeviceInfo, (self, CL_DEVICE_GLOBAL_MEM_CACHE_TYPE, sizeof (cache_type), &cache_type, 0));
        EXTEND (SP, 1);
        PUSHs (sv_2mortal (newSVuv (cache_type)));
590
# Return CL_DEVICE_LOCAL_MEM_TYPE as an unsigned integer.
void
local_mem_type (OpenCL::Device self)
        PPCODE:
        cl_device_local_mem_type mem_type;
        NEED_SUCCESS (GetDeviceInfo, (self, CL_DEVICE_LOCAL_MEM_TYPE, sizeof (mem_type), &mem_type, 0));
        EXTEND (SP, 1);
        PUSHs (sv_2mortal (newSVuv (mem_type)));
599
# Boolean device attributes, read as cl_bool and returned as perl's
# true/false values. ix selects the CL_DEVICE_* item.
void
error_correction_support (OpenCL::Device self)
        ALIAS:
        error_correction_support = CL_DEVICE_ERROR_CORRECTION_SUPPORT
        endian_little = CL_DEVICE_ENDIAN_LITTLE
        available = CL_DEVICE_AVAILABLE
        compiler_available = CL_DEVICE_COMPILER_AVAILABLE
        host_unified_memory = CL_DEVICE_HOST_UNIFIED_MEMORY
        PPCODE:
        cl_bool flag;
        NEED_SUCCESS (GetDeviceInfo, (self, ix, sizeof (flag), &flag, 0));
        EXTEND (SP, 1);
        PUSHs (sv_2mortal (flag ? &PL_sv_yes : &PL_sv_no));
614
# Return CL_DEVICE_EXECUTION_CAPABILITIES as an unsigned integer.
void
execution_capabilities (OpenCL::Device self)
        PPCODE:
        cl_device_exec_capabilities caps;
        NEED_SUCCESS (GetDeviceInfo, (self, CL_DEVICE_EXECUTION_CAPABILITIES, sizeof (caps), &caps, 0));
        EXTEND (SP, 1);
        PUSHs (sv_2mortal (newSVuv (caps)));
623
# Return CL_DEVICE_QUEUE_PROPERTIES as a signed integer.
void
properties (OpenCL::Device self)
        PPCODE:
        cl_command_queue_properties queue_props;
        NEED_SUCCESS (GetDeviceInfo, (self, CL_DEVICE_QUEUE_PROPERTIES, sizeof (queue_props), &queue_props, 0));
        EXTEND (SP, 1);
        PUSHs (sv_2mortal (newSViv (queue_props)));
632
# Return the platform of the device (CL_DEVICE_PLATFORM) as an
# OpenCL::Platform object.
void
platform (OpenCL::Device self)
        PPCODE:
        cl_platform_id owner;
        NEED_SUCCESS (GetDeviceInfo, (self, CL_DEVICE_PLATFORM, sizeof (owner), &owner, 0));
        EXTEND (SP, 1);
        PUSHs (NEW_MORTAL_OBJ ("OpenCL::Platform", owner));
643
# String-valued device attributes. Each alias passes its selector in ix;
# the result is returned as a NUL-terminated string.
void
name (OpenCL::Device self)
        ALIAS:
        name = CL_DEVICE_NAME
        vendor = CL_DEVICE_VENDOR
        driver_version = CL_DRIVER_VERSION
        profile = CL_DEVICE_PROFILE
        version = CL_DEVICE_VERSION
        extensions = CL_DEVICE_EXTENSIONS
        PPCODE:
        size_t bytes;
        char *text;

        NEED_SUCCESS (GetDeviceInfo, (self, ix, 0, 0, &bytes));
        text = tmpbuf (bytes);
        NEED_SUCCESS (GetDeviceInfo, (self, ix, bytes, text, 0));

        EXTEND (SP, 1);
        /* length 0 makes newSVpv use strlen */
        PUSHs (sv_2mortal (newSVpv (text, 0)));
661
# Return CL_DEVICE_PARENT_DEVICE_EXT as an OpenCL::Device object.
void
parent_device_ext (OpenCL::Device self)
        PPCODE:
        cl_device_id parent;
        NEED_SUCCESS (GetDeviceInfo, (self, CL_DEVICE_PARENT_DEVICE_EXT, sizeof (parent), &parent, 0));
        EXTEND (SP, 1);
        PUSHs (NEW_MORTAL_OBJ ("OpenCL::Device", parent));
672
# Device partition attributes (EXT), returned as a list of unsigned
# integers, one per cl_device_partition_property_ext element reported.
# ix selects the CL_DEVICE_*_EXT item.
void
partition_types_ext (OpenCL::Device self)
        ALIAS:
        partition_types_ext = CL_DEVICE_PARTITION_TYPES_EXT
        affinity_domains_ext = CL_DEVICE_AFFINITY_DOMAINS_EXT
        partition_style_ext = CL_DEVICE_PARTITION_STYLE_EXT
        PPCODE:
        size_t bytes;
        cl_device_partition_property_ext *props;
        int k, count;

        NEED_SUCCESS (GetDeviceInfo, (self, ix, 0, 0, &bytes));
        props = tmpbuf (bytes);
        NEED_SUCCESS (GetDeviceInfo, (self, ix, bytes, props, 0));

        count = bytes / sizeof (*props);
        EXTEND (SP, count);
        for (k = 0; k < count; ++k)
          PUSHs (sv_2mortal (newSVuv (props [k])));
688
689 #END:device
690
691 MODULE = OpenCL PACKAGE = OpenCL::Context
692
# Destructor: calls clReleaseContext on the wrapped context; the return status is ignored.
693 void
694 DESTROY (OpenCL::Context context)
695 CODE:
696 clReleaseContext (context);
697
# Return the raw bytes clGetContextInfo reports for item name as one string (see the INFO macro).
698 void
699 info (OpenCL::Context self, cl_context_info name)
700 PPCODE:
701 INFO (Context)
702
# Create a command queue for device in this context and return it as an
# OpenCL::Queue object. Croaks when clCreateCommandQueue fails.
void
queue (OpenCL::Context self, OpenCL::Device device, cl_command_queue_properties properties = 0)
        PPCODE:
        cl_command_queue queue;
        NEED_SUCCESS_ARG (queue, CreateCommandQueue, (self, device, properties, &res));
        XPUSH_NEW_OBJ ("OpenCL::Queue", queue);
708
# Create a user event in this context and return it as an
# OpenCL::UserEvent object. Croaks when clCreateUserEvent fails.
void
user_event (OpenCL::Context self)
        PPCODE:
        cl_event ev;
        NEED_SUCCESS_ARG (ev, CreateUserEvent, (self, &res));
        XPUSH_NEW_OBJ ("OpenCL::UserEvent", ev);
714
# Create a buffer of len bytes without host data and return it as an
# OpenCL::BufferObj object. Croaks when flags ask for a host pointer or
# when clCreateBuffer fails.
void
buffer (OpenCL::Context self, cl_mem_flags flags, size_t len)
        PPCODE:
        const cl_mem_flags host_ptr_flags = CL_MEM_USE_HOST_PTR | CL_MEM_COPY_HOST_PTR;
        cl_mem mem;

        if (flags & host_ptr_flags)
          croak ("OpenCL::Context::buffer: cannot use/copy host ptr when no data is given, use $context->buffer_sv instead?");

        NEED_SUCCESS_ARG (mem, CreateBuffer, (self, flags, len, 0, &res));
        XPUSH_NEW_OBJ ("OpenCL::BufferObj", mem);
723
# Create a buffer from the bytes of data and return it as an
# OpenCL::BufferObj object. flags must contain CL_MEM_USE_HOST_PTR or
# CL_MEM_COPY_HOST_PTR. An undefined data is passed on as a null host
# pointer with length 0 (previously the length was uninitialised).
void
buffer_sv (OpenCL::Context self, cl_mem_flags flags, SV *data)
        PPCODE:
        STRLEN len = 0; /* stays 0 when data is undef and SvPVbyte is not evaluated */
        char *ptr = SvOK (data) ? SvPVbyte (data, len) : 0;
        if (!(flags & (CL_MEM_USE_HOST_PTR | CL_MEM_COPY_HOST_PTR)))
          croak ("OpenCL::Context::buffer_sv: you have to specify use or copy host ptr when buffer data is given, use $context->buffer instead?");
        NEED_SUCCESS_ARG (cl_mem mem, CreateBuffer, (self, flags, len, ptr, &res));
        XPUSH_NEW_OBJ ("OpenCL::BufferObj", mem);
733
734 #if CL_VERSION_1_2
735
# Create an image via clCreateImage and return it blessed into the class
# matching type (OpenCL::Image when type is none of the known ones).
# For CL_MEM_OBJECT_IMAGE1D_BUFFER, data must be an OpenCL::Buffer object
# and is passed as the buffer member of the image descriptor; no host
# pointer is passed in that case. For all other types a defined data
# supplies the host pointer.
void
image (OpenCL::Context self, cl_mem_flags flags, cl_channel_order channel_order, cl_channel_type channel_type, cl_mem_object_type type, size_t width, size_t height, size_t depth, size_t array_size = 0, size_t row_pitch = 0, size_t slice_pitch = 0, cl_uint num_mip_level = 0, cl_uint num_samples = 0, SV *data = &PL_sv_undef)
        PPCODE:
        STRLEN len;
        char *ptr = 0;
        cl_mem buffer = 0;

        /* data is either a buffer object or host bytes, never both */
        if (type == CL_MEM_OBJECT_IMAGE1D_BUFFER)
          buffer = (cl_mem)SvPTROBJ ("OpenCL::Context::Image", "data", data, "OpenCL::Buffer");
        else if (SvOK (data))
          ptr = SvPVbyte (data, len);

        const cl_image_format format = { channel_order, channel_type };
        const cl_image_desc desc = {
          type,
          width, height, depth,
          array_size, row_pitch, slice_pitch,
          num_mip_level, num_samples,
          buffer
        };
        NEED_SUCCESS_ARG (cl_mem mem, CreateImage, (self, flags, &format, &desc, ptr, &res));
        char *klass = "OpenCL::Image";
        switch (type)
          {
            case CL_MEM_OBJECT_IMAGE1D_BUFFER: klass = "OpenCL::Image1DBuffer"; break;
            case CL_MEM_OBJECT_IMAGE1D:        klass = "OpenCL::Image1D";       break;
            case CL_MEM_OBJECT_IMAGE1D_ARRAY:  klass = "OpenCL::Image1DArray";  break;
            case CL_MEM_OBJECT_IMAGE2D:        klass = "OpenCL::Image2D";       break;
            case CL_MEM_OBJECT_IMAGE2D_ARRAY:  klass = "OpenCL::Image2DArray";  break;
            case CL_MEM_OBJECT_IMAGE3D:        klass = "OpenCL::Image3D";       break;
          }
        XPUSH_NEW_OBJ (klass, mem);
761
762 #endif
763
# Create a 2D image and return it as an OpenCL::Image2D object. A defined
# data supplies the host pointer. Uses clCreateImage when CL_VERSION_1_2
# is set, clCreateImage2D otherwise.
void
image2d (OpenCL::Context self, cl_mem_flags flags, cl_channel_order channel_order, cl_channel_type channel_type, size_t width, size_t height, size_t row_pitch = 0, SV *data = &PL_sv_undef)
        PPCODE:
        STRLEN len;
        char *ptr = 0;
        cl_mem mem;
        const cl_image_format format = { channel_order, channel_type };

        if (SvOK (data))
          ptr = SvPVbyte (data, len);

#if CL_VERSION_1_2
        const cl_image_desc desc = { CL_MEM_OBJECT_IMAGE2D, width, height, 0, 0, row_pitch, 0, 0, 0, 0 };
        NEED_SUCCESS_ARG (mem, CreateImage, (self, flags, &format, &desc, ptr, &res));
#else
        NEED_SUCCESS_ARG (mem, CreateImage2D, (self, flags, &format, width, height, row_pitch, ptr, &res));
#endif
        XPUSH_NEW_OBJ ("OpenCL::Image2D", mem);
777
# Create a 3D image and return it as an OpenCL::Image3D object. A defined
# data supplies the host pointer. Uses clCreateImage when CL_VERSION_1_2
# is set, clCreateImage3D otherwise.
void
image3d (OpenCL::Context self, cl_mem_flags flags, cl_channel_order channel_order, cl_channel_type channel_type, size_t width, size_t height, size_t depth, size_t row_pitch = 0, size_t slice_pitch = 0, SV *data = &PL_sv_undef)
        PPCODE:
        STRLEN len;
        char *ptr = 0;
        cl_mem mem;
        const cl_image_format format = { channel_order, channel_type };

        if (SvOK (data))
          ptr = SvPVbyte (data, len);

#if CL_VERSION_1_2
        const cl_image_desc desc = { CL_MEM_OBJECT_IMAGE3D, width, height, depth, 0, row_pitch, slice_pitch, 0, 0, 0 };
        NEED_SUCCESS_ARG (mem, CreateImage, (self, flags, &format, &desc, ptr, &res));
#else
        NEED_SUCCESS_ARG (mem, CreateImage3D, (self, flags, &format, width, height, depth, row_pitch, slice_pitch, ptr, &res));
#endif
        XPUSH_NEW_OBJ ("OpenCL::Image3D", mem);
791
792 #if cl_apple_gl_sharing || cl_khr_gl_sharing
793
# Wrap the OpenGL buffer object bufobj via clCreateFromGLBuffer and
# return it as an OpenCL::BufferObj object.
void
gl_buffer (OpenCL::Context self, cl_mem_flags flags, cl_GLuint bufobj)
        PPCODE:
        cl_mem mem;
        NEED_SUCCESS_ARG (mem, CreateFromGLBuffer, (self, flags, bufobj, &res));
        XPUSH_NEW_OBJ ("OpenCL::BufferObj", mem);
799
# Wrap an OpenGL renderbuffer via clCreateFromGLRenderbuffer and return
# it as an OpenCL::Image2D object.
void
gl_renderbuffer (OpenCL::Context self, cl_mem_flags flags, cl_GLuint renderbuffer)
        PPCODE:
        cl_mem mem;
        NEED_SUCCESS_ARG (mem, CreateFromGLRenderbuffer, (self, flags, renderbuffer, &res));
        XPUSH_NEW_OBJ ("OpenCL::Image2D", mem);
805
806 #if CL_VERSION_1_2
807
# Wrap an OpenGL texture via clCreateFromGLTexture. The result is blessed
# into the image class matching the GL object type reported by
# clGetGLObjectInfo (OpenCL::Memory when the type is not a known one).
# gl_texture2d and gl_texture3d are aliases of the same code.
# When the type query fails, the freshly created memory object is
# released before croaking so that it does not leak.
void
gl_texture (OpenCL::Context self, cl_mem_flags flags, cl_GLenum target, cl_GLint miplevel, cl_GLuint texture)
        ALIAS:
        gl_texture2d = 0
        gl_texture3d = 0
        PPCODE:
        NEED_SUCCESS_ARG (cl_mem mem, CreateFromGLTexture, (self, flags, target, miplevel, texture, &res));
        cl_gl_object_type type;
        res = clGetGLObjectInfo (mem, &type, 0); // TODO: use target instead?
        if (res)
          {
            clReleaseMemObject (mem);
            FAIL (GetGLObjectInfo);
          }
        char *klass = "OpenCL::Memory";
        switch (type)
          {
            case CL_GL_OBJECT_TEXTURE_BUFFER:  klass = "OpenCL::Image1DBuffer"; break;
            case CL_GL_OBJECT_TEXTURE1D:       klass = "OpenCL::Image1D";       break;
            case CL_GL_OBJECT_TEXTURE1D_ARRAY: klass = "OpenCL::Image1DArray";  break;
            case CL_GL_OBJECT_TEXTURE2D:       klass = "OpenCL::Image2D";       break;
            case CL_GL_OBJECT_TEXTURE2D_ARRAY: klass = "OpenCL::Image2DArray";  break;
            case CL_GL_OBJECT_TEXTURE3D:       klass = "OpenCL::Image3D";       break;
          }
        XPUSH_NEW_OBJ (klass, mem);
828
829 #else
830
# Wrap a 2D OpenGL texture via clCreateFromGLTexture2D and return it as
# an OpenCL::Image2D object.
void
gl_texture2d (OpenCL::Context self, cl_mem_flags flags, cl_GLenum target, cl_GLint miplevel, cl_GLuint texture)
        PPCODE:
        cl_mem mem;
        NEED_SUCCESS_ARG (mem, CreateFromGLTexture2D, (self, flags, target, miplevel, texture, &res));
        XPUSH_NEW_OBJ ("OpenCL::Image2D", mem);
836
# Wrap a 3D OpenGL texture via clCreateFromGLTexture3D and return it as
# an OpenCL::Image3D object.
void
gl_texture3d (OpenCL::Context self, cl_mem_flags flags, cl_GLenum target, cl_GLint miplevel, cl_GLuint texture)
        PPCODE:
        cl_mem mem;
        NEED_SUCCESS_ARG (mem, CreateFromGLTexture3D, (self, flags, target, miplevel, texture, &res));
        XPUSH_NEW_OBJ ("OpenCL::Image3D", mem);
842
843 #endif
844
845 #endif
846
# Return the image formats supported for flags/image_type as a list of
# array references [channel_order, channel_data_type].
# The format list lives in tmpbuf scratch memory (as in the other list
# queries of this file) instead of a Newx allocation that was never freed.
void
supported_image_formats (OpenCL::Context self, cl_mem_flags flags, cl_mem_object_type image_type)
        PPCODE:
{
        cl_uint count, i;
        cl_image_format *list = 0;

        NEED_SUCCESS (GetSupportedImageFormats, (self, flags, image_type, 0, 0, &count));

        /* nothing to fetch (and nothing to push) when no format is supported */
        if (count)
          {
            list = tmpbuf (sizeof (*list) * count);
            NEED_SUCCESS (GetSupportedImageFormats, (self, flags, image_type, count, list, 0));
          }

        EXTEND (SP, count);
        for (i = 0; i < count; ++i)
          {
            AV *av = newAV ();
            /* storing index 1 first sizes the array for both elements at once */
            av_store (av, 1, newSVuv (list [i].image_channel_data_type));
            av_store (av, 0, newSVuv (list [i].image_channel_order));
            PUSHs (sv_2mortal (newRV_noinc ((SV *)av)));
          }
}
868
# Create a sampler via clCreateSampler and return it as an
# OpenCL::Sampler object.
void
sampler (OpenCL::Context self, cl_bool normalized_coords, cl_addressing_mode addressing_mode, cl_filter_mode filter_mode)
        PPCODE:
        cl_sampler sampler;
        NEED_SUCCESS_ARG (sampler, CreateSampler, (self, normalized_coords, addressing_mode, filter_mode, &res));
        XPUSH_NEW_OBJ ("OpenCL::Sampler", sampler);
874
# Create a program from the source text in program (taken as bytes) via
# clCreateProgramWithSource and return it as an OpenCL::Program object.
void
program_with_source (OpenCL::Context self, SV *program)
        PPCODE:
        STRLEN srclen;
        const char *src = SvPVbyte (program, srclen);
        /* the API wants a size_t length, which need not be the same type as STRLEN */
        size_t length = srclen;
        cl_program prog;

        NEED_SUCCESS_ARG (prog, CreateProgramWithSource, (self, 1, &src, &length, &res));
        XPUSH_NEW_OBJ ("OpenCL::Program", prog);
885
886 #BEGIN:context
887
# Context attributes read as cl_uint and returned as an unsigned
# integer. ix selects the CL_CONTEXT_* item.
void
reference_count (OpenCL::Context self)
        ALIAS:
        reference_count = CL_CONTEXT_REFERENCE_COUNT
        num_devices = CL_CONTEXT_NUM_DEVICES
        PPCODE:
        cl_uint result;
        NEED_SUCCESS (GetContextInfo, (self, ix, sizeof (result), &result, 0));
        EXTEND (SP, 1);
        PUSHs (sv_2mortal (newSVuv (result)));
899
# Return the devices of the context (CL_CONTEXT_DEVICES) as a list of
# OpenCL::Device objects.
void
devices (OpenCL::Context self)
        PPCODE:
        size_t bytes;
        cl_device_id *ids;
        int k, count;

        NEED_SUCCESS (GetContextInfo, (self, CL_CONTEXT_DEVICES, 0, 0, &bytes));
        ids = tmpbuf (bytes);
        NEED_SUCCESS (GetContextInfo, (self, CL_CONTEXT_DEVICES, bytes, ids, 0));

        count = bytes / sizeof (*ids);
        EXTEND (SP, count);
        for (k = 0; k < count; ++k)
          PUSHs (NEW_MORTAL_OBJ ("OpenCL::Device", ids [k]));
913
# Return CL_CONTEXT_PROPERTIES as a flat list of unsigned integers, one
# per cl_context_properties element reported by the implementation.
void
properties (OpenCL::Context self)
        PPCODE:
        size_t bytes;
        cl_context_properties *props;
        int k, count;

        NEED_SUCCESS (GetContextInfo, (self, CL_CONTEXT_PROPERTIES, 0, 0, &bytes));
        props = tmpbuf (bytes);
        NEED_SUCCESS (GetContextInfo, (self, CL_CONTEXT_PROPERTIES, bytes, props, 0));

        count = bytes / sizeof (*props);
        EXTEND (SP, count);
        for (k = 0; k < count; ++k)
          PUSHs (sv_2mortal (newSVuv ((UV)props [k])));
925
926 #END:context
927
928 MODULE = OpenCL PACKAGE = OpenCL::Queue
929
# Destructor: calls clReleaseCommandQueue on the wrapped queue; the return status is ignored.
930 void
931 DESTROY (OpenCL::Queue self)
932 CODE:
933 clReleaseCommandQueue (self);
934
# Enqueue a read of len bytes at offset from mem into data, which is
# turned into a string of exactly len bytes first. Arguments after data
# are events to wait for (undef entries are skipped). Unless called in
# void context, the resulting event is returned as an OpenCL::Event.
void
enqueue_read_buffer (OpenCL::Queue self, OpenCL::Buffer mem, cl_bool blocking, size_t offset, size_t len, SV *data, ...)
        PPCODE:
        cl_event ev = 0;
        /* only ask for an event when the caller will receive it */
        cl_event *ev_out = GIMME_V != G_VOID ? &ev : 0;
        EVENT_LIST (6, items - 6);

        SvUPGRADE (data, SVt_PV);
        SvGROW (data, len);
        SvPOK_only (data);
        SvCUR_set (data, len);

        NEED_SUCCESS (EnqueueReadBuffer, (self, mem, blocking, offset, len, SvPVX (data), event_list_count, event_list_ptr, ev_out));

        if (ev)
          XPUSH_NEW_OBJ ("OpenCL::Event", ev);
949
# Enqueue a write of the bytes of data to mem at offset. Arguments after
# data are events to wait for (undef entries are skipped). Unless called
# in void context, the resulting event is returned as an OpenCL::Event.
void
enqueue_write_buffer (OpenCL::Queue self, OpenCL::Buffer mem, cl_bool blocking, size_t offset, SV *data, ...)
        PPCODE:
        cl_event ev = 0;
        /* only ask for an event when the caller will receive it */
        cl_event *ev_out = GIMME_V != G_VOID ? &ev : 0;
        STRLEN bytes;
        char *src = SvPVbyte (data, bytes);
        EVENT_LIST (5, items - 5);

        NEED_SUCCESS (EnqueueWriteBuffer, (self, mem, blocking, offset, bytes, src, event_list_count, event_list_ptr, ev_out));

        if (ev)
          XPUSH_NEW_OBJ ("OpenCL::Event", ev);
962
# Enqueue a copy of len bytes from src at src_offset to dst at
# dst_offset. Arguments after len are events to wait for (undef entries
# are skipped). Unless called in void context, the resulting event is
# returned as an OpenCL::Event.
void
enqueue_copy_buffer (OpenCL::Queue self, OpenCL::Buffer src, OpenCL::Buffer dst, size_t src_offset, size_t dst_offset, size_t len, ...)
        PPCODE:
        cl_event ev = 0;
        /* only ask for an event when the caller will receive it */
        cl_event *ev_out = GIMME_V != G_VOID ? &ev : 0;
        EVENT_LIST (6, items - 6);

        NEED_SUCCESS (EnqueueCopyBuffer, (self, src, dst, src_offset, dst_offset, len, event_list_count, event_list_ptr, ev_out));

        if (ev)
          XPUSH_NEW_OBJ ("OpenCL::Event", ev);
973
# Enqueue a rectangular read from buf into data.
# A row pitch of 0 defaults to width, a slice pitch of 0 to height times
# the row pitch. data is turned into a string that extends exactly to
# the last byte the transfer can touch in host memory:
#   host_z * slice_pitch + host_y * row_pitch + host_x
#   + (depth - 1) * slice_pitch + (height - 1) * row_pitch + width
# (0 when any region dimension is 0). The previous length, row pitch *
# slice pitch * depth, multiplied the two pitches and ignored the host origin.
# Arguments after data are events to wait for. Unless called in void
# context, the resulting event is returned as an OpenCL::Event.
void
enqueue_read_buffer_rect (OpenCL::Queue self, OpenCL::Memory buf, cl_bool blocking, size_t buf_x, size_t buf_y, size_t buf_z, size_t host_x, size_t host_y, size_t host_z, size_t width, size_t height, size_t depth, size_t buf_row_pitch, size_t buf_slice_pitch, size_t host_row_pitch, size_t host_slice_pitch, SV *data, ...)
        PPCODE:
        cl_event ev = 0;
        const size_t buf_origin [3] = { buf_x , buf_y , buf_z  };
        const size_t host_origin[3] = { host_x, host_y, host_z };
        const size_t region[3] = { width, height, depth };
        EVENT_LIST (17, items - 17);

        if (!buf_row_pitch)
          buf_row_pitch = region [0];

        if (!buf_slice_pitch)
          buf_slice_pitch = region [1] * buf_row_pitch;

        if (!host_row_pitch)
          host_row_pitch = region [0];

        if (!host_slice_pitch)
          host_slice_pitch = region [1] * host_row_pitch;

        size_t len = 0;

        /* offset of the region start plus the extent of the region itself */
        if (region [0] && region [1] && region [2])
          len = host_origin [2] * host_slice_pitch
              + host_origin [1] * host_row_pitch
              + host_origin [0]
              + (region [2] - 1) * host_slice_pitch
              + (region [1] - 1) * host_row_pitch
              + region [0];

        SvUPGRADE (data, SVt_PV);
        SvGROW (data, len);
        SvPOK_only (data);
        SvCUR_set (data, len);
        NEED_SUCCESS (EnqueueReadBufferRect, (self, buf, blocking, buf_origin, host_origin, region, buf_row_pitch, buf_slice_pitch, host_row_pitch, host_slice_pitch, SvPVX (data), event_list_count, event_list_ptr, GIMME_V != G_VOID ? &ev : 0));

        if (ev)
          XPUSH_NEW_OBJ ("OpenCL::Event", ev);
1005
void
enqueue_write_buffer_rect (OpenCL::Queue self, OpenCL::Memory buf, cl_bool blocking, size_t buf_x, size_t buf_y, size_t buf_z, size_t host_x, size_t host_y, size_t host_z, size_t width, size_t height, size_t depth, size_t buf_row_pitch, size_t buf_slice_pitch, size_t host_row_pitch, size_t host_slice_pitch, SV *data, ...)
        PPCODE:
        /* Enqueues a rectangular write from the byte string in data into buf.
         * A pitch of 0 is replaced by the tightly packed value (row pitch =
         * width, slice pitch = height * row pitch). Croaks when data is too
         * short for the requested region. Arguments after data are handed to
         * EVENT_LIST; an OpenCL::Event is pushed only when not called in void
         * context.
         */
        cl_event ev = 0;
        const size_t buf_origin [3] = { buf_x , buf_y , buf_z  };
        const size_t host_origin[3] = { host_x, host_y, host_z };
        const size_t region[3] = { width, height, depth };
        STRLEN len;
        char *ptr = SvPVbyte (data, len);
        EVENT_LIST (17, items - 17);

        if (!buf_row_pitch)
          buf_row_pitch = region [0];

        if (!buf_slice_pitch)
          buf_slice_pitch = region [1] * buf_row_pitch;

        if (!host_row_pitch)
          host_row_pitch = region [0];

        if (!host_slice_pitch)
          host_slice_pitch = region [1] * host_row_pitch;

        /* One past the last host byte read: the host offset plus the extent
         * of the region (last slice, last row, one full row of width bytes).
         * The previous row_pitch * slice_pitch * depth rejected perfectly
         * valid data. An empty region is left for OpenCL itself to reject.
         */
        size_t min_len = 0;

        if (width && height && depth)
          min_len = host_x + host_y * host_row_pitch + host_z * host_slice_pitch
                  + (depth - 1) * host_slice_pitch + (height - 1) * host_row_pitch + width;

        if (len < min_len)
          croak ("clEnqueueWriteBufferRect: data string is shorter than what would be transferred");

        NEED_SUCCESS (EnqueueWriteBufferRect, (self, buf, blocking, buf_origin, host_origin, region, buf_row_pitch, buf_slice_pitch, host_row_pitch, host_slice_pitch, ptr, event_list_count, event_list_ptr, GIMME_V != G_VOID ? &ev : 0));

        if (ev)
          XPUSH_NEW_OBJ ("OpenCL::Event", ev);
1038
void
enqueue_copy_buffer_rect (OpenCL::Queue self, OpenCL::Buffer src, OpenCL::Buffer dst, size_t src_x, size_t src_y, size_t src_z, size_t dst_x, size_t dst_y, size_t dst_z, size_t width, size_t height, size_t depth, size_t src_row_pitch, size_t src_slice_pitch, size_t dst_row_pitch, size_t dst_slice_pitch, ...)
        PPCODE:
        /* Enqueues a rectangular buffer-to-buffer copy. Origins, extent and
         * pitches are passed to OpenCL unchanged. Arguments after
         * dst_slice_pitch are handed to EVENT_LIST; an OpenCL::Event is
         * pushed only when not called in void context.
         */
        cl_event done = 0;
        const size_t from  [3] = { src_x, src_y, src_z };
        const size_t to    [3] = { dst_x, dst_y, dst_z };
        const size_t extent[3] = { width, height, depth };
        EVENT_LIST (16, items - 16);
        cl_event *want_ev = GIMME_V == G_VOID ? 0 : &done;

        NEED_SUCCESS (EnqueueCopyBufferRect, (self, src, dst, from, to, extent, src_row_pitch, src_slice_pitch, dst_row_pitch, dst_slice_pitch, event_list_count, event_list_ptr, want_ev));

        if (done)
          XPUSH_NEW_OBJ ("OpenCL::Event", done);
1052
void
enqueue_read_image (OpenCL::Queue self, OpenCL::Image src, cl_bool blocking, size_t src_x, size_t src_y, size_t src_z, size_t width, size_t height, size_t depth, size_t row_pitch, size_t slice_pitch, SV *data, ...)
        PPCODE:
        /* Enqueues a read of an image region into the string buffer of data.
         * A row_pitch of 0 is replaced by img_row_pitch (src); a slice_pitch
         * of 0 is replaced by row_pitch * height when depth > 1. Arguments
         * after data are handed to EVENT_LIST; an OpenCL::Event is pushed
         * only when not called in void context.
         */
        cl_event done = 0;
        const size_t from  [3] = { src_x, src_y, src_z };
        const size_t extent[3] = { width, height, depth };
        EVENT_LIST (12, items - 12);
        cl_event *want_ev = GIMME_V == G_VOID ? 0 : &done;

        if (!row_pitch)
          row_pitch = img_row_pitch (src);

        if (!slice_pitch && depth > 1)
          slice_pitch = row_pitch * height;

        /* whole slices when a slice pitch is in effect, otherwise whole rows */
        size_t nbytes;

        if (slice_pitch)
          nbytes = slice_pitch * depth;
        else
          nbytes = row_pitch * height;

        SvUPGRADE (data, SVt_PV);
        SvGROW (data, nbytes);
        SvPOK_only (data);
        SvCUR_set (data, nbytes);

        NEED_SUCCESS (EnqueueReadImage, (self, src, blocking, from, extent, row_pitch, slice_pitch, SvPVX (data), event_list_count, event_list_ptr, want_ev));

        if (done)
          XPUSH_NEW_OBJ ("OpenCL::Event", done);
1077
void
enqueue_write_image (OpenCL::Queue self, OpenCL::Image dst, cl_bool blocking, size_t dst_x, size_t dst_y, size_t dst_z, size_t width, size_t height, size_t depth, size_t row_pitch, size_t slice_pitch, SV *data, ...)
        PPCODE:
        /* Enqueues a write of the byte string in data into an image region.
         * A row_pitch of 0 is replaced by img_row_pitch (dst); a slice_pitch
         * of 0 is replaced by row_pitch * height when depth > 1. Croaks when
         * data is shorter than the computed transfer size. Arguments after
         * data are handed to EVENT_LIST; an OpenCL::Event is pushed only when
         * not called in void context.
         */
        cl_event done = 0;
        const size_t to    [3] = { dst_x, dst_y, dst_z };
        const size_t extent[3] = { width, height, depth };
        STRLEN have;
        char *bytes = SvPVbyte (data, have);
        EVENT_LIST (12, items - 12);
        cl_event *want_ev = GIMME_V == G_VOID ? 0 : &done;

        if (!row_pitch)
          row_pitch = img_row_pitch (dst);

        if (!slice_pitch && depth > 1)
          slice_pitch = row_pitch * height;

        /* whole slices when a slice pitch is in effect, otherwise whole rows */
        size_t need;

        if (slice_pitch)
          need = slice_pitch * depth;
        else
          need = row_pitch * height;

        if (have < need)
          croak ("clEnqueueWriteImage: data string is shorter than what would be transferred");

        NEED_SUCCESS (EnqueueWriteImage, (self, dst, blocking, to, extent, row_pitch, slice_pitch, bytes, event_list_count, event_list_ptr, want_ev));

        if (done)
          XPUSH_NEW_OBJ ("OpenCL::Event", done);
1103
void
enqueue_copy_image (OpenCL::Queue self, OpenCL::Image src, OpenCL::Image dst, size_t src_x, size_t src_y, size_t src_z, size_t dst_x, size_t dst_y, size_t dst_z, size_t width, size_t height, size_t depth, ...)
        PPCODE:
        /* Enqueues an image-to-image copy of the given region. Arguments
         * after depth are handed to EVENT_LIST; an OpenCL::Event is pushed
         * only when not called in void context.
         */
        cl_event done = 0;
        const size_t from  [3] = { src_x, src_y, src_z };
        const size_t to    [3] = { dst_x, dst_y, dst_z };
        const size_t extent[3] = { width, height, depth };
        EVENT_LIST (12, items - 12);
        cl_event *want_ev = GIMME_V == G_VOID ? 0 : &done;

        NEED_SUCCESS (EnqueueCopyImage, (self, src, dst, from, to, extent, event_list_count, event_list_ptr, want_ev));

        if (done)
          XPUSH_NEW_OBJ ("OpenCL::Event", done);
1117
void
enqueue_copy_image_to_buffer (OpenCL::Queue self, OpenCL::Image src, OpenCL::Buffer dst, size_t src_x, size_t src_y, size_t src_z, size_t width, size_t height, size_t depth, size_t dst_offset, ...)
        PPCODE:
        /* Enqueues a copy of an image region into dst at dst_offset.
         * Arguments after dst_offset are handed to EVENT_LIST; an
         * OpenCL::Event is pushed only when not called in void context.
         */
        cl_event done = 0;
        const size_t from  [3] = { src_x, src_y, src_z };
        const size_t extent[3] = { width, height, depth };
        EVENT_LIST (10, items - 10);
        cl_event *want_ev = GIMME_V == G_VOID ? 0 : &done;

        NEED_SUCCESS (EnqueueCopyImageToBuffer, (self, src, dst, from, extent, dst_offset, event_list_count, event_list_ptr, want_ev));

        if (done)
          XPUSH_NEW_OBJ ("OpenCL::Event", done);
1130
void
enqueue_copy_buffer_to_image (OpenCL::Queue self, OpenCL::Buffer src, OpenCL::Image dst, size_t src_offset, size_t dst_x, size_t dst_y, size_t dst_z, size_t width, size_t height, size_t depth, ...)
        PPCODE:
        /* Enqueues a copy from src (starting at src_offset) into an image
         * region of dst. Arguments after depth are handed to EVENT_LIST; an
         * OpenCL::Event is pushed only when not called in void context.
         */
        cl_event done = 0;
        const size_t to    [3] = { dst_x, dst_y, dst_z };
        const size_t extent[3] = { width, height, depth };
        EVENT_LIST (10, items - 10);
        cl_event *want_ev = GIMME_V == G_VOID ? 0 : &done;

        NEED_SUCCESS (EnqueueCopyBufferToImage, (self, src, dst, src_offset, to, extent, event_list_count, event_list_ptr, want_ev));

        if (done)
          XPUSH_NEW_OBJ ("OpenCL::Event", done);
1143
void
enqueue_task (OpenCL::Queue self, OpenCL::Kernel kernel, ...)
        PPCODE:
        /* Enqueues kernel via clEnqueueTask. Arguments after kernel are
         * handed to EVENT_LIST; an OpenCL::Event is pushed only when not
         * called in void context.
         */
        cl_event done = 0;
        EVENT_LIST (2, items - 2);
        cl_event *want_ev = GIMME_V == G_VOID ? 0 : &done;

        NEED_SUCCESS (EnqueueTask, (self, kernel, event_list_count, event_list_ptr, want_ev));

        if (done)
          XPUSH_NEW_OBJ ("OpenCL::Event", done);
1154
void
enqueue_nd_range_kernel (OpenCL::Queue self, OpenCL::Kernel kernel, SV *global_work_offset, SV *global_work_size, SV *local_work_size = &PL_sv_undef, ...)
        PPCODE:
        /* Enqueues kernel over an N-dimensional range, N being the number of
         * elements of the global_work_size array reference.
         * global_work_offset and local_work_size may each be undef or an
         * array reference with exactly N elements. Arguments after
         * local_work_size are handed to EVENT_LIST; an OpenCL::Event is
         * pushed only when not called in void context.
         */
        cl_event ev = 0;
        size_t *gwo = 0, *gws, *lws = 0;
        int gws_len;
        size_t *lists;
        int i;
        /* local_work_size is optional, so items can be 4: clamp the count
         * instead of passing items - 5 == -1 */
        EVENT_LIST (5, (items > 5 ? items - 5 : 0));

        if (!SvROK (global_work_size) || SvTYPE (SvRV (global_work_size)) != SVt_PVAV)
          croak ("clEnqueueNDRangeKernel: global_work_size must be an array reference");

        gws_len = AvFILLp (SvRV (global_work_size)) + 1;

        /* one allocation holding three consecutive vectors of gws_len entries: gws, gwo, lws */
        lists = tmpbuf (sizeof (size_t) * 3 * gws_len);

        gws = lists + gws_len * 0;
        for (i = 0; i < gws_len; ++i)
          gws [i] = SvIV (AvARRAY (SvRV (global_work_size))[i]);

        if (SvOK (global_work_offset))
          {
            if (!SvROK (global_work_offset) || SvTYPE (SvRV (global_work_offset)) != SVt_PVAV)
              croak ("clEnqueueNDRangeKernel: global_work_offset must be undef or an array reference");

            /* compare the OFFSET array's length: the old code compared
             * global_work_size with itself, so a shorter offset array was
             * read past its end below */
            if (AvFILLp (SvRV (global_work_offset)) + 1 != gws_len)
              croak ("clEnqueueNDRangeKernel: global_work_offset must be undef or an array of same size as global_work_size");

            gwo = lists + gws_len * 1;
            for (i = 0; i < gws_len; ++i)
              gwo [i] = SvIV (AvARRAY (SvRV (global_work_offset))[i]);
          }

        if (SvOK (local_work_size))
          {
            if (!SvROK (local_work_size) || SvTYPE (SvRV (local_work_size)) != SVt_PVAV)
              croak ("clEnqueueNDRangeKernel: local_work_size must be undef or an array reference");

            if (AvFILLp (SvRV (local_work_size)) + 1 != gws_len)
              croak ("clEnqueueNDRangeKernel: local_work_size must be undef or an array of same size as global_work_size");

            lws = lists + gws_len * 2;
            for (i = 0; i < gws_len; ++i)
              lws [i] = SvIV (AvARRAY (SvRV (local_work_size))[i]);
          }

        NEED_SUCCESS (EnqueueNDRangeKernel, (self, kernel, gws_len, gwo, gws, lws, event_list_count, event_list_ptr, GIMME_V != G_VOID ? &ev : 0));

        if (ev)
          XPUSH_NEW_OBJ ("OpenCL::Event", ev);
1206
1207 #if cl_apple_gl_sharing || cl_khr_gl_sharing
1208
void
enqueue_acquire_gl_objects (OpenCL::Queue self, SV *objects, ...)
        ALIAS:
        enqueue_release_gl_objects = 1
        PPCODE:
        /* Enqueues an acquire (ix == 0) or release (ix == 1) of the memory
         * objects listed in the array reference objects. Arguments after
         * objects are handed to EVENT_LIST; an OpenCL::Event is pushed only
         * when not called in void context.
         */
        if (!SvROK (objects) || SvTYPE (SvRV (objects)) != SVt_PVAV)
          croak ("OpenCL::Queue::enqueue_acquire/release_gl_objects argument 'objects' must be an arrayref with memory objects, in call");

        cl_event ev = 0;
        EVENT_LIST (2, items - 2);
        AV *av = (AV *)SvRV (objects);
        cl_uint num_objects = av_len (av) + 1;
        cl_mem *object_list = tmpbuf (sizeof (cl_mem) * num_objects);
        int i;

        for (i = num_objects; i--; )
          {
            /* av_fetch returns a null pointer for holes in the array, so it
             * must not be dereferenced blindly */
            SV **svp = av_fetch (av, i, 0);

            if (!svp)
              croak ("OpenCL::Queue::enqueue_acquire/release_gl_objects: element %d of argument 'objects' does not exist", i);

            object_list [i] = SvPTROBJ ("OpenCL::Queue::enqueue_acquire/release_gl_objects", "objects", *svp, "OpenCL::Memory");
          }

        if (ix)
          NEED_SUCCESS (EnqueueReleaseGLObjects, (self, num_objects, object_list, event_list_count, event_list_ptr, GIMME_V != G_VOID ? &ev : 0));
        else
          NEED_SUCCESS (EnqueueAcquireGLObjects, (self, num_objects, object_list, event_list_count, event_list_ptr, GIMME_V != G_VOID ? &ev : 0));

        if (ev)
          XPUSH_NEW_OBJ ("OpenCL::Event", ev);
1234
1235 #endif
1236
1237 #if !CL_VERSION_1_2 || defined CL_USE_DEPRECATED_OPENCL_1_1_APIS
1238
1239 void
1240 enqueue_wait_for_events (OpenCL::Queue self, ...)
1241 CODE:
/* Arguments after self are handed to EVENT_LIST, and the resulting list is passed to clEnqueueWaitForEvents. Returns nothing. */
1242 EVENT_LIST (1, items - 1);
1243 NEED_SUCCESS (EnqueueWaitForEvents, (self, event_list_count, event_list_ptr));
1244
1245 #endif
1246
void
enqueue_marker (OpenCL::Queue self, ...)
        PPCODE:
        /* Enqueues a marker. With CL_VERSION_1_2 the arguments after self
         * are used as a wait list; otherwise a non-empty wait list croaks.
         * An OpenCL::Event is pushed only when not called in void context.
         */
        cl_event done = 0;
        EVENT_LIST (1, items - 1);
        cl_event *want_ev = GIMME_V == G_VOID ? 0 : &done;
#if CL_VERSION_1_2
        NEED_SUCCESS (EnqueueMarkerWithWaitList, (self, event_list_count, event_list_ptr, want_ev));
#else
        if (event_list_count)
          croak ("OpenCL::Queue->enqueue_marker does not support a wait list in OpenCL 1.1 - upgrade to 1.2");
        NEED_SUCCESS (EnqueueMarker, (self, want_ev));
#endif
        if (done)
          XPUSH_NEW_OBJ ("OpenCL::Event", done);
1261
void
enqueue_barrier (OpenCL::Queue self, ...)
        PPCODE:
        /* Enqueues a barrier. With CL_VERSION_1_2 the arguments after self
         * are used as a wait list and an OpenCL::Event is pushed unless
         * called in void context; otherwise both a wait list and a non-void
         * context croak.
         */
        cl_event ev = 0;
        EVENT_LIST (1, items - 1);
#if CL_VERSION_1_2
        /* request an event only when the caller wants one, like the other enqueue_* methods */
        NEED_SUCCESS (EnqueueBarrierWithWaitList, (self, event_list_count, event_list_ptr, GIMME_V != G_VOID ? &ev : 0));
#else
        if (event_list_count)
          croak ("OpenCL::Queue->enqueue_barrier does not support a wait list in OpenCL 1.1 - upgrade to 1.2");
        if (GIMME_V != G_VOID)
          croak ("OpenCL::Queue->enqueue_barrier does not return an event object in OpenCL 1.1 - upgrade to 1.2");
        NEED_SUCCESS (EnqueueBarrier, (self));
#endif
        if (ev)
          XPUSH_NEW_OBJ ("OpenCL::Event", ev);
1278
1279 void
1280 flush (OpenCL::Queue self)
1281 CODE:
/* Invokes the Flush call on the queue through NEED_SUCCESS (presumably croaks on a non-success status; macro defined outside this chunk). */
1282 NEED_SUCCESS (Flush, (self));
1283
1284 void
1285 finish (OpenCL::Queue self)
1286 CODE:
/* Invokes the Finish call on the queue through NEED_SUCCESS (presumably croaks on a non-success status; macro defined outside this chunk). */
1287 NEED_SUCCESS (Finish, (self));
1288
1289 void
1290 info (OpenCL::Queue self, cl_command_queue_info name)
1291 PPCODE:
/* The whole body comes from the INFO macro instantiated for CommandQueue; the macro is defined outside this chunk. NOTE(review): presumably it queries the property selected by name and pushes the raw result - confirm against the macro. */
1292 INFO (CommandQueue)
1293
1294 #BEGIN:command_queue
1295
void
context (OpenCL::Queue self)
        PPCODE:
        /* Pushes the queue's CL_QUEUE_CONTEXT as an OpenCL::Context object,
         * retaining the context first. */
        cl_context ctx;
        NEED_SUCCESS (GetCommandQueueInfo, (self, CL_QUEUE_CONTEXT, sizeof (ctx), &ctx, 0));
        EXTEND (SP, 1);
        NEED_SUCCESS (RetainContext, (ctx));
        PUSHs (NEW_MORTAL_OBJ ("OpenCL::Context", ctx));
1307
void
device (OpenCL::Queue self)
        PPCODE:
        /* Pushes the queue's CL_QUEUE_DEVICE as an OpenCL::Device object (no retain call is made). */
        cl_device_id dev;
        NEED_SUCCESS (GetCommandQueueInfo, (self, CL_QUEUE_DEVICE, sizeof (dev), &dev, 0));
        EXTEND (SP, 1);
        PUSHs (NEW_MORTAL_OBJ ("OpenCL::Device", dev));
1318
void
reference_count (OpenCL::Queue self)
        PPCODE:
        /* Pushes the queue's CL_QUEUE_REFERENCE_COUNT as an unsigned integer. */
        cl_uint refs;
        NEED_SUCCESS (GetCommandQueueInfo, (self, CL_QUEUE_REFERENCE_COUNT, sizeof (refs), &refs, 0));
        EXTEND (SP, 1);
        PUSHs (sv_2mortal (newSVuv (refs)));
1327
void
properties (OpenCL::Queue self)
        PPCODE:
        /* Pushes the queue's CL_QUEUE_PROPERTIES value as a signed integer. */
        cl_command_queue_properties props;
        NEED_SUCCESS (GetCommandQueueInfo, (self, CL_QUEUE_PROPERTIES, sizeof (props), &props, 0));
        EXTEND (SP, 1);
        PUSHs (sv_2mortal (newSViv (props)));
1336
1337 #END:command_queue
1338
1339 MODULE = OpenCL PACKAGE = OpenCL::Memory
1340
1341 void
1342 DESTROY (OpenCL::Memory self)
1343 CODE:
/* Drops the reference on the wrapped memory object; the status returned by clReleaseMemObject is ignored. */
1344 clReleaseMemObject (self);
1345
1346 void
1347 info (OpenCL::Memory self, cl_mem_info name)
1348 PPCODE:
/* The whole body comes from the INFO macro instantiated for MemObject; the macro is defined outside this chunk. NOTE(review): presumably it queries the property selected by name and pushes the raw result - confirm against the macro. */
1349 INFO (MemObject)
1350
1351 #BEGIN:mem
1352
void
type (OpenCL::Memory self)
        PPCODE:
        /* Pushes the object's CL_MEM_TYPE as a signed integer. */
        cl_mem_object_type kind;
        NEED_SUCCESS (GetMemObjectInfo, (self, CL_MEM_TYPE, sizeof (kind), &kind, 0));
        EXTEND (SP, 1);
        PUSHs (sv_2mortal (newSViv (kind)));
1361
void
flags (OpenCL::Memory self)
        PPCODE:
        /* Pushes the object's CL_MEM_FLAGS value as a signed integer. */
        cl_mem_flags bits;
        NEED_SUCCESS (GetMemObjectInfo, (self, CL_MEM_FLAGS, sizeof (bits), &bits, 0));
        EXTEND (SP, 1);
        PUSHs (sv_2mortal (newSViv (bits)));
1370
void
size (OpenCL::Memory self)
        ALIAS:
        size = CL_MEM_SIZE
        offset = CL_MEM_OFFSET
        PPCODE:
        /* ix is the clGetMemObjectInfo selector chosen by the alias; the
         * size_t result is pushed as an unsigned integer. */
        size_t amount;
        NEED_SUCCESS (GetMemObjectInfo, (self, ix, sizeof (amount), &amount, 0));
        EXTEND (SP, 1);
        PUSHs (sv_2mortal (newSVuv (amount)));
1382
void
host_ptr (OpenCL::Memory self)
        PPCODE:
        /* Pushes the object's CL_MEM_HOST_PTR pointer converted to an integer. */
        void *host;
        NEED_SUCCESS (GetMemObjectInfo, (self, CL_MEM_HOST_PTR, sizeof (host), &host, 0));
        EXTEND (SP, 1);
        PUSHs (sv_2mortal (newSVuv ((IV)(intptr_t)host)));
1391
void
map_count (OpenCL::Memory self)
        ALIAS:
        map_count = CL_MEM_MAP_COUNT
        reference_count = CL_MEM_REFERENCE_COUNT
        PPCODE:
        /* ix is the clGetMemObjectInfo selector chosen by the alias; the
         * cl_uint result is pushed as an unsigned integer. */
        cl_uint count;
        NEED_SUCCESS (GetMemObjectInfo, (self, ix, sizeof (count), &count, 0));
        EXTEND (SP, 1);
        PUSHs (sv_2mortal (newSVuv (count)));
1403
void
context (OpenCL::Memory self)
        PPCODE:
        /* Pushes the object's CL_MEM_CONTEXT as an OpenCL::Context object,
         * retaining the context first. */
        cl_context ctx;
        NEED_SUCCESS (GetMemObjectInfo, (self, CL_MEM_CONTEXT, sizeof (ctx), &ctx, 0));
        EXTEND (SP, 1);
        NEED_SUCCESS (RetainContext, (ctx));
        PUSHs (NEW_MORTAL_OBJ ("OpenCL::Context", ctx));
1415
void
associated_memobject (OpenCL::Memory self)
        PPCODE:
        /* Pushes the object's CL_MEM_ASSOCIATED_MEMOBJECT as an
         * OpenCL::Memory object (retained first), or undef when OpenCL
         * reports no associated object.
         */
        cl_mem value [1];
        NEED_SUCCESS (GetMemObjectInfo, (self, CL_MEM_ASSOCIATED_MEMOBJECT, sizeof (value), value, 0));
        EXTEND (SP, 1);
        const int i = 0;
        /* a null handle must not be handed to clRetainMemObject: that call
         * fails and made this accessor croak for ordinary objects */
        if (value [i])
          {
            NEED_SUCCESS (RetainMemObject, (value [i]));
            PUSHs (NEW_MORTAL_OBJ ("OpenCL::Memory", value [i]));
          }
        else
          PUSHs (&PL_sv_undef);
1427
1428 #END:mem
1429
1430 #if cl_apple_gl_sharing || cl_khr_gl_sharing
1431
void
gl_object_info (OpenCL::Memory self)
        PPCODE:
        /* Pushes two unsigned integers: the GL object type and the GL object
         * name reported by clGetGLObjectInfo, in that order. */
        cl_gl_object_type gl_type;
        cl_GLuint gl_name;

        NEED_SUCCESS (GetGLObjectInfo, (self, &gl_type, &gl_name));

        EXTEND (SP, 2);
        PUSHs (sv_2mortal (newSVuv (gl_type)));
        PUSHs (sv_2mortal (newSVuv (gl_name)));
1441
1442 #endif
1443
1444 MODULE = OpenCL PACKAGE = OpenCL::BufferObj
1445
void
sub_buffer_region (OpenCL::BufferObj self, cl_mem_flags flags, size_t origin, size_t size)
        PPCODE:
        /* Creates a sub-buffer of self covering size bytes from origin and
         * pushes it as an OpenCL::Buffer. Croaks when flags contains any of
         * the host-pointer flags.
         */
        const cl_mem_flags host_ptr_flags = CL_MEM_USE_HOST_PTR | CL_MEM_COPY_HOST_PTR | CL_MEM_ALLOC_HOST_PTR;

        if (flags & host_ptr_flags)
          croak ("clCreateSubBuffer: cannot use/copy/alloc host ptr, doesn't make sense, check your flags!");

        cl_buffer_region area = { origin, size };

        NEED_SUCCESS_ARG (cl_mem sub, CreateSubBuffer, (self, flags, CL_BUFFER_CREATE_TYPE_REGION, &area, &res));
        XPUSH_NEW_OBJ ("OpenCL::Buffer", sub);
1456
1457 MODULE = OpenCL PACKAGE = OpenCL::Image
1458
1459 void
1460 image_info (OpenCL::Image self, cl_image_info name)
1461 PPCODE:
/* The whole body comes from the INFO macro instantiated for Image; the macro is defined outside this chunk. NOTE(review): presumably it queries the property selected by name and pushes the raw result - confirm against the macro. */
1462 INFO (Image)
1463
1464 #BEGIN:image
1465
void
element_size (OpenCL::Image self)
        ALIAS:
        element_size = CL_IMAGE_ELEMENT_SIZE
        row_pitch = CL_IMAGE_ROW_PITCH
        slice_pitch = CL_IMAGE_SLICE_PITCH
        width = CL_IMAGE_WIDTH
        height = CL_IMAGE_HEIGHT
        depth = CL_IMAGE_DEPTH
        PPCODE:
        /* ix is the clGetImageInfo selector chosen by the alias; the size_t
         * result is pushed as an unsigned integer. */
        size_t amount;
        NEED_SUCCESS (GetImageInfo, (self, ix, sizeof (amount), &amount, 0));
        EXTEND (SP, 1);
        PUSHs (sv_2mortal (newSVuv (amount)));
1481
1482 #END:image
1483
1484 #if cl_apple_gl_sharing || cl_khr_gl_sharing
1485
1486 #BEGIN:gl_texture
1487
void
target (OpenCL::Image self)
        PPCODE:
        /* Pushes the image's CL_GL_TEXTURE_TARGET as an unsigned integer. */
        cl_GLenum gl_target;
        NEED_SUCCESS (GetGLTextureInfo, (self, CL_GL_TEXTURE_TARGET, sizeof (gl_target), &gl_target, 0));
        EXTEND (SP, 1);
        PUSHs (sv_2mortal (newSVuv (gl_target)));
1496
void
gl_mipmap_level (OpenCL::Image self)
        PPCODE:
        /* Pushes the image's CL_GL_MIPMAP_LEVEL as a signed integer. */
        cl_GLint level;
        NEED_SUCCESS (GetGLTextureInfo, (self, CL_GL_MIPMAP_LEVEL, sizeof (level), &level, 0));
        EXTEND (SP, 1);
        PUSHs (sv_2mortal (newSViv (level)));
1505
1506 #END:gl_texture
1507
1508 #endif
1509
1510 MODULE = OpenCL PACKAGE = OpenCL::Sampler
1511
1512 void
1513 DESTROY (OpenCL::Sampler self)
1514 CODE:
/* Drops the reference on the wrapped sampler; the status returned by clReleaseSampler is ignored. */
1515 clReleaseSampler (self);
1516
1517 void
1518 info (OpenCL::Sampler self, cl_sampler_info name)
1519 PPCODE:
/* The whole body comes from the INFO macro instantiated for Sampler; the macro is defined outside this chunk. NOTE(review): presumably it queries the property selected by name and pushes the raw result - confirm against the macro. */
1520 INFO (Sampler)
1521
1522 #BEGIN:sampler
1523
void
reference_count (OpenCL::Sampler self)
        PPCODE:
        /* Pushes the sampler's CL_SAMPLER_REFERENCE_COUNT as an unsigned integer. */
        cl_uint refs;
        NEED_SUCCESS (GetSamplerInfo, (self, CL_SAMPLER_REFERENCE_COUNT, sizeof (refs), &refs, 0));
        EXTEND (SP, 1);
        PUSHs (sv_2mortal (newSVuv (refs)));
1532
void
context (OpenCL::Sampler self)
        PPCODE:
        /* Pushes the sampler's CL_SAMPLER_CONTEXT as an OpenCL::Context
         * object, retaining the context first. */
        cl_context ctx;
        NEED_SUCCESS (GetSamplerInfo, (self, CL_SAMPLER_CONTEXT, sizeof (ctx), &ctx, 0));
        EXTEND (SP, 1);
        NEED_SUCCESS (RetainContext, (ctx));
        PUSHs (NEW_MORTAL_OBJ ("OpenCL::Context", ctx));
1544
void
normalized_coords (OpenCL::Sampler self)
        PPCODE:
        /* Pushes the sampler's CL_SAMPLER_NORMALIZED_COORDS as a Perl
         * boolean. The property is a cl_bool; it was previously declared as
         * cl_addressing_mode and pushed as a plain integer.
         */
        cl_bool value [1];
        NEED_SUCCESS (GetSamplerInfo, (self, CL_SAMPLER_NORMALIZED_COORDS, sizeof (value), value, 0));
        EXTEND (SP, 1);
        const int i = 0;
        /* PL_sv_yes and PL_sv_no are immortal and need no mortalizing */
        PUSHs (value [i] ? &PL_sv_yes : &PL_sv_no);
1553
void
addressing_mode (OpenCL::Sampler self)
        PPCODE:
        /* Pushes the sampler's CL_SAMPLER_ADDRESSING_MODE as an integer.
         * The value is now declared with its own type, cl_addressing_mode,
         * instead of cl_filter_mode.
         */
        cl_addressing_mode value [1];
        NEED_SUCCESS (GetSamplerInfo, (self, CL_SAMPLER_ADDRESSING_MODE, sizeof (value), value, 0));
        EXTEND (SP, 1);
        const int i = 0;
        PUSHs (sv_2mortal (newSViv (value [i])));
1562
void
filter_mode (OpenCL::Sampler self)
        PPCODE:
        /* Pushes the sampler's CL_SAMPLER_FILTER_MODE as an integer. The
         * property is a cl_filter_mode enumeration; treating it as cl_bool
         * collapsed the value into a boolean and lost the actual mode.
         */
        cl_filter_mode value [1];
        NEED_SUCCESS (GetSamplerInfo, (self, CL_SAMPLER_FILTER_MODE, sizeof (value), value, 0));
        EXTEND (SP, 1);
        const int i = 0;
        PUSHs (sv_2mortal (newSViv (value [i])));
1571
1572 #END:sampler
1573
1574 MODULE = OpenCL PACKAGE = OpenCL::Program
1575
1576 void
1577 DESTROY (OpenCL::Program self)
1578 CODE:
/* Drops the reference on the wrapped program; the status returned by clReleaseProgram is ignored. */
1579 clReleaseProgram (self);
1580
void
build (OpenCL::Program self, OpenCL::Device device, SV *options = &PL_sv_undef)
        CODE:
        /* Builds the program for the single given device, without a
         * completion callback. options is passed as a byte string; an
         * undefined (or omitted) options value is passed as a null pointer
         * rather than being stringified, which avoids an "uninitialized
         * value" warning on the default argument.
         */
        const char *build_opts = SvOK (options) ? SvPVbyte_nolen (options) : 0;

        NEED_SUCCESS (BuildProgram, (self, 1, &device, build_opts, 0, 0));
1585
void
build_info (OpenCL::Program self, OpenCL::Device device, cl_program_build_info name)
        PPCODE:
        /* Pushes the raw bytes of the build-info item name for device as one
         * string: the first query obtains the size, the second fills a
         * mortal SV of that length.
         */
        size_t nbytes;
        NEED_SUCCESS (GetProgramBuildInfo, (self, device, name, 0, 0, &nbytes));

        SV *raw = sv_2mortal (newSV (nbytes));
        SvUPGRADE (raw, SVt_PV);
        SvPOK_only (raw);
        SvCUR_set (raw, nbytes);

        NEED_SUCCESS (GetProgramBuildInfo, (self, device, name, nbytes, SvPVX (raw), 0));
        XPUSHs (raw);
1597
1598 #BEGIN:program_build
1599
void
build_status (OpenCL::Program self, OpenCL::Device device)
        PPCODE:
        /* Pushes CL_PROGRAM_BUILD_STATUS for device as a signed integer. */
        cl_build_status status;
        NEED_SUCCESS (GetProgramBuildInfo, (self, device, CL_PROGRAM_BUILD_STATUS, sizeof (status), &status, 0));
        EXTEND (SP, 1);
        PUSHs (sv_2mortal (newSViv (status)));
1608
void
build_options (OpenCL::Program self, OpenCL::Device device)
        ALIAS:
        build_options = CL_PROGRAM_BUILD_OPTIONS
        build_log = CL_PROGRAM_BUILD_LOG
        PPCODE:
        /* ix is the clGetProgramBuildInfo selector chosen by the alias. The
         * text is fetched into a tmpbuf buffer and pushed as a string whose
         * length is found by scanning for the terminating NUL.
         */
        size_t nbytes;
        NEED_SUCCESS (GetProgramBuildInfo, (self, device, ix, 0, 0, &nbytes));

        char *text = tmpbuf (nbytes);
        NEED_SUCCESS (GetProgramBuildInfo, (self, device, ix, nbytes, text, 0));

        EXTEND (SP, 1);
        PUSHs (sv_2mortal (newSVpv (text, 0)));
1622
1623 #END:program_build
1624
void
kernel (OpenCL::Program program, SV *function)
        PPCODE:
        /* Creates the kernel named by the byte string function and pushes it
         * as an OpenCL::Kernel object. */
        const char *entry = SvPVbyte_nolen (function);

        NEED_SUCCESS_ARG (cl_kernel created, CreateKernel, (program, entry, &res));
        XPUSH_NEW_OBJ ("OpenCL::Kernel", created);
1630
1631 void
1632 info (OpenCL::Program self, cl_program_info name)
1633 PPCODE:
/* The whole body comes from the INFO macro instantiated for Program; the macro is defined outside this chunk. NOTE(review): presumably it queries the property selected by name and pushes the raw result - confirm against the macro. */
1634 INFO (Program)
1635
void
binaries (OpenCL::Program self)
        PPCODE:
        /* Pushes one string per program device, each sized from
         * CL_PROGRAM_BINARY_SIZES and filled by the CL_PROGRAM_BINARIES
         * query. Returns an empty list when there are no devices or when a
         * query reports an unexpected result size.
         */
        cl_uint ndev, k;
        size_t got;

        NEED_SUCCESS (GetProgramInfo, (self, CL_PROGRAM_NUM_DEVICES, sizeof (ndev), &ndev, 0));
        if (!ndev) XSRETURN_EMPTY;

        size_t *bin_len = tmpbuf (sizeof (*bin_len) * ndev);
        NEED_SUCCESS (GetProgramInfo, (self, CL_PROGRAM_BINARY_SIZES, sizeof (*bin_len) * ndev, bin_len, &got));
        if (got != sizeof (*bin_len) * ndev) XSRETURN_EMPTY;

        unsigned char **bin_ptr = tmpbuf (sizeof (*bin_ptr) * ndev);

        /* create the result strings first, so that OpenCL writes straight into them */
        EXTEND (SP, ndev);
        for (k = 0; k < ndev; ++k)
          {
            SV *bin = sv_2mortal (newSV (bin_len [k]));

            SvUPGRADE (bin, SVt_PV);
            SvPOK_only (bin);
            SvCUR_set (bin, bin_len [k]);

            bin_ptr [k] = (void *)SvPVX (bin);
            PUSHs (bin);
          }

        NEED_SUCCESS (GetProgramInfo, (self, CL_PROGRAM_BINARIES, sizeof (*bin_ptr) * ndev, bin_ptr, &got));
        if (got != sizeof (*bin_ptr) * ndev) XSRETURN_EMPTY;
1663
1664 #BEGIN:program
1665
void
reference_count (OpenCL::Program self)
        ALIAS:
        reference_count = CL_PROGRAM_REFERENCE_COUNT
        num_devices = CL_PROGRAM_NUM_DEVICES
        PPCODE:
        /* ix is the clGetProgramInfo selector chosen by the alias; the
         * cl_uint result is pushed as an unsigned integer. */
        cl_uint count;
        NEED_SUCCESS (GetProgramInfo, (self, ix, sizeof (count), &count, 0));
        EXTEND (SP, 1);
        PUSHs (sv_2mortal (newSVuv (count)));
1677
void
context (OpenCL::Program self)
        PPCODE:
        /* Pushes the program's CL_PROGRAM_CONTEXT as an OpenCL::Context
         * object, retaining the context first. */
        cl_context ctx;
        NEED_SUCCESS (GetProgramInfo, (self, CL_PROGRAM_CONTEXT, sizeof (ctx), &ctx, 0));
        EXTEND (SP, 1);
        NEED_SUCCESS (RetainContext, (ctx));
        PUSHs (NEW_MORTAL_OBJ ("OpenCL::Context", ctx));
1689
void
devices (OpenCL::Program self)
        PPCODE:
        /* Pushes one OpenCL::Device object per entry of CL_PROGRAM_DEVICES;
         * the entry count is derived from the byte size reported by the
         * first query.
         */
        size_t nbytes;
        NEED_SUCCESS (GetProgramInfo, (self, CL_PROGRAM_DEVICES, 0, 0, &nbytes));

        cl_device_id *devs = tmpbuf (nbytes);
        NEED_SUCCESS (GetProgramInfo, (self, CL_PROGRAM_DEVICES, nbytes, devs, 0));

        int k, count = nbytes / sizeof (*devs);

        EXTEND (SP, count);
        for (k = 0; k < count; ++k)
          PUSHs (NEW_MORTAL_OBJ ("OpenCL::Device", devs [k]));
1703
void
source (OpenCL::Program self)
        PPCODE:
        /* Fetches CL_PROGRAM_SOURCE into a tmpbuf buffer and pushes it as a
         * string whose length is found by scanning for the terminating NUL. */
        size_t nbytes;
        NEED_SUCCESS (GetProgramInfo, (self, CL_PROGRAM_SOURCE, 0, 0, &nbytes));

        char *text = tmpbuf (nbytes);
        NEED_SUCCESS (GetProgramInfo, (self, CL_PROGRAM_SOURCE, nbytes, text, 0));

        EXTEND (SP, 1);
        PUSHs (sv_2mortal (newSVpv (text, 0)));
1714
void
binary_sizes (OpenCL::Program self)
        PPCODE:
        /* Pushes every entry of CL_PROGRAM_BINARY_SIZES as an unsigned
         * integer; the entry count is derived from the byte size reported by
         * the first query.
         */
        size_t nbytes;
        NEED_SUCCESS (GetProgramInfo, (self, CL_PROGRAM_BINARY_SIZES, 0, 0, &nbytes));

        size_t *lens = tmpbuf (nbytes);
        NEED_SUCCESS (GetProgramInfo, (self, CL_PROGRAM_BINARY_SIZES, nbytes, lens, 0));

        int k, count = nbytes / sizeof (*lens);

        EXTEND (SP, count);
        for (k = 0; k < count; ++k)
          PUSHs (sv_2mortal (newSVuv (lens [k])));
1726
1727 #END:program
1728
1729 MODULE = OpenCL PACKAGE = OpenCL::Kernel
1730
1731 void
1732 DESTROY (OpenCL::Kernel self)
1733 CODE:
/* Drops the reference on the wrapped kernel; the status returned by clReleaseKernel is ignored. */
1734 clReleaseKernel (self);
1735
1736 void
1737 set_char (OpenCL::Kernel self, cl_uint idx, cl_char value)
1738 CODE:
/* Sets kernel argument idx to value, passed as sizeof (cl_char) bytes; the status returned by clSetKernelArg is not checked. */
1739 clSetKernelArg (self, idx, sizeof (value), &value);
1740
1741 void
1742 set_uchar (OpenCL::Kernel self, cl_uint idx, cl_uchar value)
1743 CODE:
/* Sets kernel argument idx to value, passed as sizeof (cl_uchar) bytes; the status returned by clSetKernelArg is not checked. */
1744 clSetKernelArg (self, idx, sizeof (value), &value);
1745
1746 void
1747 set_short (OpenCL::Kernel self, cl_uint idx, cl_short value)
1748 CODE:
/* Sets kernel argument idx to value, passed as sizeof (cl_short) bytes; the status returned by clSetKernelArg is not checked. */
1749 clSetKernelArg (self, idx, sizeof (value), &value);
1750
1751 void
1752 set_ushort (OpenCL::Kernel self, cl_uint idx, cl_ushort value)
1753 CODE:
/* Sets kernel argument idx to value, passed as sizeof (cl_ushort) bytes; the status returned by clSetKernelArg is not checked. */
1754 clSetKernelArg (self, idx, sizeof (value), &value);
1755
1756 void
1757 set_int (OpenCL::Kernel self, cl_uint idx, cl_int value)
1758 CODE:
/* Sets kernel argument idx to value, passed as sizeof (cl_int) bytes; the status returned by clSetKernelArg is not checked. */
1759 clSetKernelArg (self, idx, sizeof (value), &value);
1760
1761 void
1762 set_uint (OpenCL::Kernel self, cl_uint idx, cl_uint value)
1763 CODE:
/* Sets kernel argument idx to value, passed as sizeof (cl_uint) bytes; the status returned by clSetKernelArg is not checked. */
1764 clSetKernelArg (self, idx, sizeof (value), &value);
1765
1766 void
1767 set_long (OpenCL::Kernel self, cl_uint idx, cl_long value)
1768 CODE:
/* Sets kernel argument idx to value, passed as sizeof (cl_long) bytes; the status returned by clSetKernelArg is not checked. */
1769 clSetKernelArg (self, idx, sizeof (value), &value);
1770
1771 void
1772 set_ulong (OpenCL::Kernel self, cl_uint idx, cl_ulong value)
1773 CODE:
/* Sets kernel argument idx to value, passed as sizeof (cl_ulong) bytes; the status returned by clSetKernelArg is not checked. */
1774 clSetKernelArg (self, idx, sizeof (value), &value);
1775
1776 void
1777 set_half (OpenCL::Kernel self, cl_uint idx, cl_half value)
1778 CODE:
/* Sets kernel argument idx to value, passed as sizeof (cl_half) bytes; the status returned by clSetKernelArg is not checked. */
1779 clSetKernelArg (self, idx, sizeof (value), &value);
1780
1781 void
1782 set_float (OpenCL::Kernel self, cl_uint idx, cl_float value)
1783 CODE:
/* Sets kernel argument idx to value, passed as sizeof (cl_float) bytes; the status returned by clSetKernelArg is not checked. */
1784 clSetKernelArg (self, idx, sizeof (value), &value);
1785
1786 void
1787 set_double (OpenCL::Kernel self, cl_uint idx, cl_double value)
1788 CODE:
/* Sets kernel argument idx to value, passed as sizeof (cl_double) bytes; the status returned by clSetKernelArg is not checked. */
1789 clSetKernelArg (self, idx, sizeof (value), &value);
1790
1791 void
1792 set_memory (OpenCL::Kernel self, cl_uint idx, OpenCL::Memory_ornull value)
1793 CODE:
/* Sets kernel argument idx to the cl_mem handle in value (the _ornull type suggests undef is accepted - confirm in the typemap); the status returned by clSetKernelArg is not checked. */
1794 clSetKernelArg (self, idx, sizeof (value), &value);
1795
1796 void
1797 set_buffer (OpenCL::Kernel self, cl_uint idx, OpenCL::Buffer_ornull value)
1798 CODE:
/* Sets kernel argument idx to the cl_mem handle in value (the _ornull type suggests undef is accepted - confirm in the typemap); the status returned by clSetKernelArg is not checked. */
1799 clSetKernelArg (self, idx, sizeof (value), &value);
1800
1801 void
1802 set_image2d (OpenCL::Kernel self, cl_uint idx, OpenCL::Image2D_ornull value)
1803 CODE:
/* Sets kernel argument idx to the cl_mem handle in value (the _ornull type suggests undef is accepted - confirm in the typemap); the status returned by clSetKernelArg is not checked. */
1804 clSetKernelArg (self, idx, sizeof (value), &value);
1805
1806 void
1807 set_image3d (OpenCL::Kernel self, cl_uint idx, OpenCL::Image3D_ornull value)
1808 CODE:
/* Sets kernel argument idx to the cl_mem handle in value (the _ornull type suggests undef is accepted - confirm in the typemap); the status returned by clSetKernelArg is not checked. */
1809 clSetKernelArg (self, idx, sizeof (value), &value);
1810
1811 void
1812 set_sampler (OpenCL::Kernel self, cl_uint idx, OpenCL::Sampler value)
1813 CODE:
/* Sets kernel argument idx to the cl_sampler handle in value; the status returned by clSetKernelArg is not checked. */
1814 clSetKernelArg (self, idx, sizeof (value), &value);
1815
1816 void
1817 set_local (OpenCL::Kernel self, cl_uint idx, size_t size)
1818 CODE:
/* Passes size as the argument size together with a null value pointer for kernel argument idx; the status returned by clSetKernelArg is not checked. */
1819 clSetKernelArg (self, idx, size, 0);
1820
1821 void
1822 set_event (OpenCL::Kernel self, cl_uint idx, OpenCL::Event value)
1823 CODE:
/* Sets kernel argument idx to the cl_event handle in value; the status returned by clSetKernelArg is not checked. */
1824 clSetKernelArg (self, idx, sizeof (value), &value);
1825
1826 void
1827 info (OpenCL::Kernel self, cl_kernel_info name)
1828 PPCODE:
/* The whole body comes from the INFO macro instantiated for Kernel; the macro is defined outside this chunk. NOTE(review): presumably it queries the property selected by name and pushes the raw result - confirm against the macro. */
1829 INFO (Kernel)
1830
1831 #BEGIN:kernel
1832
void
function_name (OpenCL::Kernel self)
        PPCODE:
        /* Fetches CL_KERNEL_FUNCTION_NAME into a tmpbuf buffer and pushes it
         * as a string whose length is found by scanning for the terminating
         * NUL. */
        size_t nbytes;
        NEED_SUCCESS (GetKernelInfo, (self, CL_KERNEL_FUNCTION_NAME, 0, 0, &nbytes));

        char *text = tmpbuf (nbytes);
        NEED_SUCCESS (GetKernelInfo, (self, CL_KERNEL_FUNCTION_NAME, nbytes, text, 0));

        EXTEND (SP, 1);
        PUSHs (sv_2mortal (newSVpv (text, 0)));
1843
void
num_args (OpenCL::Kernel self)
        ALIAS:
        num_args = CL_KERNEL_NUM_ARGS
        reference_count = CL_KERNEL_REFERENCE_COUNT
        PPCODE:
        /* ix is the clGetKernelInfo selector chosen by the alias; the
         * cl_uint result is pushed as an unsigned integer. */
        cl_uint count;
        NEED_SUCCESS (GetKernelInfo, (self, ix, sizeof (count), &count, 0));
        EXTEND (SP, 1);
        PUSHs (sv_2mortal (newSVuv (count)));
1855
void
context (OpenCL::Kernel self)
        PPCODE:
        /* Pushes the kernel's CL_KERNEL_CONTEXT as an OpenCL::Context
         * object, retaining the context first. */
        cl_context ctx;
        NEED_SUCCESS (GetKernelInfo, (self, CL_KERNEL_CONTEXT, sizeof (ctx), &ctx, 0));
        EXTEND (SP, 1);
        NEED_SUCCESS (RetainContext, (ctx));
        PUSHs (NEW_MORTAL_OBJ ("OpenCL::Context", ctx));
1867
void
program (OpenCL::Kernel self)
        PPCODE:
        /* Pushes the kernel's CL_KERNEL_PROGRAM as an OpenCL::Program
         * object, retaining the program first. */
        cl_program prog;
        NEED_SUCCESS (GetKernelInfo, (self, CL_KERNEL_PROGRAM, sizeof (prog), &prog, 0));
        EXTEND (SP, 1);
        NEED_SUCCESS (RetainProgram, (prog));
        PUSHs (NEW_MORTAL_OBJ ("OpenCL::Program", prog));
1879
1880 #END:kernel
1881
void
work_group_info (OpenCL::Kernel self, OpenCL::Device device, cl_kernel_work_group_info name)
        PPCODE:
        /* Pushes the raw bytes of the work-group info item name for device
         * as one string: the first query obtains the size, the second fills
         * a mortal SV of that length.
         */
        size_t nbytes;
        NEED_SUCCESS (GetKernelWorkGroupInfo, (self, device, name, 0, 0, &nbytes));

        SV *raw = sv_2mortal (newSV (nbytes));
        SvUPGRADE (raw, SVt_PV);
        SvPOK_only (raw);
        SvCUR_set (raw, nbytes);

        NEED_SUCCESS (GetKernelWorkGroupInfo, (self, device, name, nbytes, SvPVX (raw), 0));
        XPUSHs (raw);
1893
1894 #BEGIN:kernel_work_group
1895
void
work_group_size (OpenCL::Kernel self, OpenCL::Device device)
        ALIAS:
        work_group_size = CL_KERNEL_WORK_GROUP_SIZE
        preferred_work_group_size_multiple = CL_KERNEL_PREFERRED_WORK_GROUP_SIZE_MULTIPLE
        PPCODE:
        /* ix is the clGetKernelWorkGroupInfo selector chosen by the alias;
         * the size_t result is pushed as an unsigned integer. */
        size_t amount;
        NEED_SUCCESS (GetKernelWorkGroupInfo, (self, device, ix, sizeof (amount), &amount, 0));
        EXTEND (SP, 1);
        PUSHs (sv_2mortal (newSVuv (amount)));
1907
void
compile_work_group_size (OpenCL::Kernel self, OpenCL::Device device)
        PPCODE:
        /* Pushes every entry of CL_KERNEL_COMPILE_WORK_GROUP_SIZE as an
         * unsigned integer; the entry count is derived from the byte size
         * reported by the first query.
         */
        size_t nbytes;
        NEED_SUCCESS (GetKernelWorkGroupInfo, (self, device, CL_KERNEL_COMPILE_WORK_GROUP_SIZE, 0, 0, &nbytes));

        size_t *dims = tmpbuf (nbytes);
        NEED_SUCCESS (GetKernelWorkGroupInfo, (self, device, CL_KERNEL_COMPILE_WORK_GROUP_SIZE, nbytes, dims, 0));

        int k, count = nbytes / sizeof (*dims);

        EXTEND (SP, count);
        for (k = 0; k < count; ++k)
          PUSHs (sv_2mortal (newSVuv (dims [k])));
1919
void
local_mem_size (OpenCL::Kernel self, OpenCL::Device device)
        ALIAS:
        local_mem_size = CL_KERNEL_LOCAL_MEM_SIZE
        private_mem_size = CL_KERNEL_PRIVATE_MEM_SIZE
        PPCODE:
        /* ix is the clGetKernelWorkGroupInfo selector chosen by the alias;
         * the cl_ulong result is pushed as an unsigned integer. */
        cl_ulong amount;
        NEED_SUCCESS (GetKernelWorkGroupInfo, (self, device, ix, sizeof (amount), &amount, 0));
        EXTEND (SP, 1);
        PUSHs (sv_2mortal (newSVuv (amount)));
1931
1932 #END:kernel_work_group
1933
1934 MODULE = OpenCL PACKAGE = OpenCL::Event
1935
1936 void
1937 DESTROY (OpenCL::Event self)
1938 CODE:
/* Drops the reference on the wrapped event; the status returned by clReleaseEvent is ignored. */
1939 clReleaseEvent (self);
1940
1941 void
1942 wait (OpenCL::Event self)
1943 CODE:
/* Calls clWaitForEvents with a one-element list holding this event; the returned status is not checked. */
1944 clWaitForEvents (1, &self);
1945
1946 void
1947 info (OpenCL::Event self, cl_event_info name)
1948 PPCODE:
/* The whole body comes from the INFO macro instantiated for Event; the macro is defined outside this chunk. NOTE(review): presumably it queries the property selected by name and pushes the raw result - confirm against the macro. */
1949 INFO (Event)
1950
1951 #BEGIN:event
1952
void
command_queue (OpenCL::Event self)
        PPCODE:
        /*
         * Looks up the command queue associated with the event and returns
         * it as an OpenCL::Queue object.  The queue is retained before it
         * is wrapped; presumably the wrapper's destructor releases that
         * reference again.
         */
        cl_command_queue queue;
        NEED_SUCCESS (GetEventInfo, (self, CL_EVENT_COMMAND_QUEUE, sizeof (queue), &queue, 0));
        EXTEND (SP, 1);
        NEED_SUCCESS (RetainCommandQueue, (queue));
        PUSHs (NEW_MORTAL_OBJ ("OpenCL::Queue", queue));
1964
void
command_type (OpenCL::Event self)
        PPCODE:
        /*
         * Returns the CL_EVENT_COMMAND_TYPE value of the event as an
         * unsigned integer.
         */
        cl_command_type type;
        NEED_SUCCESS (GetEventInfo, (self, CL_EVENT_COMMAND_TYPE, sizeof (type), &type, 0));
        XPUSHs (sv_2mortal (newSVuv (type)));
1973
void
reference_count (OpenCL::Event self)
        ALIAS:
        reference_count          = CL_EVENT_REFERENCE_COUNT
        command_execution_status = CL_EVENT_COMMAND_EXECUTION_STATUS
        PPCODE:
        /*
         * Both accessors share this XSUB; ix is the clGetEventInfo
         * parameter of the alias that was called.  The two results have the
         * same size but differ in signedness: the reference count is a
         * cl_uint, whereas the execution status is a cl_int that is
         * negative when the command terminated abnormally.  The status is
         * therefore returned as a signed integer; pushing it as unsigned
         * would turn an error code such as -5 into 4294967291 on the perl
         * side.
         */
        union { cl_uint count; cl_int status; } value;
        NEED_SUCCESS (GetEventInfo, (self, ix, sizeof (value), &value, 0));
        EXTEND (SP, 1);
        if (ix == CL_EVENT_COMMAND_EXECUTION_STATUS)
          {
            PUSHs (sv_2mortal (newSViv (value.status)));
          }
        else
          {
            PUSHs (sv_2mortal (newSVuv (value.count)));
          }
1985
void
context (OpenCL::Event self)
        PPCODE:
        /*
         * Looks up the context the event belongs to and returns it as an
         * OpenCL::Context object.  The context is retained before it is
         * wrapped; presumably the wrapper's destructor releases that
         * reference again.
         */
        cl_context ctx;
        NEED_SUCCESS (GetEventInfo, (self, CL_EVENT_CONTEXT, sizeof (ctx), &ctx, 0));
        EXTEND (SP, 1);
        NEED_SUCCESS (RetainContext, (ctx));
        PUSHs (NEW_MORTAL_OBJ ("OpenCL::Context", ctx));
1997
1998 #END:event
1999
void
profiling_info (OpenCL::Event self, cl_profiling_info name)
        PPCODE:
        /*
         * Generic profiling accessor: the whole body comes from the INFO
         * macro, which is defined elsewhere in this file.  Presumably it
         * queries clGetEventProfilingInfo for the requested parameter and
         * pushes the raw bytes as a string -- confirm against the macro.
         */
        INFO (EventProfiling)
2004
2005 #BEGIN:profiling
2006
void
profiling_command_queued (OpenCL::Event self)
        ALIAS:
        profiling_command_queued = CL_PROFILING_COMMAND_QUEUED
        profiling_command_submit = CL_PROFILING_COMMAND_SUBMIT
        profiling_command_start  = CL_PROFILING_COMMAND_START
        profiling_command_end    = CL_PROFILING_COMMAND_END
        PPCODE:
        /*
         * One XSUB for all four profiling counters: ix is the
         * clGetEventProfilingInfo parameter of the alias that was called.
         * The counter is read as one cl_ulong and pushed as an unsigned
         * integer.
         */
        cl_ulong counter;
        NEED_SUCCESS (GetEventProfilingInfo, (self, ix, sizeof (counter), &counter, 0));
        XPUSHs (sv_2mortal (newSVuv (counter)));
2020
2021 #END:profiling
2022
2023 MODULE = OpenCL PACKAGE = OpenCL::UserEvent
2024
void
set_status (OpenCL::UserEvent self, cl_int execution_status)
        CODE:
        /*
         * Forwards the given execution status to clSetUserEventStatus.
         * The status returned by that call is discarded, so a rejected
         * update is not reported to the caller.
         */
        (void)clSetUserEventStatus (self, execution_status);
2029