ViewVC Help
View File | Revision Log | Show Annotations | Download File
/cvs/OpenCL/OpenCL.xs
(Generate patch)

Comparing OpenCL/OpenCL.xs (file contents):
Revision 1.33 by root, Fri Apr 20 08:57:09 2012 UTC vs.
Revision 1.40 by root, Sat Apr 21 19:49:40 2012 UTC

3#include "XSUB.h" 3#include "XSUB.h"
4 4
5#ifdef I_DLFCN 5#ifdef I_DLFCN
6 #include <dlfcn.h> 6 #include <dlfcn.h>
7#endif 7#endif
8
9// how stupid is that, the 1.2 header files define CL_VERSION_1_1,
10// but then fail to define the api functions unless you ALSO define
11// this. This breaks 100% of the opencl 1.1 apps, for what reason?
12// after all, the functions are deprecated, not removed.
13// in addition, you cannot test for this in any future-proof way.
14// each time a new opencl version comes out, you need to make a new
15// release.
16#define CL_USE_DEPRECATED_OPENCL_1_1_APIS
17#define CL_USE_DEPRECATED_OPENCL_1_2_APIS /* just guessing, you stupid idiots */
8 18
9#ifdef __APPLE__ 19#ifdef __APPLE__
10 #include <OpenCL/opencl.h> 20 #include <OpenCL/opencl.h>
11#else 21#else
12 #include <CL/opencl.h> 22 #include <CL/opencl.h>
23#endif
24
25#if 0 // testing
26#undef CL_USE_DEPRECATED_OPENCL_1_1_APIS
27#undef CL_VERSION_1_2
13#endif 28#endif
14 29
15typedef cl_platform_id OpenCL__Platform; 30typedef cl_platform_id OpenCL__Platform;
16typedef cl_device_id OpenCL__Device; 31typedef cl_device_id OpenCL__Device;
17typedef cl_context OpenCL__Context; 32typedef cl_context OpenCL__Context;
89 enum { buffers = 3 }; 104 enum { buffers = 3 };
90 static int idx; 105 static int idx;
91 static void *buf [buffers]; 106 static void *buf [buffers];
92 static size_t len [buffers]; 107 static size_t len [buffers];
93 108
94 idx = ++idx % buffers; 109 idx = (idx + 1) % buffers;
95 110
96 if (len [idx] < size) 111 if (len [idx] < size)
97 { 112 {
98 free (buf [idx]); 113 free (buf [idx]);
99 len [idx] = ((size + 31) & ~4095) + 4096 - 32; 114 len [idx] = ((size + 31) & ~4095) + 4096 - 32;
257 clGetImageInfo (img, CL_IMAGE_ROW_PITCH, sizeof (res), &res, 0); 272 clGetImageInfo (img, CL_IMAGE_ROW_PITCH, sizeof (res), &res, 0);
258 return res; 273 return res;
259} 274}
260 275
261static cl_event * 276static cl_event *
262event_list (SV **items, int count) 277event_list (SV **items, cl_uint *rcount)
263{ 278{
279 cl_uint count = *rcount;
280
264 if (!count) 281 if (!count)
265 return 0; 282 return 0;
266 283
267 cl_event *list = tmpbuf (sizeof (cl_event) * count); 284 cl_event *list = tmpbuf (sizeof (cl_event) * count);
285 int i = 0;
268 286
269 while (count--) 287 do
288 {
289 --count;
290 if (SvOK (items [count]))
270 list [count] = SvPTROBJ ("clEnqueue", "wait_events", items [count], "OpenCL::Event"); 291 list [i++] = SvPTROBJ ("clEnqueue", "wait_events", items [count], "OpenCL::Event");
292 }
293 while (count);
271 294
295 *rcount = i;
296
272 return list; 297 return i ? list : 0;
273} 298}
274 299
275#define EVENT_LIST(items,count) \ 300#define EVENT_LIST(items,count) \
276 cl_uint event_list_count = (count); \ 301 cl_uint event_list_count = (count); \
277 cl_event *event_list_ptr = event_list (&ST (items), event_list_count) 302 cl_event *event_list_ptr = event_list (&ST (items), &event_list_count)
278 303
279#define INFO(class) \ 304#define INFO(class) \
280{ \ 305{ \
281 size_t size; \ 306 size_t size; \
282 NEED_SUCCESS (Get ## class ## Info, (self, name, 0, 0, &size)); \ 307 NEED_SUCCESS (Get ## class ## Info, (self, name, 0, 0, &size)); \
314} 339}
315 340
316cl_int 341cl_int
317errno () 342errno ()
318 CODE: 343 CODE:
319 errno = res; 344 RETVAL = res;
345 OUTPUT:
346 RETVAL
320 347
321const char * 348const char *
322err2str (cl_int err) 349err2str (cl_int err)
323 350
324const char * 351const char *
343context_from_type (cl_context_properties *properties = 0, cl_device_type type = CL_DEVICE_TYPE_DEFAULT, FUTURE notify = 0) 370context_from_type (cl_context_properties *properties = 0, cl_device_type type = CL_DEVICE_TYPE_DEFAULT, FUTURE notify = 0)
344 PPCODE: 371 PPCODE:
345 NEED_SUCCESS_ARG (cl_context ctx, CreateContextFromType, (properties, type, 0, 0, &res)); 372 NEED_SUCCESS_ARG (cl_context ctx, CreateContextFromType, (properties, type, 0, 0, &res));
346 XPUSH_NEW_OBJ ("OpenCL::Context", ctx); 373 XPUSH_NEW_OBJ ("OpenCL::Context", ctx);
347 374
375#if 0
376
348void 377void
349context (cl_context_properties *properties = 0, FUTURE devices, FUTURE notify = 0) 378context (cl_context_properties *properties = 0, FUTURE devices, FUTURE notify = 0)
350 PPCODE: 379 PPCODE:
351 /* der Gipfel der Kunst */ 380 /* der Gipfel der Kunst */
381
382#endif
352 383
353void 384void
354wait_for_events (...) 385wait_for_events (...)
355 CODE: 386 CODE:
356 EVENT_LIST (0, items); 387 EVENT_LIST (0, items);
698 if (!(flags & (CL_MEM_USE_HOST_PTR | CL_MEM_COPY_HOST_PTR))) 729 if (!(flags & (CL_MEM_USE_HOST_PTR | CL_MEM_COPY_HOST_PTR)))
699 croak ("OpenCL::Context::buffer_sv: you have to specify use or copy host ptr when buffer data is given, use $context->buffer instead?"); 730 croak ("OpenCL::Context::buffer_sv: you have to specify use or copy host ptr when buffer data is given, use $context->buffer instead?");
700 NEED_SUCCESS_ARG (cl_mem mem, CreateBuffer, (self, flags, len, ptr, &res)); 731 NEED_SUCCESS_ARG (cl_mem mem, CreateBuffer, (self, flags, len, ptr, &res));
701 XPUSH_NEW_OBJ ("OpenCL::BufferObj", mem); 732 XPUSH_NEW_OBJ ("OpenCL::BufferObj", mem);
702 733
734#if !CL_VERSION_1_2 || defined CL_USE_DEPRECATED_OPENCL_1_1_APIS
735
703void 736void
704image2d (OpenCL::Context self, cl_mem_flags flags, cl_channel_order channel_order, cl_channel_type channel_type, size_t width, size_t height, size_t row_pitch = 0, SV *data = &PL_sv_undef) 737image2d (OpenCL::Context self, cl_mem_flags flags, cl_channel_order channel_order, cl_channel_type channel_type, size_t width, size_t height, size_t row_pitch = 0, SV *data = &PL_sv_undef)
705 PPCODE: 738 PPCODE:
706 STRLEN len; 739 STRLEN len;
707 char *ptr = SvOK (data) ? SvPVbyte (data, len) : 0; 740 char *ptr = SvOK (data) ? SvPVbyte (data, len) : 0;
716 char *ptr = SvOK (data) ? SvPVbyte (data, len) : 0; 749 char *ptr = SvOK (data) ? SvPVbyte (data, len) : 0;
717 const cl_image_format format = { channel_order, channel_type }; 750 const cl_image_format format = { channel_order, channel_type };
718 NEED_SUCCESS_ARG (cl_mem mem, CreateImage3D, (self, flags, &format, width, height, depth, row_pitch, slice_pitch, ptr, &res)); 751 NEED_SUCCESS_ARG (cl_mem mem, CreateImage3D, (self, flags, &format, width, height, depth, row_pitch, slice_pitch, ptr, &res));
719 XPUSH_NEW_OBJ ("OpenCL::Image3D", mem); 752 XPUSH_NEW_OBJ ("OpenCL::Image3D", mem);
720 753
754#endif
755
721#if cl_apple_gl_sharing || cl_khr_gl_sharing 756#if cl_apple_gl_sharing || cl_khr_gl_sharing
722 757
723void 758void
724gl_buffer (OpenCL::Context self, cl_mem_flags flags, cl_GLuint bufobj) 759gl_buffer (OpenCL::Context self, cl_mem_flags flags, cl_GLuint bufobj)
725 PPCODE: 760 PPCODE:
726 NEED_SUCCESS_ARG (cl_mem mem, CreateFromGLBuffer, (self, flags, bufobj, &res)); 761 NEED_SUCCESS_ARG (cl_mem mem, CreateFromGLBuffer, (self, flags, bufobj, &res));
727 XPUSH_NEW_OBJ ("OpenCL::BufferObj", mem); 762 XPUSH_NEW_OBJ ("OpenCL::BufferObj", mem);
728 763
729void 764void
765gl_renderbuffer (OpenCL::Context self, cl_mem_flags flags, cl_GLuint renderbuffer)
766 PPCODE:
767 NEED_SUCCESS_ARG (cl_mem mem, CreateFromGLRenderbuffer, (self, flags, renderbuffer, &res));
768 XPUSH_NEW_OBJ ("OpenCL::Image2D", mem);
769
770#if CL_VERSION_1_2
771
772void
773gl_texture (OpenCL::Context self, cl_mem_flags flags, cl_GLenum target, cl_GLint miplevel, cl_GLuint texture)
774 PPCODE:
775 char *klass = "OpenCL::Memory";
776 cl_gl_object_type t;
777 NEED_SUCCESS_ARG (cl_mem mem, CreateFromGLTexture2D, (self, flags, target, miplevel, texture, &res));
778 NEED_SUCCESS (GetGLObjectInfo, (mem, &t, 0));
779 switch (t)
780 {
781 case CL_GL_OBJECT_TEXTURE_BUFFER: klass = "OpenCL::Image1DBuffer"; break;
782 case CL_GL_OBJECT_TEXTURE1D: klass = "OpenCL::Image1D"; break;
783 case CL_GL_OBJECT_TEXTURE1D_ARRAY: klass = "OpenCL::Image2DArray"; break;
784 case CL_GL_OBJECT_TEXTURE2D: klass = "OpenCL::Image2D"; break;
785 case CL_GL_OBJECT_TEXTURE2D_ARRAY: klass = "OpenCL::Image2DArray"; break;
786 case CL_GL_OBJECT_TEXTURE3D: klass = "OpenCL::Image3D"; break;
787 }
788 XPUSH_NEW_OBJ (klass, mem);
789
790#endif
791
792#if !CL_VERSION_1_2 || defined CL_USE_DEPRECATED_OPENCL_1_1_APIS
793
794void
730gl_texture2d (OpenCL::Context self, cl_mem_flags flags, cl_GLenum target, cl_GLint miplevel, cl_GLuint texture) 795gl_texture2d (OpenCL::Context self, cl_mem_flags flags, cl_GLenum target, cl_GLint miplevel, cl_GLuint texture)
731 PPCODE: 796 PPCODE:
732 NEED_SUCCESS_ARG (cl_mem mem, CreateFromGLTexture2D, (self, flags, target, miplevel, texture, &res)); 797 NEED_SUCCESS_ARG (cl_mem mem, CreateFromGLTexture2D, (self, flags, target, miplevel, texture, &res));
733 XPUSH_NEW_OBJ ("OpenCL::Image2D", mem); 798 XPUSH_NEW_OBJ ("OpenCL::Image2D", mem);
734 799
736gl_texture3d (OpenCL::Context self, cl_mem_flags flags, cl_GLenum target, cl_GLint miplevel, cl_GLuint texture) 801gl_texture3d (OpenCL::Context self, cl_mem_flags flags, cl_GLenum target, cl_GLint miplevel, cl_GLuint texture)
737 PPCODE: 802 PPCODE:
738 NEED_SUCCESS_ARG (cl_mem mem, CreateFromGLTexture3D, (self, flags, target, miplevel, texture, &res)); 803 NEED_SUCCESS_ARG (cl_mem mem, CreateFromGLTexture3D, (self, flags, target, miplevel, texture, &res));
739 XPUSH_NEW_OBJ ("OpenCL::Image3D", mem); 804 XPUSH_NEW_OBJ ("OpenCL::Image3D", mem);
740 805
741void 806#endif
742gl_renderbuffer (OpenCL::Context self, cl_mem_flags flags, cl_GLuint renderbuffer)
743 PPCODE:
744 NEED_SUCCESS_ARG (cl_mem mem, CreateFromGLRenderbuffer, (self, flags, renderbuffer, &res));
745 XPUSH_NEW_OBJ ("OpenCL::Image2D", mem);
746 807
747#endif 808#endif
748 809
749void 810void
750supported_image_formats (OpenCL::Context self, cl_mem_flags flags, cl_mem_object_type image_type) 811supported_image_formats (OpenCL::Context self, cl_mem_flags flags, cl_mem_object_type image_type)
855 cl_event ev = 0; 916 cl_event ev = 0;
856 STRLEN len; 917 STRLEN len;
857 char *ptr = SvPVbyte (data, len); 918 char *ptr = SvPVbyte (data, len);
858 EVENT_LIST (5, items - 5); 919 EVENT_LIST (5, items - 5);
859 920
860 NEED_SUCCESS (EnqueueReadBuffer, (self, mem, blocking, offset, len, ptr, event_list_count, event_list_ptr, GIMME_V != G_VOID ? &ev : 0)); 921 NEED_SUCCESS (EnqueueWriteBuffer, (self, mem, blocking, offset, len, ptr, event_list_count, event_list_ptr, GIMME_V != G_VOID ? &ev : 0));
861 922
862 if (ev) 923 if (ev)
863 XPUSH_NEW_OBJ ("OpenCL::Event", ev); 924 XPUSH_NEW_OBJ ("OpenCL::Event", ev);
864 925
865void 926void
931 size_t min_len = host_row_pitch * host_slice_pitch * region [2]; 992 size_t min_len = host_row_pitch * host_slice_pitch * region [2];
932 993
933 if (len < min_len) 994 if (len < min_len)
934 croak ("clEnqueueWriteImage: data string is shorter than what would be transferred"); 995 croak ("clEnqueueWriteImage: data string is shorter than what would be transferred");
935 996
936 NEED_SUCCESS (EnqueueWriteBufferRect, (self, buf, blocking, buf_origin, host_origin, region, buf_row_pitch, buf_slice_pitch, host_row_pitch, host_slice_pitch, SvPVX (data), event_list_count, event_list_ptr, GIMME_V != G_VOID ? &ev : 0)); 997 NEED_SUCCESS (EnqueueWriteBufferRect, (self, buf, blocking, buf_origin, host_origin, region, buf_row_pitch, buf_slice_pitch, host_row_pitch, host_slice_pitch, ptr, event_list_count, event_list_ptr, GIMME_V != G_VOID ? &ev : 0));
937 998
938 if (ev) 999 if (ev)
939 XPUSH_NEW_OBJ ("OpenCL::Event", ev); 1000 XPUSH_NEW_OBJ ("OpenCL::Event", ev);
940 1001
941void 1002void
996 size_t min_len = slice_pitch ? slice_pitch * depth : row_pitch * height; 1057 size_t min_len = slice_pitch ? slice_pitch * depth : row_pitch * height;
997 1058
998 if (len < min_len) 1059 if (len < min_len)
999 croak ("clEnqueueWriteImage: data string is shorter than what would be transferred"); 1060 croak ("clEnqueueWriteImage: data string is shorter than what would be transferred");
1000 1061
1001 NEED_SUCCESS (EnqueueWriteImage, (self, dst, blocking, dst_origin, region, row_pitch, slice_pitch, SvPVX (data), event_list_count, event_list_ptr, GIMME_V != G_VOID ? &ev : 0)); 1062 NEED_SUCCESS (EnqueueWriteImage, (self, dst, blocking, dst_origin, region, row_pitch, slice_pitch, ptr, event_list_count, event_list_ptr, GIMME_V != G_VOID ? &ev : 0));
1002 1063
1003 if (ev) 1064 if (ev)
1004 XPUSH_NEW_OBJ ("OpenCL::Event", ev); 1065 XPUSH_NEW_OBJ ("OpenCL::Event", ev);
1005 1066
1006void 1067void
1088 gwo [i] = SvIV (AvARRAY (SvRV (global_work_offset))[i]); 1149 gwo [i] = SvIV (AvARRAY (SvRV (global_work_offset))[i]);
1089 } 1150 }
1090 1151
1091 if (SvOK (local_work_size)) 1152 if (SvOK (local_work_size))
1092 { 1153 {
1093 if (SvOK (local_work_size) && !SvROK (local_work_size) || SvTYPE (SvRV (local_work_size)) != SVt_PVAV) 1154 if ((SvOK (local_work_size) && !SvROK (local_work_size)) || SvTYPE (SvRV (local_work_size)) != SVt_PVAV)
1094 croak ("clEnqueueNDRangeKernel: global_work_size must be undef or an array reference"); 1155 croak ("clEnqueueNDRangeKernel: global_work_size must be undef or an array reference");
1095 1156
1096 if (AvFILLp (SvRV (local_work_size)) + 1 != gws_len) 1157 if (AvFILLp (SvRV (local_work_size)) + 1 != gws_len)
1097 croak ("clEnqueueNDRangeKernel: local_work_local must be undef or an array of same size as global_work_size"); 1158 croak ("clEnqueueNDRangeKernel: local_work_local must be undef or an array of same size as global_work_size");
1098 1159
1110 1171
1111void 1172void
1112enqueue_acquire_gl_objects (OpenCL::Queue self, SV *objects, ...) 1173enqueue_acquire_gl_objects (OpenCL::Queue self, SV *objects, ...)
1113 ALIAS: 1174 ALIAS:
1114 enqueue_release_gl_objects = 1 1175 enqueue_release_gl_objects = 1
1115 CODE: 1176 PPCODE:
1116 if (!SvROK (objects) || SvTYPE (SvRV (objects)) != SVt_PVAV) 1177 if (!SvROK (objects) || SvTYPE (SvRV (objects)) != SVt_PVAV)
1117 croak ("OpenCL::Queue::enqueue_acquire/release_gl_objects argument 'objects' must be an arrayref with memory objects, in call"); 1178 croak ("OpenCL::Queue::enqueue_acquire/release_gl_objects argument 'objects' must be an arrayref with memory objects, in call");
1118 1179
1119 cl_event ev = 0; 1180 cl_event ev = 0;
1120 EVENT_LIST (2, items - 2); 1181 EVENT_LIST (2, items - 2);
1134 if (ev) 1195 if (ev)
1135 XPUSH_NEW_OBJ ("OpenCL::Event", ev); 1196 XPUSH_NEW_OBJ ("OpenCL::Event", ev);
1136 1197
1137#endif 1198#endif
1138 1199
1139void 1200#if !CL_VERSION_1_2 || defined CL_USE_DEPRECATED_OPENCL_1_1_APIS
1140enqueue_marker (OpenCL::Queue self)
1141 PPCODE:
1142 cl_event ev;
1143 NEED_SUCCESS (EnqueueMarker, (self, &ev));
1144 XPUSH_NEW_OBJ ("OpenCL::Event", ev);
1145 1201
1146void 1202void
1147enqueue_wait_for_events (OpenCL::Queue self, ...) 1203enqueue_wait_for_events (OpenCL::Queue self, ...)
1148 CODE: 1204 CODE:
1149 EVENT_LIST (1, items - 1); 1205 EVENT_LIST (1, items - 1);
1150 NEED_SUCCESS (EnqueueWaitForEvents, (self, event_list_count, event_list_ptr)); 1206 NEED_SUCCESS (EnqueueWaitForEvents, (self, event_list_count, event_list_ptr));
1151 1207
1208#endif
1209
1152void 1210void
1211enqueue_marker (OpenCL::Queue self, ...)
1212 PPCODE:
1213 cl_event ev = 0;
1214 EVENT_LIST (1, items - 1);
1215#if CL_VERSION_1_2
1216 NEED_SUCCESS (EnqueueMarkerWithWaitList, (self, event_list_count, event_list_ptr, GIMME_V != G_VOID ? &ev : 0));
1217#else
1218 if (event_list_count)
1219 croak ("OpenCL::Queue->enqueue_marker does not support a wait list in OpenCL 1.1 - upgrade to 1.2");
1220 NEED_SUCCESS (EnqueueMarker, (self, GIMME_V != G_VOID ? &ev : 0));
1221#endif
1222 if (ev)
1223 XPUSH_NEW_OBJ ("OpenCL::Event", ev);
1224
1225void
1153enqueue_barrier (OpenCL::Queue self) 1226enqueue_barrier (OpenCL::Queue self, ...)
1154 CODE: 1227 PPCODE:
1228 cl_event ev = 0;
1229 EVENT_LIST (1, items - 1);
1230#if CL_VERSION_1_2
1231 NEED_SUCCESS (EnqueueBarrierWithWaitList, (self, event_list_count, event_list_ptr, &ev));
1232#else
1233 if (event_list_count)
1234 croak ("OpenCL::Queue->enqueue_barrier does not support a wait list in OpenCL 1.1 - upgrade to 1.2");
1235 if (GIMME_V != G_VOID)
1236 croak ("OpenCL::Queue->enqueue_barrier does not return an event object in OpenCL 1.1 - upgrade to 1.2");
1155 NEED_SUCCESS (EnqueueBarrier, (self)); 1237 NEED_SUCCESS (EnqueueBarrier, (self));
1238#endif
1239 if (ev)
1240 XPUSH_NEW_OBJ ("OpenCL::Event", ev);
1156 1241
1157void 1242void
1158flush (OpenCL::Queue self) 1243flush (OpenCL::Queue self)
1159 CODE: 1244 CODE:
1160 NEED_SUCCESS (Flush, (self)); 1245 NEED_SUCCESS (Flush, (self));
1530 { 1615 {
1531 SV *sv = sv_2mortal (newSV (sizes [i])); 1616 SV *sv = sv_2mortal (newSV (sizes [i]));
1532 SvUPGRADE (sv, SVt_PV); 1617 SvUPGRADE (sv, SVt_PV);
1533 SvPOK_only (sv); 1618 SvPOK_only (sv);
1534 SvCUR_set (sv, sizes [i]); 1619 SvCUR_set (sv, sizes [i]);
1535 ptrs [i] = SvPVX (sv); 1620 ptrs [i] = (void *)SvPVX (sv);
1536 PUSHs (sv); 1621 PUSHs (sv);
1537 } 1622 }
1538 1623
1539 NEED_SUCCESS (GetProgramInfo, (self, CL_PROGRAM_BINARIES , sizeof (*ptrs ) * n, ptrs , &size)); 1624 NEED_SUCCESS (GetProgramInfo, (self, CL_PROGRAM_BINARIES , sizeof (*ptrs ) * n, ptrs , &size));
1540 if (size != sizeof (*ptrs) * n) XSRETURN_EMPTY; 1625 if (size != sizeof (*ptrs) * n) XSRETURN_EMPTY;

Diff Legend

- Removed lines
+ Added lines
< Changed lines
> Changed lines