ViewVC Help
View File | Revision Log | Show Annotations | Download File
/cvs/OpenCL/OpenCL.xs
(Generate patch)

Comparing OpenCL/OpenCL.xs (file contents):
Revision 1.4 by root, Tue Nov 15 21:13:42 2011 UTC vs.
Revision 1.11 by root, Thu Nov 17 04:17:43 2011 UTC

20typedef cl_mem OpenCL__Image3D_ornull; 20typedef cl_mem OpenCL__Image3D_ornull;
21typedef cl_sampler OpenCL__Sampler; 21typedef cl_sampler OpenCL__Sampler;
22typedef cl_program OpenCL__Program; 22typedef cl_program OpenCL__Program;
23typedef cl_kernel OpenCL__Kernel; 23typedef cl_kernel OpenCL__Kernel;
24typedef cl_event OpenCL__Event; 24typedef cl_event OpenCL__Event;
25typedef cl_event OpenCL__UserEvent;
26
27typedef SV *FUTURE;
28
29/*****************************************************************************/
30
31/* up to two temporary buffers */
32static void *
33tmpbuf (size_t size)
34{
35 static int idx;
36 static void *buf [2];
37 static size_t len [2];
38
39 idx ^= 1;
40
41 if (len [idx] < size)
42 {
43 free (buf [idx]);
44 len [idx] = ((size + 31) & ~4095) + 4096 - 32;
45 buf [idx] = malloc (len [idx]);
46 }
47
48 return buf [idx];
49}
50
51/*****************************************************************************/
25 52
26typedef struct 53typedef struct
27{ 54{
28 IV iv; 55 IV iv;
29 const char *name; 56 const char *name;
63 }; 90 };
64 91
65 return iv2str (err, errstr, sizeof (errstr) / sizeof (errstr [0]), "ERROR(%d)"); 92 return iv2str (err, errstr, sizeof (errstr) / sizeof (errstr [0]), "ERROR(%d)");
66} 93}
67 94
95/*****************************************************************************/
96
97static cl_int res;
98
68#define FAIL(name,res) \ 99#define FAIL(name) \
69 croak ("cl" # name ": %s", err2str (res)); 100 croak ("cl" # name ": %s", err2str (res));
70 101
71#define NEED_SUCCESS(name,args) \ 102#define NEED_SUCCESS(name,args) \
72 do { \ 103 do { \
73 cl_int res = cl ## name args; \ 104 res = cl ## name args; \
74 \ 105 \
75 if (res) \ 106 if (res) \
76 FAIL (name, res); \ 107 FAIL (name); \
77 } while (0) 108 } while (0)
109
110#define NEED_SUCCESS_ARG(retdecl, name, args) \
111 retdecl = cl ## name args; \
112 if (res) \
113 FAIL (name);
114
115/*****************************************************************************/
78 116
79#define NEW_MORTAL_OBJ(class,ptr) sv_setref_pv (sv_newmortal (), class, ptr) 117#define NEW_MORTAL_OBJ(class,ptr) sv_setref_pv (sv_newmortal (), class, ptr)
80#define XPUSH_NEW_OBJ(class,ptr) XPUSHs (NEW_MORTAL_OBJ (class, ptr)) 118#define XPUSH_NEW_OBJ(class,ptr) XPUSHs (NEW_MORTAL_OBJ (class, ptr))
81 119
82/*TODO*/ 120static void *
83#define EVENT_LIST(items,count) cl_uint event_list_count = 0; cl_event *event_list_ptr = 0 121SvPTROBJ (const char *func, const char *svname, SV *sv, const char *pkg)
122{
123 if (SvROK (sv) && sv_derived_from (sv, pkg))
124 return (void *)SvIV (SvRV (sv));
125
126 croak ("%s: %s is not of type %s", func, svname, pkg);
127}
128
129/*****************************************************************************/
130
131static size_t
132img_row_pitch (cl_mem img)
133{
134 size_t res;
135 clGetImageInfo (img, CL_IMAGE_ROW_PITCH, sizeof (res), &res, 0);
136 return res;
137}
138
139static cl_event *
140event_list (SV **items, int count)
141{
142 cl_event *list = tmpbuf (sizeof (cl_event) * count);
143
144 while (count--)
145 list [count] = SvPTROBJ ("clEnqueue", "wait_events", items [count], "OpenCL::Event");
146
147 return list;
148}
149
150#define EVENT_LIST(items,count) \
151 cl_uint event_list_count = (count); \
152 cl_event *event_list_ptr = event_list (&ST (items), event_list_count)
84 153
85#define INFO(class) \ 154#define INFO(class) \
86{ \ 155{ \
87 size_t size; \ 156 size_t size; \
88 SV *sv; \
89 \
90 NEED_SUCCESS (Get ## class ## Info, (this, name, 0, 0, &size)); \ 157 NEED_SUCCESS (Get ## class ## Info, (this, name, 0, 0, &size)); \
91 sv = sv_2mortal (newSV (size)); \ 158 SV *sv = sv_2mortal (newSV (size)); \
92 SvUPGRADE (sv, SVt_PV); \ 159 SvUPGRADE (sv, SVt_PV); \
93 SvPOK_only (sv); \ 160 SvPOK_only (sv); \
94 SvCUR_set (sv, size); \ 161 SvCUR_set (sv, size); \
95 NEED_SUCCESS (Get ## class ## Info, (this, name, size, SvPVX (sv), 0)); \ 162 NEED_SUCCESS (Get ## class ## Info, (this, name, size, SvPVX (sv), 0)); \
96 XPUSHs (sv); \ 163 XPUSHs (sv); \
97} 164}
98 165
99static void *
100SvPTROBJ (const char *func, const char *svname, SV *sv, const char *pkg)
101{
102 if (SvROK (sv) && sv_derived_from (sv, pkg))
103 return (void *)SvIV (SvRV (sv));
104
105 croak ("%s: %s is not of type %s", func, svname, pkg);
106}
107
108static void *
109tmpbuf (size_t size)
110{
111 static void *buf;
112 static size_t len;
113
114 if (len < size)
115 {
116 free (buf);
117 len = ((size + 31) & ~4095) + 4096 - 32;
118 buf = malloc (len);
119 }
120
121 return buf;
122}
123
124MODULE = OpenCL PACKAGE = OpenCL 166MODULE = OpenCL PACKAGE = OpenCL
125 167
126PROTOTYPES: ENABLE 168PROTOTYPES: ENABLE
127 169
128BOOT: 170BOOT:
129{ 171{
130 HV *stash = gv_stashpv ("OpenCL", 1); 172 HV *stash = gv_stashpv ("OpenCL", 1);
131 static const ivstr *civ, const_iv[] = { 173 static const ivstr *civ, const_iv[] = {
132 { sizeof (cl_char ), "SIZEOF_CHAR" }, 174 { sizeof (cl_char ), "SIZEOF_CHAR" },
133 { sizeof (cl_uchar ), "SIZEOF_UCHAR" }, 175 { sizeof (cl_uchar ), "SIZEOF_UCHAR" },
134 { sizeof (cl_short ), "SIZEOF_SHORT" }, 176 { sizeof (cl_short ), "SIZEOF_SHORT" },
135 { sizeof (cl_ushort), "SIZEOF_USHORT"}, 177 { sizeof (cl_ushort), "SIZEOF_USHORT" },
136 { sizeof (cl_int ), "SIZEOF_INT" }, 178 { sizeof (cl_int ), "SIZEOF_INT" },
137 { sizeof (cl_uint ), "SIZEOF_UINT" }, 179 { sizeof (cl_uint ), "SIZEOF_UINT" },
138 { sizeof (cl_long ), "SIZEOF_LONG" }, 180 { sizeof (cl_long ), "SIZEOF_LONG" },
139 { sizeof (cl_ulong ), "SIZEOF_ULONG" }, 181 { sizeof (cl_ulong ), "SIZEOF_ULONG" },
140 { sizeof (cl_half ), "SIZEOF_HALF" }, 182 { sizeof (cl_half ), "SIZEOF_HALF" },
141 { sizeof (cl_float ), "SIZEOF_FLOAT" }, 183 { sizeof (cl_float ), "SIZEOF_FLOAT" },
184 { sizeof (cl_double), "SIZEOF_DOUBLE" },
142#include "constiv.h" 185#include "constiv.h"
143 }; 186 };
144 for (civ = const_iv + sizeof (const_iv) / sizeof (const_iv [0]); civ > const_iv; civ--) 187 for (civ = const_iv + sizeof (const_iv) / sizeof (const_iv [0]); civ > const_iv; civ--)
145 newCONSTSUB (stash, (char *)civ[-1].name, newSViv (civ[-1].iv)); 188 newCONSTSUB (stash, (char *)civ[-1].name, newSViv (civ[-1].iv));
146} 189}
147 190
191cl_int
192errno ()
193 CODE:
194 errno = res;
195
148const char * 196const char *
149err2str (cl_int err) 197err2str (cl_int err)
150 198
151const char * 199const char *
152enum2str (cl_uint value) 200enum2str (cl_uint value)
153 201
154void 202void
155platforms () 203platforms ()
156 PPCODE: 204 PPCODE:
157{
158 cl_platform_id *list; 205 cl_platform_id *list;
159 cl_uint count; 206 cl_uint count;
160 int i; 207 int i;
161 208
162 NEED_SUCCESS (GetPlatformIDs, (0, 0, &count)); 209 NEED_SUCCESS (GetPlatformIDs, (0, 0, &count));
164 NEED_SUCCESS (GetPlatformIDs, (count, list, 0)); 211 NEED_SUCCESS (GetPlatformIDs, (count, list, 0));
165 212
166 EXTEND (SP, count); 213 EXTEND (SP, count);
167 for (i = 0; i < count; ++i) 214 for (i = 0; i < count; ++i)
168 PUSHs (NEW_MORTAL_OBJ ("OpenCL::Platform", list [i])); 215 PUSHs (NEW_MORTAL_OBJ ("OpenCL::Platform", list [i]));
169}
170 216
171void 217void
172context_from_type_simple (cl_device_type type = CL_DEVICE_TYPE_DEFAULT) 218context_from_type (FUTURE properties = 0, cl_device_type type = CL_DEVICE_TYPE_DEFAULT, FUTURE notify = 0)
173 PPCODE: 219 PPCODE:
174{
175 cl_int res;
176 cl_context ctx = clCreateContextFromType (0, type, 0, 0, &res); 220 NEED_SUCCESS_ARG (cl_context ctx, CreateContextFromType, (0, type, 0, 0, &res));
177
178 if (res)
179 FAIL (CreateContextFromType, res);
180
181 XPUSH_NEW_OBJ ("OpenCL::Context", ctx); 221 XPUSH_NEW_OBJ ("OpenCL::Context", ctx);
182} 222
223void
224context (FUTURE properties, FUTURE devices, FUTURE notify = 0)
225 PPCODE:
226 /* der Gipfel der Kunst */
183 227
184void 228void
185wait_for_events (...) 229wait_for_events (...)
186 CODE: 230 CODE:
187{
188 EVENT_LIST (0, items); 231 EVENT_LIST (0, items);
189 NEED_SUCCESS (WaitForEvents, (event_list_count, event_list_ptr)); 232 NEED_SUCCESS (WaitForEvents, (event_list_count, event_list_ptr));
190}
191 233
192PROTOTYPES: DISABLE 234PROTOTYPES: DISABLE
193 235
194MODULE = OpenCL PACKAGE = OpenCL::Platform 236MODULE = OpenCL PACKAGE = OpenCL::Platform
195 237
199 INFO (Platform) 241 INFO (Platform)
200 242
201void 243void
202devices (OpenCL::Platform this, cl_device_type type = CL_DEVICE_TYPE_ALL) 244devices (OpenCL::Platform this, cl_device_type type = CL_DEVICE_TYPE_ALL)
203 PPCODE: 245 PPCODE:
204{
205 cl_device_id *list; 246 cl_device_id *list;
206 cl_uint count; 247 cl_uint count;
207 int i; 248 int i;
208 249
209 NEED_SUCCESS (GetDeviceIDs, (this, type, 0, 0, &count)); 250 NEED_SUCCESS (GetDeviceIDs, (this, type, 0, 0, &count));
211 NEED_SUCCESS (GetDeviceIDs, (this, type, count, list, 0)); 252 NEED_SUCCESS (GetDeviceIDs, (this, type, count, list, 0));
212 253
213 EXTEND (SP, count); 254 EXTEND (SP, count);
214 for (i = 0; i < count; ++i) 255 for (i = 0; i < count; ++i)
215 PUSHs (sv_setref_pv (sv_newmortal (), "OpenCL::Device", list [i])); 256 PUSHs (sv_setref_pv (sv_newmortal (), "OpenCL::Device", list [i]));
216}
217 257
218void 258void
259context (OpenCL::Platform this, FUTURE properties, SV *devices, FUTURE notify = 0)
260 PPCODE:
261 if (!SvROK (devices) || SvTYPE (SvRV (devices)) != SVt_PVAV)
262 croak ("OpenCL::Platform argument 'device' must be an arrayref with device objects, in call");
263
264 AV *av = (AV *)SvRV (devices);
265 cl_uint num_devices = av_len (av) + 1;
266 cl_device_id *device_list = tmpbuf (sizeof (cl_device_id) * num_devices);
267 int i;
268
269 for (i = num_devices; i--; )
270 device_list [i] = SvPTROBJ ("clCreateContext", "devices", *av_fetch (av, i, 0), "OpenCL::Device");
271
272 NEED_SUCCESS_ARG (cl_context ctx, CreateContext, (0, num_devices, device_list, 0, 0, &res));
273 XPUSH_NEW_OBJ ("OpenCL::Context", ctx);
274
275void
219context_from_type_simple (OpenCL::Platform this, cl_device_type type = CL_DEVICE_TYPE_DEFAULT) 276context_from_type (OpenCL::Platform this, FUTURE properties = 0, cl_device_type type = CL_DEVICE_TYPE_DEFAULT, FUTURE notify = 0)
220 PPCODE: 277 PPCODE:
221{
222 cl_int res;
223 cl_context_properties props[] = { CL_CONTEXT_PLATFORM, (cl_context_properties)this, 0 }; 278 cl_context_properties props[] = { CL_CONTEXT_PLATFORM, (cl_context_properties)this, 0 };
224 cl_context ctx = clCreateContextFromType (props, type, 0, 0, &res); 279 NEED_SUCCESS_ARG (cl_context ctx, CreateContextFromType, (props, type, 0, 0, &res));
225
226 if (res)
227 FAIL (CreateContextFromType, res);
228
229 XPUSH_NEW_OBJ ("OpenCL::Context", ctx); 280 XPUSH_NEW_OBJ ("OpenCL::Context", ctx);
230}
231 281
232MODULE = OpenCL PACKAGE = OpenCL::Device 282MODULE = OpenCL PACKAGE = OpenCL::Device
233 283
234void 284void
235info (OpenCL::Device this, cl_device_info name) 285info (OpenCL::Device this, cl_device_info name)
236 PPCODE: 286 PPCODE:
237 INFO (Device) 287 INFO (Device)
238 288
239void
240context_simple (OpenCL::Device this)
241 PPCODE:
242{
243 cl_int res;
244 cl_context ctx = clCreateContext (0, 1, &this, 0, 0, &res);
245
246 if (res)
247 FAIL (CreateContext, res);
248
249 XPUSH_NEW_OBJ ("OpenCL::Context", ctx);
250}
251
252MODULE = OpenCL PACKAGE = OpenCL::Context 289MODULE = OpenCL PACKAGE = OpenCL::Context
253 290
254void 291void
255DESTROY (OpenCL::Context context) 292DESTROY (OpenCL::Context context)
256 CODE: 293 CODE:
260info (OpenCL::Context this, cl_context_info name) 297info (OpenCL::Context this, cl_context_info name)
261 PPCODE: 298 PPCODE:
262 INFO (Context) 299 INFO (Context)
263 300
264void 301void
265command_queue_simple (OpenCL::Context this, OpenCL::Device device) 302queue (OpenCL::Context this, OpenCL::Device device, cl_command_queue_properties properties = 0)
266 PPCODE: 303 PPCODE:
267{
268 cl_int res;
269 cl_command_queue queue = clCreateCommandQueue (this, device, 0, &res); 304 NEED_SUCCESS_ARG (cl_command_queue queue, CreateCommandQueue, (this, device, properties, &res));
270
271 if (res)
272 FAIL (CreateCommandQueue, res);
273
274 XPUSH_NEW_OBJ ("OpenCL::Queue", queue); 305 XPUSH_NEW_OBJ ("OpenCL::Queue", queue);
275} 306
307void
308user_event (OpenCL::Context this)
309 PPCODE:
310 NEED_SUCCESS_ARG (cl_event ev, CreateUserEvent, (this, &res));
311 XPUSH_NEW_OBJ ("OpenCL::UserEvent", ev);
276 312
277void 313void
278buffer (OpenCL::Context this, cl_mem_flags flags, size_t len) 314buffer (OpenCL::Context this, cl_mem_flags flags, size_t len)
279 PPCODE: 315 PPCODE:
280{
281 cl_int res;
282 cl_mem mem;
283
284 if (flags & (CL_MEM_USE_HOST_PTR | CL_MEM_COPY_HOST_PTR)) 316 if (flags & (CL_MEM_USE_HOST_PTR | CL_MEM_COPY_HOST_PTR))
285 croak ("clCreateBuffer: cannot use/copy host ptr when no data is given, use $context->buffer_sv instead?"); 317 croak ("clCreateBuffer: cannot use/copy host ptr when no data is given, use $context->buffer_sv instead?");
286 318
287 mem = clCreateBuffer (this, flags, len, 0, &res); 319 NEED_SUCCESS_ARG (cl_mem mem, CreateBuffer, (this, flags, len, 0, &res));
288
289 if (res)
290 FAIL (CreateBuffer, res);
291
292 XPUSH_NEW_OBJ ("OpenCL::Buffer", mem); 320 XPUSH_NEW_OBJ ("OpenCL::Buffer", mem);
293}
294 321
295void 322void
296buffer_sv (OpenCL::Context this, cl_mem_flags flags, SV *data) 323buffer_sv (OpenCL::Context this, cl_mem_flags flags, SV *data)
297 PPCODE: 324 PPCODE:
298{
299 STRLEN len; 325 STRLEN len;
300 char *ptr = SvPVbyte (data, len); 326 char *ptr = SvPVbyte (data, len);
301 cl_int res;
302 cl_mem mem;
303 327
304 if (!(flags & (CL_MEM_USE_HOST_PTR | CL_MEM_COPY_HOST_PTR))) 328 if (!(flags & (CL_MEM_USE_HOST_PTR | CL_MEM_COPY_HOST_PTR)))
305 croak ("clCreateBuffer: have to specify use or copy host ptr when buffer data is given, use $context->buffer instead?"); 329 croak ("clCreateBuffer: have to specify use or copy host ptr when buffer data is given, use $context->buffer instead?");
306 330
307 mem = clCreateBuffer (this, flags, len, ptr, &res); 331 NEED_SUCCESS_ARG (cl_mem mem, CreateBuffer, (this, flags, len, ptr, &res));
308
309 if (res)
310 FAIL (CreateBuffer, res);
311
312 XPUSH_NEW_OBJ ("OpenCL::Buffer", mem); 332 XPUSH_NEW_OBJ ("OpenCL::Buffer", mem);
313}
314 333
315void 334void
316image2d (OpenCL::Context this, cl_mem_flags flags, cl_channel_order channel_order, cl_channel_type channel_type, size_t width, size_t height, SV *data) 335image2d (OpenCL::Context this, cl_mem_flags flags, cl_channel_order channel_order, cl_channel_type channel_type, size_t width, size_t height, size_t row_pitch, SV *data)
317 PPCODE: 336 PPCODE:
318{
319 STRLEN len; 337 STRLEN len;
320 char *ptr = SvPVbyte (data, len); 338 char *ptr = SvPVbyte (data, len);
321 const cl_image_format format = { channel_order, channel_type }; 339 const cl_image_format format = { channel_order, channel_type };
322 cl_int res;
323 cl_mem mem = clCreateImage2D (this, flags, &format, width, height, len / height, ptr, &res); 340 NEED_SUCCESS_ARG (cl_mem mem, CreateImage2D, (this, flags, &format, width, height, row_pitch, ptr, &res));
324
325 if (res)
326 FAIL (CreateImage2D, res);
327
328 XPUSH_NEW_OBJ ("OpenCL::Image2D", mem); 341 XPUSH_NEW_OBJ ("OpenCL::Image2D", mem);
329}
330 342
331void 343void
332image3d (OpenCL::Context this, cl_mem_flags flags, cl_channel_order channel_order, cl_channel_type channel_type, size_t width, size_t height, size_t depth, size_t slice_pitch, SV *data) 344image3d (OpenCL::Context this, cl_mem_flags flags, cl_channel_order channel_order, cl_channel_type channel_type, size_t width, size_t height, size_t depth, size_t row_pitch, size_t slice_pitch, SV *data)
333 PPCODE: 345 PPCODE:
334{
335 STRLEN len; 346 STRLEN len;
336 char *ptr = SvPVbyte (data, len); 347 char *ptr = SvPVbyte (data, len);
337 const cl_image_format format = { channel_order, channel_type }; 348 const cl_image_format format = { channel_order, channel_type };
338 cl_int res; 349 NEED_SUCCESS_ARG (cl_mem mem, CreateImage3D, (this, flags, &format, width, height, depth, row_pitch, slice_pitch, ptr, &res));
339 cl_mem mem = clCreateImage3D (this, flags, &format, width, height,
340 depth, len / (height * slice_pitch), slice_pitch, ptr, &res);
341
342 if (res)
343 FAIL (CreateImage3D, res);
344
345 XPUSH_NEW_OBJ ("OpenCL::Image3D", mem); 350 XPUSH_NEW_OBJ ("OpenCL::Image3D", mem);
346}
347 351
348void 352void
349supported_image_formats (OpenCL::Context this, cl_mem_flags flags, cl_mem_object_type image_type) 353supported_image_formats (OpenCL::Context this, cl_mem_flags flags, cl_mem_object_type image_type)
350 PPCODE: 354 PPCODE:
351{ 355{
368} 372}
369 373
370void 374void
371sampler (OpenCL::Context this, cl_bool normalized_coords, cl_addressing_mode addressing_mode, cl_filter_mode filter_mode) 375sampler (OpenCL::Context this, cl_bool normalized_coords, cl_addressing_mode addressing_mode, cl_filter_mode filter_mode)
372 PPCODE: 376 PPCODE:
373{
374 cl_int res;
375 cl_sampler sampler = clCreateSampler (this, normalized_coords, addressing_mode, filter_mode, &res); 377 NEED_SUCCESS_ARG (cl_sampler sampler, CreateSampler, (this, normalized_coords, addressing_mode, filter_mode, &res));
376
377 if (res)
378 FAIL (CreateSampler, res);
379
380 XPUSH_NEW_OBJ ("OpenCL::Sampler", sampler); 378 XPUSH_NEW_OBJ ("OpenCL::Sampler", sampler);
381}
382 379
383void 380void
384program_with_source (OpenCL::Context this, SV *program) 381program_with_source (OpenCL::Context this, SV *program)
385 PPCODE: 382 PPCODE:
386{
387 STRLEN len; 383 STRLEN len;
388 size_t len2; 384 size_t len2;
389 const char *ptr = SvPVbyte (program, len); 385 const char *ptr = SvPVbyte (program, len);
390 cl_int res;
391 cl_program prog;
392 386
393 len2 = len; 387 len2 = len;
394 prog = clCreateProgramWithSource (this, 1, &ptr, &len2, &res); 388 NEED_SUCCESS_ARG (cl_program prog, CreateProgramWithSource, (this, 1, &ptr, &len2, &res));
395
396 if (res)
397 FAIL (CreateProgramWithSource, res);
398
399 XPUSH_NEW_OBJ ("OpenCL::Program", prog); 389 XPUSH_NEW_OBJ ("OpenCL::Program", prog);
400}
401 390
402MODULE = OpenCL PACKAGE = OpenCL::Queue 391MODULE = OpenCL PACKAGE = OpenCL::Queue
403 392
404void 393void
405DESTROY (OpenCL::Queue this) 394DESTROY (OpenCL::Queue this)
412 INFO (CommandQueue) 401 INFO (CommandQueue)
413 402
414void 403void
415enqueue_read_buffer (OpenCL::Queue this, OpenCL::Buffer mem, cl_bool blocking, size_t offset, size_t len, SV *data, ...) 404enqueue_read_buffer (OpenCL::Queue this, OpenCL::Buffer mem, cl_bool blocking, size_t offset, size_t len, SV *data, ...)
416 PPCODE: 405 PPCODE:
417{
418 cl_event ev = 0; 406 cl_event ev = 0;
419 EVENT_LIST (6, items - 6); 407 EVENT_LIST (6, items - 6);
420 408
421 SvUPGRADE (data, SVt_PV); 409 SvUPGRADE (data, SVt_PV);
422 SvGROW (data, len); 410 SvGROW (data, len);
424 SvCUR_set (data, len); 412 SvCUR_set (data, len);
425 NEED_SUCCESS (EnqueueReadBuffer, (this, mem, blocking, offset, len, SvPVX (data), event_list_count, event_list_ptr, GIMME_V != G_VOID ? &ev : 0)); 413 NEED_SUCCESS (EnqueueReadBuffer, (this, mem, blocking, offset, len, SvPVX (data), event_list_count, event_list_ptr, GIMME_V != G_VOID ? &ev : 0));
426 414
427 if (ev) 415 if (ev)
428 XPUSH_NEW_OBJ ("OpenCL::Event", ev); 416 XPUSH_NEW_OBJ ("OpenCL::Event", ev);
429}
430 417
431void 418void
432enqueue_write_buffer (OpenCL::Queue this, OpenCL::Buffer mem, cl_bool blocking, size_t offset, SV *data, ...) 419enqueue_write_buffer (OpenCL::Queue this, OpenCL::Buffer mem, cl_bool blocking, size_t offset, SV *data, ...)
433 PPCODE: 420 PPCODE:
434{
435 cl_event ev = 0; 421 cl_event ev = 0;
436 STRLEN len; 422 STRLEN len;
437 char *ptr = SvPVbyte (data, len); 423 char *ptr = SvPVbyte (data, len);
438 EVENT_LIST (5, items - 5); 424 EVENT_LIST (5, items - 5);
439 425
440 NEED_SUCCESS (EnqueueReadBuffer, (this, mem, blocking, offset, len, ptr, event_list_count, event_list_ptr, GIMME_V != G_VOID ? &ev : 0)); 426 NEED_SUCCESS (EnqueueReadBuffer, (this, mem, blocking, offset, len, ptr, event_list_count, event_list_ptr, GIMME_V != G_VOID ? &ev : 0));
441 427
442 if (ev) 428 if (ev)
443 XPUSH_NEW_OBJ ("OpenCL::Event", ev); 429 XPUSH_NEW_OBJ ("OpenCL::Event", ev);
444}
445 430
446void 431void
447enqueue_copy_buffer (OpenCL::Queue this, OpenCL::Buffer src, OpenCL::Buffer dst, size_t src_offset, size_t dst_offset, size_t len, ...) 432enqueue_copy_buffer (OpenCL::Queue this, OpenCL::Buffer src, OpenCL::Buffer dst, size_t src_offset, size_t dst_offset, size_t len, ...)
448 PPCODE: 433 PPCODE:
449{
450 cl_event ev = 0; 434 cl_event ev = 0;
451 EVENT_LIST (6, items - 6); 435 EVENT_LIST (6, items - 6);
452 436
453 NEED_SUCCESS (EnqueueCopyBuffer, (this, src, dst, src_offset, dst_offset, len, event_list_count, event_list_ptr, GIMME_V != G_VOID ? &ev : 0)); 437 NEED_SUCCESS (EnqueueCopyBuffer, (this, src, dst, src_offset, dst_offset, len, event_list_count, event_list_ptr, GIMME_V != G_VOID ? &ev : 0));
454 438
455 if (ev) 439 if (ev)
456 XPUSH_NEW_OBJ ("OpenCL::Event", ev); 440 XPUSH_NEW_OBJ ("OpenCL::Event", ev);
457}
458
459 /*TODO http://www.khronos.org/registry/cl/sdk/1.1/docs/man/xhtml/clEnqueueReadBufferRect.html */
460 /*TODO http://www.khronos.org/registry/cl/sdk/1.1/docs/man/xhtml/clEnqueueWriteBufferRect.html */
461 441
462void 442void
463enqueue_read_image (OpenCL::Queue this, OpenCL::Image src, cl_bool blocking, size_t src_x, size_t src_y, size_t src_z, size_t width, size_t height, size_t depth, size_t row_pitch, size_t slice_pitch, SV *data, ...) 443enqueue_read_image (OpenCL::Queue this, OpenCL::Image src, cl_bool blocking, size_t src_x, size_t src_y, size_t src_z, size_t width, size_t height, size_t depth, size_t row_pitch, size_t slice_pitch, SV *data, ...)
464 PPCODE: 444 PPCODE:
465{
466 cl_event ev = 0; 445 cl_event ev = 0;
467 const size_t src_origin[3] = { src_x, src_y, src_z }; 446 const size_t src_origin[3] = { src_x, src_y, src_z };
468 const size_t region[3] = { width, height, depth }; 447 const size_t region[3] = { width, height, depth };
469 size_t len = row_pitch * slice_pitch * depth;
470 EVENT_LIST (11, items - 11); 448 EVENT_LIST (12, items - 12);
449
450 if (!row_pitch)
451 row_pitch = img_row_pitch (src);
452
453 if (depth > 1 && !slice_pitch)
454 slice_pitch = row_pitch * height;
455
456 size_t len = slice_pitch ? slice_pitch * depth : row_pitch * height;
471 457
472 SvUPGRADE (data, SVt_PV); 458 SvUPGRADE (data, SVt_PV);
473 SvGROW (data, len); 459 SvGROW (data, len);
474 SvPOK_only (data); 460 SvPOK_only (data);
475 SvCUR_set (data, len); 461 SvCUR_set (data, len);
476 NEED_SUCCESS (EnqueueReadImage, (this, src, blocking, src_origin, region, row_pitch, slice_pitch, SvPVX (data), event_list_count, event_list_ptr, GIMME_V != G_VOID ? &ev : 0)); 462 NEED_SUCCESS (EnqueueReadImage, (this, src, blocking, src_origin, region, row_pitch, slice_pitch, SvPVX (data), event_list_count, event_list_ptr, GIMME_V != G_VOID ? &ev : 0));
477 463
478 if (ev) 464 if (ev)
479 XPUSH_NEW_OBJ ("OpenCL::Event", ev); 465 XPUSH_NEW_OBJ ("OpenCL::Event", ev);
480}
481 466
482void 467void
483enqueue_write_image (OpenCL::Queue this, OpenCL::Image dst, cl_bool blocking, size_t dst_x, size_t dst_y, size_t dst_z, size_t width, size_t height, size_t depth, size_t row_pitch, SV *data, ...) 468enqueue_write_image (OpenCL::Queue this, OpenCL::Image dst, cl_bool blocking, size_t dst_x, size_t dst_y, size_t dst_z, size_t width, size_t height, size_t depth, size_t row_pitch, size_t slice_pitch, SV *data, ...)
484 PPCODE: 469 PPCODE:
485{
486 cl_event ev = 0; 470 cl_event ev = 0;
487 const size_t dst_origin[3] = { dst_x, dst_y, dst_z }; 471 const size_t dst_origin[3] = { dst_x, dst_y, dst_z };
488 const size_t region[3] = { width, height, depth }; 472 const size_t region[3] = { width, height, depth };
489 STRLEN len; 473 STRLEN len;
490 char *ptr = SvPVbyte (data, len); 474 char *ptr = SvPVbyte (data, len);
491 size_t slice_pitch = len / (row_pitch * height);
492 EVENT_LIST (11, items - 11); 475 EVENT_LIST (12, items - 12);
476
477 if (!row_pitch)
478 row_pitch = img_row_pitch (dst);
479
480 if (depth > 1 && !slice_pitch)
481 slice_pitch = row_pitch * height;
482
483 size_t min_len = slice_pitch ? slice_pitch * depth : row_pitch * height;
484
485 if (len < min_len)
486 croak ("clEnqueueWriteImage: data string is shorter than what would be transferred");
493 487
494 NEED_SUCCESS (EnqueueWriteImage, (this, dst, blocking, dst_origin, region, row_pitch, slice_pitch, SvPVX (data), event_list_count, event_list_ptr, GIMME_V != G_VOID ? &ev : 0)); 488 NEED_SUCCESS (EnqueueWriteImage, (this, dst, blocking, dst_origin, region, row_pitch, slice_pitch, SvPVX (data), event_list_count, event_list_ptr, GIMME_V != G_VOID ? &ev : 0));
495 489
496 if (ev) 490 if (ev)
497 XPUSH_NEW_OBJ ("OpenCL::Event", ev); 491 XPUSH_NEW_OBJ ("OpenCL::Event", ev);
498}
499 492
500void 493void
501enqueue_copy_buffer_rect (OpenCL::Queue this, OpenCL::Buffer src, OpenCL::Buffer dst, size_t src_x, size_t src_y, size_t src_z, size_t dst_x, size_t dst_y, size_t dst_z, size_t width, size_t height, size_t depth, size_t src_row_pitch, size_t src_slice_pitch, size_t dst_row_pitch, size_t dst_slice_pitch, ...) 494enqueue_copy_buffer_rect (OpenCL::Queue this, OpenCL::Buffer src, OpenCL::Buffer dst, size_t src_x, size_t src_y, size_t src_z, size_t dst_x, size_t dst_y, size_t dst_z, size_t width, size_t height, size_t depth, size_t src_row_pitch, size_t src_slice_pitch, size_t dst_row_pitch, size_t dst_slice_pitch, ...)
502 PPCODE: 495 PPCODE:
503{
504 cl_event ev = 0; 496 cl_event ev = 0;
505 const size_t src_origin[3] = { src_x, src_y, src_z }; 497 const size_t src_origin[3] = { src_x, src_y, src_z };
506 const size_t dst_origin[3] = { dst_x, dst_y, dst_z }; 498 const size_t dst_origin[3] = { dst_x, dst_y, dst_z };
507 const size_t region[3] = { width, height, depth }; 499 const size_t region[3] = { width, height, depth };
508 EVENT_LIST (16, items - 16); 500 EVENT_LIST (16, items - 16);
509 501
510 NEED_SUCCESS (EnqueueCopyBufferRect, (this, src, dst, src_origin, dst_origin, region, src_row_pitch, src_slice_pitch, dst_row_pitch, dst_slice_pitch, event_list_count, event_list_ptr, GIMME_V != G_VOID ? &ev : 0)); 502 NEED_SUCCESS (EnqueueCopyBufferRect, (this, src, dst, src_origin, dst_origin, region, src_row_pitch, src_slice_pitch, dst_row_pitch, dst_slice_pitch, event_list_count, event_list_ptr, GIMME_V != G_VOID ? &ev : 0));
511 503
512 if (ev) 504 if (ev)
513 XPUSH_NEW_OBJ ("OpenCL::Event", ev); 505 XPUSH_NEW_OBJ ("OpenCL::Event", ev);
514}
515 506
516void 507void
517enqueue_copy_buffer_to_image (OpenCL::Queue this, OpenCL::Buffer src, OpenCL::Image dst, size_t src_offset, size_t dst_x, size_t dst_y, size_t dst_z, size_t width, size_t height, size_t depth, ...) 508enqueue_copy_buffer_to_image (OpenCL::Queue this, OpenCL::Buffer src, OpenCL::Image dst, size_t src_offset, size_t dst_x, size_t dst_y, size_t dst_z, size_t width, size_t height, size_t depth, ...)
518 PPCODE: 509 PPCODE:
519{
520 cl_event ev = 0; 510 cl_event ev = 0;
521 const size_t dst_origin[3] = { dst_x, dst_y, dst_z }; 511 const size_t dst_origin[3] = { dst_x, dst_y, dst_z };
522 const size_t region[3] = { width, height, depth }; 512 const size_t region[3] = { width, height, depth };
523 EVENT_LIST (10, items - 10); 513 EVENT_LIST (10, items - 10);
524 514
525 NEED_SUCCESS (EnqueueCopyBufferToImage, (this, src, dst, src_offset, dst_origin, region, event_list_count, event_list_ptr, GIMME_V != G_VOID ? &ev : 0)); 515 NEED_SUCCESS (EnqueueCopyBufferToImage, (this, src, dst, src_offset, dst_origin, region, event_list_count, event_list_ptr, GIMME_V != G_VOID ? &ev : 0));
526 516
527 if (ev) 517 if (ev)
528 XPUSH_NEW_OBJ ("OpenCL::Event", ev); 518 XPUSH_NEW_OBJ ("OpenCL::Event", ev);
529}
530 519
531void 520void
532enqueue_copy_image (OpenCL::Queue this, OpenCL::Image src, OpenCL::Buffer dst, size_t src_x, size_t src_y, size_t src_z, size_t dst_x, size_t dst_y, size_t dst_z, size_t width, size_t height, size_t depth, ...) 521enqueue_copy_image (OpenCL::Queue this, OpenCL::Image src, OpenCL::Image dst, size_t src_x, size_t src_y, size_t src_z, size_t dst_x, size_t dst_y, size_t dst_z, size_t width, size_t height, size_t depth, ...)
533 PPCODE: 522 PPCODE:
534{
535 cl_event ev = 0; 523 cl_event ev = 0;
536 const size_t src_origin[3] = { src_x, src_y, src_z }; 524 const size_t src_origin[3] = { src_x, src_y, src_z };
537 const size_t dst_origin[3] = { dst_x, dst_y, dst_z }; 525 const size_t dst_origin[3] = { dst_x, dst_y, dst_z };
538 const size_t region[3] = { width, height, depth }; 526 const size_t region[3] = { width, height, depth };
539 EVENT_LIST (12, items - 12); 527 EVENT_LIST (12, items - 12);
540 528
541 NEED_SUCCESS (EnqueueCopyImage, (this, src, dst, src_origin, dst_origin, region, event_list_count, event_list_ptr, GIMME_V != G_VOID ? &ev : 0)); 529 NEED_SUCCESS (EnqueueCopyImage, (this, src, dst, src_origin, dst_origin, region, event_list_count, event_list_ptr, GIMME_V != G_VOID ? &ev : 0));
542 530
543 if (ev) 531 if (ev)
544 XPUSH_NEW_OBJ ("OpenCL::Event", ev); 532 XPUSH_NEW_OBJ ("OpenCL::Event", ev);
545}
546 533
547void 534void
548enqueue_copy_image_to_buffer (OpenCL::Queue this, OpenCL::Image src, OpenCL::Buffer dst, size_t src_x, size_t src_y, size_t src_z, size_t width, size_t height, size_t depth, size_t dst_offset, ...) 535enqueue_copy_image_to_buffer (OpenCL::Queue this, OpenCL::Image src, OpenCL::Buffer dst, size_t src_x, size_t src_y, size_t src_z, size_t width, size_t height, size_t depth, size_t dst_offset, ...)
549 PPCODE: 536 PPCODE:
550{
551 cl_event ev = 0; 537 cl_event ev = 0;
552 const size_t src_origin[3] = { src_x, src_y, src_z }; 538 const size_t src_origin[3] = { src_x, src_y, src_z };
553 const size_t region[3] = { width, height, depth }; 539 const size_t region[3] = { width, height, depth };
554 EVENT_LIST (10, items - 10); 540 EVENT_LIST (10, items - 10);
555 541
556 NEED_SUCCESS (EnqueueCopyImageToBuffer, (this, src, dst, src_origin, region, dst_offset, event_list_count, event_list_ptr, GIMME_V != G_VOID ? &ev : 0)); 542 NEED_SUCCESS (EnqueueCopyImageToBuffer, (this, src, dst, src_origin, region, dst_offset, event_list_count, event_list_ptr, GIMME_V != G_VOID ? &ev : 0));
557 543
558 if (ev) 544 if (ev)
559 XPUSH_NEW_OBJ ("OpenCL::Event", ev); 545 XPUSH_NEW_OBJ ("OpenCL::Event", ev);
560}
561 546
562void 547void
563enqueue_task (OpenCL::Queue this, OpenCL::Kernel kernel, ...) 548enqueue_task (OpenCL::Queue this, OpenCL::Kernel kernel, ...)
564 PPCODE: 549 PPCODE:
565{
566 cl_event ev = 0; 550 cl_event ev = 0;
567 EVENT_LIST (2, items - 2); 551 EVENT_LIST (2, items - 2);
568 552
569 NEED_SUCCESS (EnqueueTask, (this, kernel, event_list_count, event_list_ptr, GIMME_V != G_VOID ? &ev : 0)); 553 NEED_SUCCESS (EnqueueTask, (this, kernel, event_list_count, event_list_ptr, GIMME_V != G_VOID ? &ev : 0));
570 554
571 if (ev) 555 if (ev)
572 XPUSH_NEW_OBJ ("OpenCL::Event", ev); 556 XPUSH_NEW_OBJ ("OpenCL::Event", ev);
573}
574 557
575void 558void
576enqueue_nd_range_kernel (OpenCL::Queue this, OpenCL::Kernel kernel, SV *global_work_offset, SV *global_work_size, SV *local_work_size = &PL_sv_undef, ...) 559enqueue_nd_range_kernel (OpenCL::Queue this, OpenCL::Kernel kernel, SV *global_work_offset, SV *global_work_size, SV *local_work_size = &PL_sv_undef, ...)
577 PPCODE: 560 PPCODE:
578{
579 cl_event ev = 0; 561 cl_event ev = 0;
580 size_t *gwo = 0, *gws, *lws = 0; 562 size_t *gwo = 0, *gws, *lws = 0;
581 int gws_len; 563 int gws_len;
582 size_t *lists; 564 size_t *lists;
583 int i; 565 int i;
584 EVENT_LIST (2, items - 2); 566 EVENT_LIST (5, items - 5);
585 567
586 if (!SvROK (global_work_size) || SvTYPE (SvRV (global_work_size)) != SVt_PVAV) 568 if (!SvROK (global_work_size) || SvTYPE (SvRV (global_work_size)) != SVt_PVAV)
587 croak ("clEnqueueNDRangeKernel: global_work_size must be an array reference"); 569 croak ("clEnqueueNDRangeKernel: global_work_size must be an array reference");
588 570
589 gws_len = AvFILLp (SvRV (global_work_size)) + 1; 571 gws_len = AvFILLp (SvRV (global_work_size)) + 1;
622 604
623 NEED_SUCCESS (EnqueueNDRangeKernel, (this, kernel, gws_len, gwo, gws, lws, event_list_count, event_list_ptr, GIMME_V != G_VOID ? &ev : 0)); 605 NEED_SUCCESS (EnqueueNDRangeKernel, (this, kernel, gws_len, gwo, gws, lws, event_list_count, event_list_ptr, GIMME_V != G_VOID ? &ev : 0));
624 606
625 if (ev) 607 if (ev)
626 XPUSH_NEW_OBJ ("OpenCL::Event", ev); 608 XPUSH_NEW_OBJ ("OpenCL::Event", ev);
627}
628 609
629void 610void
630enqueue_marker (OpenCL::Queue this) 611enqueue_marker (OpenCL::Queue this)
631 PPCODE: 612 PPCODE:
632{
633 cl_event ev; 613 cl_event ev;
634 NEED_SUCCESS (EnqueueMarker, (this, &ev)); 614 NEED_SUCCESS (EnqueueMarker, (this, &ev));
635 XPUSH_NEW_OBJ ("OpenCL::Event", ev); 615 XPUSH_NEW_OBJ ("OpenCL::Event", ev);
636}
637 616
638void 617void
639enqueue_wait_for_events (OpenCL::Queue this, ...) 618enqueue_wait_for_events (OpenCL::Queue this, ...)
640 CODE: 619 CODE:
641{
642 EVENT_LIST (1, items - 1); 620 EVENT_LIST (1, items - 1);
643 NEED_SUCCESS (EnqueueWaitForEvents, (this, event_list_count, event_list_ptr)); 621 NEED_SUCCESS (EnqueueWaitForEvents, (this, event_list_count, event_list_ptr));
644}
645 622
646void 623void
647enqueue_barrier (OpenCL::Queue this) 624enqueue_barrier (OpenCL::Queue this)
648 CODE: 625 CODE:
649 NEED_SUCCESS (EnqueueBarrier, (this)); 626 NEED_SUCCESS (EnqueueBarrier, (this));
700 NEED_SUCCESS (BuildProgram, (this, 1, &device, SvPVbyte_nolen (options), 0, 0)); 677 NEED_SUCCESS (BuildProgram, (this, 1, &device, SvPVbyte_nolen (options), 0, 0));
701 678
702void 679void
703build_info (OpenCL::Program this, OpenCL::Device device, cl_program_build_info name) 680build_info (OpenCL::Program this, OpenCL::Device device, cl_program_build_info name)
704 PPCODE: 681 PPCODE:
705{
706 size_t size; 682 size_t size;
707 SV *sv;
708
709 NEED_SUCCESS (GetProgramBuildInfo, (this, device, name, 0, 0, &size)); 683 NEED_SUCCESS (GetProgramBuildInfo, (this, device, name, 0, 0, &size));
710 sv = sv_2mortal (newSV (size)); 684 SV *sv = sv_2mortal (newSV (size));
711 SvUPGRADE (sv, SVt_PV); 685 SvUPGRADE (sv, SVt_PV);
712 SvPOK_only (sv); 686 SvPOK_only (sv);
713 SvCUR_set (sv, size); 687 SvCUR_set (sv, size);
714 NEED_SUCCESS (GetProgramBuildInfo, (this, device, name, size, SvPVX (sv), 0)); 688 NEED_SUCCESS (GetProgramBuildInfo, (this, device, name, size, SvPVX (sv), 0));
715 XPUSHs (sv); 689 XPUSHs (sv);
716}
717 690
718void 691void
719kernel (OpenCL::Program program, SV *function) 692kernel (OpenCL::Program program, SV *function)
720 PPCODE: 693 PPCODE:
721{
722 cl_int res;
723 cl_kernel kernel = clCreateKernel (program, SvPVbyte_nolen (function), &res); 694 NEED_SUCCESS_ARG (cl_kernel kernel, CreateKernel, (program, SvPVbyte_nolen (function), &res));
724
725 if (res)
726 FAIL (CreateKernel, res);
727
728 XPUSH_NEW_OBJ ("OpenCL::Kernel", kernel); 695 XPUSH_NEW_OBJ ("OpenCL::Kernel", kernel);
729}
730 696
731MODULE = OpenCL PACKAGE = OpenCL::Kernel 697MODULE = OpenCL PACKAGE = OpenCL::Kernel
732 698
733void 699void
734DESTROY (OpenCL::Kernel this) 700DESTROY (OpenCL::Kernel this)
789set_float (OpenCL::Kernel this, cl_uint idx, cl_float value) 755set_float (OpenCL::Kernel this, cl_uint idx, cl_float value)
790 CODE: 756 CODE:
791 clSetKernelArg (this, idx, sizeof (value), &value); 757 clSetKernelArg (this, idx, sizeof (value), &value);
792 758
793void 759void
760set_double (OpenCL::Kernel this, cl_uint idx, cl_double value)
761 CODE:
762 clSetKernelArg (this, idx, sizeof (value), &value);
763
764void
794set_memory (OpenCL::Kernel this, cl_uint idx, OpenCL::Memory_ornull value) 765set_memory (OpenCL::Kernel this, cl_uint idx, OpenCL::Memory_ornull value)
795 CODE: 766 CODE:
796 clSetKernelArg (this, idx, sizeof (value), &value); 767 clSetKernelArg (this, idx, sizeof (value), &value);
797 768
798void 769void
835void 806void
836wait (OpenCL::Event this) 807wait (OpenCL::Event this)
837 CODE: 808 CODE:
838 clWaitForEvents (1, &this); 809 clWaitForEvents (1, &this);
839 810
811MODULE = OpenCL PACKAGE = OpenCL::UserEvent
812
813void
814set_status (OpenCL::UserEvent this, cl_int execution_status)
815 CODE:
816 clSetUserEventStatus (this, execution_status);
817

Diff Legend

Removed lines
+ Added lines
< Changed lines
> Changed lines