ViewVC Help
View File | Revision Log | Show Annotations | Download File
/cvs/OpenCL/OpenCL.xs
(Generate patch)

Comparing OpenCL/OpenCL.xs (file contents):
Revision 1.4 by root, Tue Nov 15 21:13:42 2011 UTC vs.
Revision 1.10 by root, Thu Nov 17 03:56:07 2011 UTC

20typedef cl_mem OpenCL__Image3D_ornull; 20typedef cl_mem OpenCL__Image3D_ornull;
21typedef cl_sampler OpenCL__Sampler; 21typedef cl_sampler OpenCL__Sampler;
22typedef cl_program OpenCL__Program; 22typedef cl_program OpenCL__Program;
23typedef cl_kernel OpenCL__Kernel; 23typedef cl_kernel OpenCL__Kernel;
24typedef cl_event OpenCL__Event; 24typedef cl_event OpenCL__Event;
25typedef cl_event OpenCL__UserEvent;
26
27typedef SV *FUTURE;
28
29/*****************************************************************************/
30
31/* up to two temporary buffers */
32static void *
33tmpbuf (size_t size)
34{
35 static int idx;
36 static void *buf [2];
37 static size_t len [2];
38
39 idx ^= 1;
40
41 if (len [idx] < size)
42 {
43 free (buf [idx]);
44 len [idx] = ((size + 31) & ~4095) + 4096 - 32;
45 buf [idx] = malloc (len [idx]);
46 }
47
48 return buf [idx];
49}
50
51/*****************************************************************************/
25 52
26typedef struct 53typedef struct
27{ 54{
28 IV iv; 55 IV iv;
29 const char *name; 56 const char *name;
63 }; 90 };
64 91
65 return iv2str (err, errstr, sizeof (errstr) / sizeof (errstr [0]), "ERROR(%d)"); 92 return iv2str (err, errstr, sizeof (errstr) / sizeof (errstr [0]), "ERROR(%d)");
66} 93}
67 94
95/*****************************************************************************/
96
97static cl_int res;
98
68#define FAIL(name,res) \ 99#define FAIL(name) \
69 croak ("cl" # name ": %s", err2str (res)); 100 croak ("cl" # name ": %s", err2str (res));
70 101
71#define NEED_SUCCESS(name,args) \ 102#define NEED_SUCCESS(name,args) \
72 do { \ 103 do { \
73 cl_int res = cl ## name args; \ 104 res = cl ## name args; \
74 \ 105 \
75 if (res) \ 106 if (res) \
76 FAIL (name, res); \ 107 FAIL (name); \
77 } while (0) 108 } while (0)
109
110#define NEED_SUCCESS_ARG(retdecl, name, args) \
111 retdecl = cl ## name args; \
112 if (res) \
113 FAIL (name);
114
115/*****************************************************************************/
78 116
79#define NEW_MORTAL_OBJ(class,ptr) sv_setref_pv (sv_newmortal (), class, ptr) 117#define NEW_MORTAL_OBJ(class,ptr) sv_setref_pv (sv_newmortal (), class, ptr)
80#define XPUSH_NEW_OBJ(class,ptr) XPUSHs (NEW_MORTAL_OBJ (class, ptr)) 118#define XPUSH_NEW_OBJ(class,ptr) XPUSHs (NEW_MORTAL_OBJ (class, ptr))
81 119
82/*TODO*/ 120static void *
83#define EVENT_LIST(items,count) cl_uint event_list_count = 0; cl_event *event_list_ptr = 0 121SvPTROBJ (const char *func, const char *svname, SV *sv, const char *pkg)
122{
123 if (SvROK (sv) && sv_derived_from (sv, pkg))
124 return (void *)SvIV (SvRV (sv));
125
126 croak ("%s: %s is not of type %s", func, svname, pkg);
127}
128
129/*****************************************************************************/
130
131static cl_event *
132event_list (SV **items, int count)
133{
134 cl_event *list = tmpbuf (sizeof (cl_event) * count);
135
136 while (count--)
137 list [count] = SvPTROBJ ("clEnqueue", "wait_events", items [count], "OpenCL::Event");
138
139 return list;
140}
141
142#define EVENT_LIST(items,count) \
143 cl_uint event_list_count = (count); \
144 cl_event *event_list_ptr = event_list (&ST (items), event_list_count)
84 145
85#define INFO(class) \ 146#define INFO(class) \
86{ \ 147{ \
87 size_t size; \ 148 size_t size; \
88 SV *sv; \
89 \
90 NEED_SUCCESS (Get ## class ## Info, (this, name, 0, 0, &size)); \ 149 NEED_SUCCESS (Get ## class ## Info, (this, name, 0, 0, &size)); \
91 sv = sv_2mortal (newSV (size)); \ 150 SV *sv = sv_2mortal (newSV (size)); \
92 SvUPGRADE (sv, SVt_PV); \ 151 SvUPGRADE (sv, SVt_PV); \
93 SvPOK_only (sv); \ 152 SvPOK_only (sv); \
94 SvCUR_set (sv, size); \ 153 SvCUR_set (sv, size); \
95 NEED_SUCCESS (Get ## class ## Info, (this, name, size, SvPVX (sv), 0)); \ 154 NEED_SUCCESS (Get ## class ## Info, (this, name, size, SvPVX (sv), 0)); \
96 XPUSHs (sv); \ 155 XPUSHs (sv); \
97} 156}
98 157
99static void *
100SvPTROBJ (const char *func, const char *svname, SV *sv, const char *pkg)
101{
102 if (SvROK (sv) && sv_derived_from (sv, pkg))
103 return (void *)SvIV (SvRV (sv));
104
105 croak ("%s: %s is not of type %s", func, svname, pkg);
106}
107
108static void *
109tmpbuf (size_t size)
110{
111 static void *buf;
112 static size_t len;
113
114 if (len < size)
115 {
116 free (buf);
117 len = ((size + 31) & ~4095) + 4096 - 32;
118 buf = malloc (len);
119 }
120
121 return buf;
122}
123
124MODULE = OpenCL PACKAGE = OpenCL 158MODULE = OpenCL PACKAGE = OpenCL
125 159
126PROTOTYPES: ENABLE 160PROTOTYPES: ENABLE
127 161
128BOOT: 162BOOT:
129{ 163{
130 HV *stash = gv_stashpv ("OpenCL", 1); 164 HV *stash = gv_stashpv ("OpenCL", 1);
131 static const ivstr *civ, const_iv[] = { 165 static const ivstr *civ, const_iv[] = {
132 { sizeof (cl_char ), "SIZEOF_CHAR" }, 166 { sizeof (cl_char ), "SIZEOF_CHAR" },
133 { sizeof (cl_uchar ), "SIZEOF_UCHAR" }, 167 { sizeof (cl_uchar ), "SIZEOF_UCHAR" },
134 { sizeof (cl_short ), "SIZEOF_SHORT" }, 168 { sizeof (cl_short ), "SIZEOF_SHORT" },
135 { sizeof (cl_ushort), "SIZEOF_USHORT"}, 169 { sizeof (cl_ushort), "SIZEOF_USHORT" },
136 { sizeof (cl_int ), "SIZEOF_INT" }, 170 { sizeof (cl_int ), "SIZEOF_INT" },
137 { sizeof (cl_uint ), "SIZEOF_UINT" }, 171 { sizeof (cl_uint ), "SIZEOF_UINT" },
138 { sizeof (cl_long ), "SIZEOF_LONG" }, 172 { sizeof (cl_long ), "SIZEOF_LONG" },
139 { sizeof (cl_ulong ), "SIZEOF_ULONG" }, 173 { sizeof (cl_ulong ), "SIZEOF_ULONG" },
140 { sizeof (cl_half ), "SIZEOF_HALF" }, 174 { sizeof (cl_half ), "SIZEOF_HALF" },
141 { sizeof (cl_float ), "SIZEOF_FLOAT" }, 175 { sizeof (cl_float ), "SIZEOF_FLOAT" },
176 { sizeof (cl_double), "SIZEOF_DOUBLE" },
142#include "constiv.h" 177#include "constiv.h"
143 }; 178 };
144 for (civ = const_iv + sizeof (const_iv) / sizeof (const_iv [0]); civ > const_iv; civ--) 179 for (civ = const_iv + sizeof (const_iv) / sizeof (const_iv [0]); civ > const_iv; civ--)
145 newCONSTSUB (stash, (char *)civ[-1].name, newSViv (civ[-1].iv)); 180 newCONSTSUB (stash, (char *)civ[-1].name, newSViv (civ[-1].iv));
146} 181}
147 182
183cl_int
184errno ()
185 CODE:
186 errno = res;
187
148const char * 188const char *
149err2str (cl_int err) 189err2str (cl_int err)
150 190
151const char * 191const char *
152enum2str (cl_uint value) 192enum2str (cl_uint value)
153 193
154void 194void
155platforms () 195platforms ()
156 PPCODE: 196 PPCODE:
157{
158 cl_platform_id *list; 197 cl_platform_id *list;
159 cl_uint count; 198 cl_uint count;
160 int i; 199 int i;
161 200
162 NEED_SUCCESS (GetPlatformIDs, (0, 0, &count)); 201 NEED_SUCCESS (GetPlatformIDs, (0, 0, &count));
164 NEED_SUCCESS (GetPlatformIDs, (count, list, 0)); 203 NEED_SUCCESS (GetPlatformIDs, (count, list, 0));
165 204
166 EXTEND (SP, count); 205 EXTEND (SP, count);
167 for (i = 0; i < count; ++i) 206 for (i = 0; i < count; ++i)
168 PUSHs (NEW_MORTAL_OBJ ("OpenCL::Platform", list [i])); 207 PUSHs (NEW_MORTAL_OBJ ("OpenCL::Platform", list [i]));
169}
170 208
171void 209void
172context_from_type_simple (cl_device_type type = CL_DEVICE_TYPE_DEFAULT) 210context_from_type (FUTURE properties = 0, cl_device_type type = CL_DEVICE_TYPE_DEFAULT, FUTURE notify = 0)
173 PPCODE: 211 PPCODE:
174{
175 cl_int res;
176 cl_context ctx = clCreateContextFromType (0, type, 0, 0, &res); 212 NEED_SUCCESS_ARG (cl_context ctx, CreateContextFromType, (0, type, 0, 0, &res));
177
178 if (res)
179 FAIL (CreateContextFromType, res);
180
181 XPUSH_NEW_OBJ ("OpenCL::Context", ctx); 213 XPUSH_NEW_OBJ ("OpenCL::Context", ctx);
182} 214
215void
216context (FUTURE properties, FUTURE devices, FUTURE notify = 0)
217 PPCODE:
218 /* der Gipfel der Kunst */
183 219
184void 220void
185wait_for_events (...) 221wait_for_events (...)
186 CODE: 222 CODE:
187{
188 EVENT_LIST (0, items); 223 EVENT_LIST (0, items);
189 NEED_SUCCESS (WaitForEvents, (event_list_count, event_list_ptr)); 224 NEED_SUCCESS (WaitForEvents, (event_list_count, event_list_ptr));
190}
191 225
192PROTOTYPES: DISABLE 226PROTOTYPES: DISABLE
193 227
194MODULE = OpenCL PACKAGE = OpenCL::Platform 228MODULE = OpenCL PACKAGE = OpenCL::Platform
195 229
199 INFO (Platform) 233 INFO (Platform)
200 234
201void 235void
202devices (OpenCL::Platform this, cl_device_type type = CL_DEVICE_TYPE_ALL) 236devices (OpenCL::Platform this, cl_device_type type = CL_DEVICE_TYPE_ALL)
203 PPCODE: 237 PPCODE:
204{
205 cl_device_id *list; 238 cl_device_id *list;
206 cl_uint count; 239 cl_uint count;
207 int i; 240 int i;
208 241
209 NEED_SUCCESS (GetDeviceIDs, (this, type, 0, 0, &count)); 242 NEED_SUCCESS (GetDeviceIDs, (this, type, 0, 0, &count));
211 NEED_SUCCESS (GetDeviceIDs, (this, type, count, list, 0)); 244 NEED_SUCCESS (GetDeviceIDs, (this, type, count, list, 0));
212 245
213 EXTEND (SP, count); 246 EXTEND (SP, count);
214 for (i = 0; i < count; ++i) 247 for (i = 0; i < count; ++i)
215 PUSHs (sv_setref_pv (sv_newmortal (), "OpenCL::Device", list [i])); 248 PUSHs (sv_setref_pv (sv_newmortal (), "OpenCL::Device", list [i]));
216}
217 249
218void 250void
251context (OpenCL::Platform this, FUTURE properties, SV *devices, FUTURE notify = 0)
252 PPCODE:
253 if (!SvROK (devices) || SvTYPE (SvRV (devices)) != SVt_PVAV)
254 croak ("OpenCL::Platform argument 'device' must be an arrayref with device objects, in call");
255
256 AV *av = (SV *)SvRV (devices);
257 cl_uint num_devices = av_len (av) + 1;
258 cl_device_id *device_list = tmpbuf (sizeof (cl_device_id) * num_devices);
259 int i;
260
261 for (i = num_devices; i--; )
262 device_list [i] = SvPTROBJ ("clCreateContext", "devices", *av_fetch (av, i, 0), "OpenCL::Device");
263
264 NEED_SUCCESS_ARG (cl_context ctx, CreateContext, (0, num_devices, device_list, 0, 0, &res));
265 XPUSH_NEW_OBJ ("OpenCL::Context", ctx);
266
267void
219context_from_type_simple (OpenCL::Platform this, cl_device_type type = CL_DEVICE_TYPE_DEFAULT) 268context_from_type (OpenCL::Platform this, FUTURE properties = 0, cl_device_type type = CL_DEVICE_TYPE_DEFAULT, FUTURE notify = 0)
220 PPCODE: 269 PPCODE:
221{
222 cl_int res;
223 cl_context_properties props[] = { CL_CONTEXT_PLATFORM, (cl_context_properties)this, 0 }; 270 cl_context_properties props[] = { CL_CONTEXT_PLATFORM, (cl_context_properties)this, 0 };
224 cl_context ctx = clCreateContextFromType (props, type, 0, 0, &res); 271 NEED_SUCCESS_ARG (cl_context ctx, CreateContextFromType, (props, type, 0, 0, &res));
225
226 if (res)
227 FAIL (CreateContextFromType, res);
228
229 XPUSH_NEW_OBJ ("OpenCL::Context", ctx); 272 XPUSH_NEW_OBJ ("OpenCL::Context", ctx);
230}
231 273
232MODULE = OpenCL PACKAGE = OpenCL::Device 274MODULE = OpenCL PACKAGE = OpenCL::Device
233 275
234void 276void
235info (OpenCL::Device this, cl_device_info name) 277info (OpenCL::Device this, cl_device_info name)
236 PPCODE: 278 PPCODE:
237 INFO (Device) 279 INFO (Device)
238 280
239void
240context_simple (OpenCL::Device this)
241 PPCODE:
242{
243 cl_int res;
244 cl_context ctx = clCreateContext (0, 1, &this, 0, 0, &res);
245
246 if (res)
247 FAIL (CreateContext, res);
248
249 XPUSH_NEW_OBJ ("OpenCL::Context", ctx);
250}
251
252MODULE = OpenCL PACKAGE = OpenCL::Context 281MODULE = OpenCL PACKAGE = OpenCL::Context
253 282
254void 283void
255DESTROY (OpenCL::Context context) 284DESTROY (OpenCL::Context context)
256 CODE: 285 CODE:
260info (OpenCL::Context this, cl_context_info name) 289info (OpenCL::Context this, cl_context_info name)
261 PPCODE: 290 PPCODE:
262 INFO (Context) 291 INFO (Context)
263 292
264void 293void
265command_queue_simple (OpenCL::Context this, OpenCL::Device device) 294queue (OpenCL::Context this, OpenCL::Device device, cl_command_queue_properties properties = 0)
266 PPCODE: 295 PPCODE:
267{
268 cl_int res;
269 cl_command_queue queue = clCreateCommandQueue (this, device, 0, &res); 296 NEED_SUCCESS_ARG (cl_command_queue queue, CreateCommandQueue, (this, device, properties, &res));
270
271 if (res)
272 FAIL (CreateCommandQueue, res);
273
274 XPUSH_NEW_OBJ ("OpenCL::Queue", queue); 297 XPUSH_NEW_OBJ ("OpenCL::Queue", queue);
275} 298
299void
300user_event (OpenCL::Context this)
301 PPCODE:
302 NEED_SUCCESS_ARG (cl_event ev, CreateUserEvent, (this, &res));
303 XPUSH_NEW_OBJ ("OpenCL::UserEvent", ev);
276 304
277void 305void
278buffer (OpenCL::Context this, cl_mem_flags flags, size_t len) 306buffer (OpenCL::Context this, cl_mem_flags flags, size_t len)
279 PPCODE: 307 PPCODE:
280{
281 cl_int res;
282 cl_mem mem;
283
284 if (flags & (CL_MEM_USE_HOST_PTR | CL_MEM_COPY_HOST_PTR)) 308 if (flags & (CL_MEM_USE_HOST_PTR | CL_MEM_COPY_HOST_PTR))
285 croak ("clCreateBuffer: cannot use/copy host ptr when no data is given, use $context->buffer_sv instead?"); 309 croak ("clCreateBuffer: cannot use/copy host ptr when no data is given, use $context->buffer_sv instead?");
286 310
287 mem = clCreateBuffer (this, flags, len, 0, &res); 311 NEED_SUCCESS_ARG (cl_mem mem, CreateBuffer, (this, flags, len, 0, &res));
288
289 if (res)
290 FAIL (CreateBuffer, res);
291
292 XPUSH_NEW_OBJ ("OpenCL::Buffer", mem); 312 XPUSH_NEW_OBJ ("OpenCL::Buffer", mem);
293}
294 313
295void 314void
296buffer_sv (OpenCL::Context this, cl_mem_flags flags, SV *data) 315buffer_sv (OpenCL::Context this, cl_mem_flags flags, SV *data)
297 PPCODE: 316 PPCODE:
298{
299 STRLEN len; 317 STRLEN len;
300 char *ptr = SvPVbyte (data, len); 318 char *ptr = SvPVbyte (data, len);
301 cl_int res;
302 cl_mem mem;
303 319
304 if (!(flags & (CL_MEM_USE_HOST_PTR | CL_MEM_COPY_HOST_PTR))) 320 if (!(flags & (CL_MEM_USE_HOST_PTR | CL_MEM_COPY_HOST_PTR)))
305 croak ("clCreateBuffer: have to specify use or copy host ptr when buffer data is given, use $context->buffer instead?"); 321 croak ("clCreateBuffer: have to specify use or copy host ptr when buffer data is given, use $context->buffer instead?");
306 322
307 mem = clCreateBuffer (this, flags, len, ptr, &res); 323 NEED_SUCCESS_ARG (cl_mem mem, CreateBuffer, (this, flags, len, ptr, &res));
308
309 if (res)
310 FAIL (CreateBuffer, res);
311
312 XPUSH_NEW_OBJ ("OpenCL::Buffer", mem); 324 XPUSH_NEW_OBJ ("OpenCL::Buffer", mem);
313}
314 325
315void 326void
316image2d (OpenCL::Context this, cl_mem_flags flags, cl_channel_order channel_order, cl_channel_type channel_type, size_t width, size_t height, SV *data) 327image2d (OpenCL::Context this, cl_mem_flags flags, cl_channel_order channel_order, cl_channel_type channel_type, size_t width, size_t height, size_t row_pitch, SV *data)
317 PPCODE: 328 PPCODE:
318{
319 STRLEN len; 329 STRLEN len;
320 char *ptr = SvPVbyte (data, len); 330 char *ptr = SvPVbyte (data, len);
321 const cl_image_format format = { channel_order, channel_type }; 331 const cl_image_format format = { channel_order, channel_type };
322 cl_int res;
323 cl_mem mem = clCreateImage2D (this, flags, &format, width, height, len / height, ptr, &res); 332 NEED_SUCCESS_ARG (cl_mem mem, CreateImage2D, (this, flags, &format, width, height, row_pitch, ptr, &res));
324
325 if (res)
326 FAIL (CreateImage2D, res);
327
328 XPUSH_NEW_OBJ ("OpenCL::Image2D", mem); 333 XPUSH_NEW_OBJ ("OpenCL::Image2D", mem);
329}
330 334
331void 335void
332image3d (OpenCL::Context this, cl_mem_flags flags, cl_channel_order channel_order, cl_channel_type channel_type, size_t width, size_t height, size_t depth, size_t slice_pitch, SV *data) 336image3d (OpenCL::Context this, cl_mem_flags flags, cl_channel_order channel_order, cl_channel_type channel_type, size_t width, size_t height, size_t depth, size_t row_pitch, size_t slice_pitch, SV *data)
333 PPCODE: 337 PPCODE:
334{
335 STRLEN len; 338 STRLEN len;
336 char *ptr = SvPVbyte (data, len); 339 char *ptr = SvPVbyte (data, len);
337 const cl_image_format format = { channel_order, channel_type }; 340 const cl_image_format format = { channel_order, channel_type };
338 cl_int res; 341 NEED_SUCCESS_ARG (cl_mem mem, CreateImage3D, (this, flags, &format, width, height, depth, row_pitch, slice_pitch, ptr, &res));
339 cl_mem mem = clCreateImage3D (this, flags, &format, width, height,
340 depth, len / (height * slice_pitch), slice_pitch, ptr, &res);
341
342 if (res)
343 FAIL (CreateImage3D, res);
344
345 XPUSH_NEW_OBJ ("OpenCL::Image3D", mem); 342 XPUSH_NEW_OBJ ("OpenCL::Image3D", mem);
346}
347 343
348void 344void
349supported_image_formats (OpenCL::Context this, cl_mem_flags flags, cl_mem_object_type image_type) 345supported_image_formats (OpenCL::Context this, cl_mem_flags flags, cl_mem_object_type image_type)
350 PPCODE: 346 PPCODE:
351{ 347{
368} 364}
369 365
370void 366void
371sampler (OpenCL::Context this, cl_bool normalized_coords, cl_addressing_mode addressing_mode, cl_filter_mode filter_mode) 367sampler (OpenCL::Context this, cl_bool normalized_coords, cl_addressing_mode addressing_mode, cl_filter_mode filter_mode)
372 PPCODE: 368 PPCODE:
373{
374 cl_int res;
375 cl_sampler sampler = clCreateSampler (this, normalized_coords, addressing_mode, filter_mode, &res); 369 NEED_SUCCESS_ARG (cl_sampler sampler, CreateSampler, (this, normalized_coords, addressing_mode, filter_mode, &res));
376
377 if (res)
378 FAIL (CreateSampler, res);
379
380 XPUSH_NEW_OBJ ("OpenCL::Sampler", sampler); 370 XPUSH_NEW_OBJ ("OpenCL::Sampler", sampler);
381}
382 371
383void 372void
384program_with_source (OpenCL::Context this, SV *program) 373program_with_source (OpenCL::Context this, SV *program)
385 PPCODE: 374 PPCODE:
386{
387 STRLEN len; 375 STRLEN len;
388 size_t len2; 376 size_t len2;
389 const char *ptr = SvPVbyte (program, len); 377 const char *ptr = SvPVbyte (program, len);
390 cl_int res;
391 cl_program prog;
392 378
393 len2 = len; 379 len2 = len;
394 prog = clCreateProgramWithSource (this, 1, &ptr, &len2, &res); 380 NEED_SUCCESS_ARG (cl_program prog, CreateProgramWithSource, (this, 1, &ptr, &len2, &res));
395
396 if (res)
397 FAIL (CreateProgramWithSource, res);
398
399 XPUSH_NEW_OBJ ("OpenCL::Program", prog); 381 XPUSH_NEW_OBJ ("OpenCL::Program", prog);
400}
401 382
402MODULE = OpenCL PACKAGE = OpenCL::Queue 383MODULE = OpenCL PACKAGE = OpenCL::Queue
403 384
404void 385void
405DESTROY (OpenCL::Queue this) 386DESTROY (OpenCL::Queue this)
412 INFO (CommandQueue) 393 INFO (CommandQueue)
413 394
414void 395void
415enqueue_read_buffer (OpenCL::Queue this, OpenCL::Buffer mem, cl_bool blocking, size_t offset, size_t len, SV *data, ...) 396enqueue_read_buffer (OpenCL::Queue this, OpenCL::Buffer mem, cl_bool blocking, size_t offset, size_t len, SV *data, ...)
416 PPCODE: 397 PPCODE:
417{
418 cl_event ev = 0; 398 cl_event ev = 0;
419 EVENT_LIST (6, items - 6); 399 EVENT_LIST (6, items - 6);
420 400
421 SvUPGRADE (data, SVt_PV); 401 SvUPGRADE (data, SVt_PV);
422 SvGROW (data, len); 402 SvGROW (data, len);
424 SvCUR_set (data, len); 404 SvCUR_set (data, len);
425 NEED_SUCCESS (EnqueueReadBuffer, (this, mem, blocking, offset, len, SvPVX (data), event_list_count, event_list_ptr, GIMME_V != G_VOID ? &ev : 0)); 405 NEED_SUCCESS (EnqueueReadBuffer, (this, mem, blocking, offset, len, SvPVX (data), event_list_count, event_list_ptr, GIMME_V != G_VOID ? &ev : 0));
426 406
427 if (ev) 407 if (ev)
428 XPUSH_NEW_OBJ ("OpenCL::Event", ev); 408 XPUSH_NEW_OBJ ("OpenCL::Event", ev);
429}
430 409
431void 410void
432enqueue_write_buffer (OpenCL::Queue this, OpenCL::Buffer mem, cl_bool blocking, size_t offset, SV *data, ...) 411enqueue_write_buffer (OpenCL::Queue this, OpenCL::Buffer mem, cl_bool blocking, size_t offset, SV *data, ...)
433 PPCODE: 412 PPCODE:
434{
435 cl_event ev = 0; 413 cl_event ev = 0;
436 STRLEN len; 414 STRLEN len;
437 char *ptr = SvPVbyte (data, len); 415 char *ptr = SvPVbyte (data, len);
438 EVENT_LIST (5, items - 5); 416 EVENT_LIST (5, items - 5);
439 417
440 NEED_SUCCESS (EnqueueReadBuffer, (this, mem, blocking, offset, len, ptr, event_list_count, event_list_ptr, GIMME_V != G_VOID ? &ev : 0)); 418 NEED_SUCCESS (EnqueueReadBuffer, (this, mem, blocking, offset, len, ptr, event_list_count, event_list_ptr, GIMME_V != G_VOID ? &ev : 0));
441 419
442 if (ev) 420 if (ev)
443 XPUSH_NEW_OBJ ("OpenCL::Event", ev); 421 XPUSH_NEW_OBJ ("OpenCL::Event", ev);
444}
445 422
446void 423void
447enqueue_copy_buffer (OpenCL::Queue this, OpenCL::Buffer src, OpenCL::Buffer dst, size_t src_offset, size_t dst_offset, size_t len, ...) 424enqueue_copy_buffer (OpenCL::Queue this, OpenCL::Buffer src, OpenCL::Buffer dst, size_t src_offset, size_t dst_offset, size_t len, ...)
448 PPCODE: 425 PPCODE:
449{
450 cl_event ev = 0; 426 cl_event ev = 0;
451 EVENT_LIST (6, items - 6); 427 EVENT_LIST (6, items - 6);
452 428
453 NEED_SUCCESS (EnqueueCopyBuffer, (this, src, dst, src_offset, dst_offset, len, event_list_count, event_list_ptr, GIMME_V != G_VOID ? &ev : 0)); 429 NEED_SUCCESS (EnqueueCopyBuffer, (this, src, dst, src_offset, dst_offset, len, event_list_count, event_list_ptr, GIMME_V != G_VOID ? &ev : 0));
454 430
455 if (ev) 431 if (ev)
456 XPUSH_NEW_OBJ ("OpenCL::Event", ev); 432 XPUSH_NEW_OBJ ("OpenCL::Event", ev);
457}
458 433
459 /*TODO http://www.khronos.org/registry/cl/sdk/1.1/docs/man/xhtml/clEnqueueReadBufferRect.html */ 434 /*TODO http://www.khronos.org/registry/cl/sdk/1.1/docs/man/xhtml/clEnqueueReadBufferRect.html */
460 /*TODO http://www.khronos.org/registry/cl/sdk/1.1/docs/man/xhtml/clEnqueueWriteBufferRect.html */ 435 /*TODO http://www.khronos.org/registry/cl/sdk/1.1/docs/man/xhtml/clEnqueueWriteBufferRect.html */
461 436
462void 437void
463enqueue_read_image (OpenCL::Queue this, OpenCL::Image src, cl_bool blocking, size_t src_x, size_t src_y, size_t src_z, size_t width, size_t height, size_t depth, size_t row_pitch, size_t slice_pitch, SV *data, ...) 438enqueue_read_image (OpenCL::Queue this, OpenCL::Image src, cl_bool blocking, size_t src_x, size_t src_y, size_t src_z, size_t width, size_t height, size_t depth, size_t row_pitch, size_t slice_pitch, SV *data, ...)
464 PPCODE: 439 PPCODE:
465{
466 cl_event ev = 0; 440 cl_event ev = 0;
467 const size_t src_origin[3] = { src_x, src_y, src_z }; 441 const size_t src_origin[3] = { src_x, src_y, src_z };
468 const size_t region[3] = { width, height, depth }; 442 const size_t region[3] = { width, height, depth };
469 size_t len = row_pitch * slice_pitch * depth; 443 size_t len = row_pitch * (slice_pitch ? slice_pitch : 1) * depth;
470 EVENT_LIST (11, items - 11); 444 EVENT_LIST (12, items - 12);
445
446 if (!len)
447 croak ("enqueue_read_image: currently, row_pitch must be specified to be non-zero");
471 448
472 SvUPGRADE (data, SVt_PV); 449 SvUPGRADE (data, SVt_PV);
473 SvGROW (data, len); 450 SvGROW (data, len);
474 SvPOK_only (data); 451 SvPOK_only (data);
475 SvCUR_set (data, len); 452 SvCUR_set (data, len);
476 NEED_SUCCESS (EnqueueReadImage, (this, src, blocking, src_origin, region, row_pitch, slice_pitch, SvPVX (data), event_list_count, event_list_ptr, GIMME_V != G_VOID ? &ev : 0)); 453 NEED_SUCCESS (EnqueueReadImage, (this, src, blocking, src_origin, region, row_pitch, slice_pitch, SvPVX (data), event_list_count, event_list_ptr, GIMME_V != G_VOID ? &ev : 0));
477 454
478 if (ev) 455 if (ev)
479 XPUSH_NEW_OBJ ("OpenCL::Event", ev); 456 XPUSH_NEW_OBJ ("OpenCL::Event", ev);
480}
481 457
482void 458void
483enqueue_write_image (OpenCL::Queue this, OpenCL::Image dst, cl_bool blocking, size_t dst_x, size_t dst_y, size_t dst_z, size_t width, size_t height, size_t depth, size_t row_pitch, SV *data, ...) 459enqueue_write_image (OpenCL::Queue this, OpenCL::Image dst, cl_bool blocking, size_t dst_x, size_t dst_y, size_t dst_z, size_t width, size_t height, size_t depth, size_t row_pitch, size_t slice_pitch, SV *data, ...)
484 PPCODE: 460 PPCODE:
485{
486 cl_event ev = 0; 461 cl_event ev = 0;
487 const size_t dst_origin[3] = { dst_x, dst_y, dst_z }; 462 const size_t dst_origin[3] = { dst_x, dst_y, dst_z };
488 const size_t region[3] = { width, height, depth }; 463 const size_t region[3] = { width, height, depth };
489 STRLEN len; 464 STRLEN len;
490 char *ptr = SvPVbyte (data, len); 465 char *ptr = SvPVbyte (data, len);
491 size_t slice_pitch = len / (row_pitch * height);
492 EVENT_LIST (11, items - 11); 466 EVENT_LIST (12, items - 12);
493 467
494 NEED_SUCCESS (EnqueueWriteImage, (this, dst, blocking, dst_origin, region, row_pitch, slice_pitch, SvPVX (data), event_list_count, event_list_ptr, GIMME_V != G_VOID ? &ev : 0)); 468 NEED_SUCCESS (EnqueueWriteImage, (this, dst, blocking, dst_origin, region, row_pitch, slice_pitch, SvPVX (data), event_list_count, event_list_ptr, GIMME_V != G_VOID ? &ev : 0));
495 469
496 if (ev) 470 if (ev)
497 XPUSH_NEW_OBJ ("OpenCL::Event", ev); 471 XPUSH_NEW_OBJ ("OpenCL::Event", ev);
498}
499 472
500void 473void
501enqueue_copy_buffer_rect (OpenCL::Queue this, OpenCL::Buffer src, OpenCL::Buffer dst, size_t src_x, size_t src_y, size_t src_z, size_t dst_x, size_t dst_y, size_t dst_z, size_t width, size_t height, size_t depth, size_t src_row_pitch, size_t src_slice_pitch, size_t dst_row_pitch, size_t dst_slice_pitch, ...) 474enqueue_copy_buffer_rect (OpenCL::Queue this, OpenCL::Buffer src, OpenCL::Buffer dst, size_t src_x, size_t src_y, size_t src_z, size_t dst_x, size_t dst_y, size_t dst_z, size_t width, size_t height, size_t depth, size_t src_row_pitch, size_t src_slice_pitch, size_t dst_row_pitch, size_t dst_slice_pitch, ...)
502 PPCODE: 475 PPCODE:
503{
504 cl_event ev = 0; 476 cl_event ev = 0;
505 const size_t src_origin[3] = { src_x, src_y, src_z }; 477 const size_t src_origin[3] = { src_x, src_y, src_z };
506 const size_t dst_origin[3] = { dst_x, dst_y, dst_z }; 478 const size_t dst_origin[3] = { dst_x, dst_y, dst_z };
507 const size_t region[3] = { width, height, depth }; 479 const size_t region[3] = { width, height, depth };
508 EVENT_LIST (16, items - 16); 480 EVENT_LIST (16, items - 16);
509 481
510 NEED_SUCCESS (EnqueueCopyBufferRect, (this, src, dst, src_origin, dst_origin, region, src_row_pitch, src_slice_pitch, dst_row_pitch, dst_slice_pitch, event_list_count, event_list_ptr, GIMME_V != G_VOID ? &ev : 0)); 482 NEED_SUCCESS (EnqueueCopyBufferRect, (this, src, dst, src_origin, dst_origin, region, src_row_pitch, src_slice_pitch, dst_row_pitch, dst_slice_pitch, event_list_count, event_list_ptr, GIMME_V != G_VOID ? &ev : 0));
511 483
512 if (ev) 484 if (ev)
513 XPUSH_NEW_OBJ ("OpenCL::Event", ev); 485 XPUSH_NEW_OBJ ("OpenCL::Event", ev);
514}
515 486
516void 487void
517enqueue_copy_buffer_to_image (OpenCL::Queue this, OpenCL::Buffer src, OpenCL::Image dst, size_t src_offset, size_t dst_x, size_t dst_y, size_t dst_z, size_t width, size_t height, size_t depth, ...) 488enqueue_copy_buffer_to_image (OpenCL::Queue this, OpenCL::Buffer src, OpenCL::Image dst, size_t src_offset, size_t dst_x, size_t dst_y, size_t dst_z, size_t width, size_t height, size_t depth, ...)
518 PPCODE: 489 PPCODE:
519{
520 cl_event ev = 0; 490 cl_event ev = 0;
521 const size_t dst_origin[3] = { dst_x, dst_y, dst_z }; 491 const size_t dst_origin[3] = { dst_x, dst_y, dst_z };
522 const size_t region[3] = { width, height, depth }; 492 const size_t region[3] = { width, height, depth };
523 EVENT_LIST (10, items - 10); 493 EVENT_LIST (10, items - 10);
524 494
525 NEED_SUCCESS (EnqueueCopyBufferToImage, (this, src, dst, src_offset, dst_origin, region, event_list_count, event_list_ptr, GIMME_V != G_VOID ? &ev : 0)); 495 NEED_SUCCESS (EnqueueCopyBufferToImage, (this, src, dst, src_offset, dst_origin, region, event_list_count, event_list_ptr, GIMME_V != G_VOID ? &ev : 0));
526 496
527 if (ev) 497 if (ev)
528 XPUSH_NEW_OBJ ("OpenCL::Event", ev); 498 XPUSH_NEW_OBJ ("OpenCL::Event", ev);
529}
530 499
531void 500void
532enqueue_copy_image (OpenCL::Queue this, OpenCL::Image src, OpenCL::Buffer dst, size_t src_x, size_t src_y, size_t src_z, size_t dst_x, size_t dst_y, size_t dst_z, size_t width, size_t height, size_t depth, ...) 501enqueue_copy_image (OpenCL::Queue this, OpenCL::Image src, OpenCL::Image dst, size_t src_x, size_t src_y, size_t src_z, size_t dst_x, size_t dst_y, size_t dst_z, size_t width, size_t height, size_t depth, ...)
533 PPCODE: 502 PPCODE:
534{
535 cl_event ev = 0; 503 cl_event ev = 0;
536 const size_t src_origin[3] = { src_x, src_y, src_z }; 504 const size_t src_origin[3] = { src_x, src_y, src_z };
537 const size_t dst_origin[3] = { dst_x, dst_y, dst_z }; 505 const size_t dst_origin[3] = { dst_x, dst_y, dst_z };
538 const size_t region[3] = { width, height, depth }; 506 const size_t region[3] = { width, height, depth };
539 EVENT_LIST (12, items - 12); 507 EVENT_LIST (12, items - 12);
540 508
541 NEED_SUCCESS (EnqueueCopyImage, (this, src, dst, src_origin, dst_origin, region, event_list_count, event_list_ptr, GIMME_V != G_VOID ? &ev : 0)); 509 NEED_SUCCESS (EnqueueCopyImage, (this, src, dst, src_origin, dst_origin, region, event_list_count, event_list_ptr, GIMME_V != G_VOID ? &ev : 0));
542 510
543 if (ev) 511 if (ev)
544 XPUSH_NEW_OBJ ("OpenCL::Event", ev); 512 XPUSH_NEW_OBJ ("OpenCL::Event", ev);
545}
546 513
547void 514void
548enqueue_copy_image_to_buffer (OpenCL::Queue this, OpenCL::Image src, OpenCL::Buffer dst, size_t src_x, size_t src_y, size_t src_z, size_t width, size_t height, size_t depth, size_t dst_offset, ...) 515enqueue_copy_image_to_buffer (OpenCL::Queue this, OpenCL::Image src, OpenCL::Buffer dst, size_t src_x, size_t src_y, size_t src_z, size_t width, size_t height, size_t depth, size_t dst_offset, ...)
549 PPCODE: 516 PPCODE:
550{
551 cl_event ev = 0; 517 cl_event ev = 0;
552 const size_t src_origin[3] = { src_x, src_y, src_z }; 518 const size_t src_origin[3] = { src_x, src_y, src_z };
553 const size_t region[3] = { width, height, depth }; 519 const size_t region[3] = { width, height, depth };
554 EVENT_LIST (10, items - 10); 520 EVENT_LIST (10, items - 10);
555 521
556 NEED_SUCCESS (EnqueueCopyImageToBuffer, (this, src, dst, src_origin, region, dst_offset, event_list_count, event_list_ptr, GIMME_V != G_VOID ? &ev : 0)); 522 NEED_SUCCESS (EnqueueCopyImageToBuffer, (this, src, dst, src_origin, region, dst_offset, event_list_count, event_list_ptr, GIMME_V != G_VOID ? &ev : 0));
557 523
558 if (ev) 524 if (ev)
559 XPUSH_NEW_OBJ ("OpenCL::Event", ev); 525 XPUSH_NEW_OBJ ("OpenCL::Event", ev);
560}
561 526
562void 527void
563enqueue_task (OpenCL::Queue this, OpenCL::Kernel kernel, ...) 528enqueue_task (OpenCL::Queue this, OpenCL::Kernel kernel, ...)
564 PPCODE: 529 PPCODE:
565{
566 cl_event ev = 0; 530 cl_event ev = 0;
567 EVENT_LIST (2, items - 2); 531 EVENT_LIST (2, items - 2);
568 532
569 NEED_SUCCESS (EnqueueTask, (this, kernel, event_list_count, event_list_ptr, GIMME_V != G_VOID ? &ev : 0)); 533 NEED_SUCCESS (EnqueueTask, (this, kernel, event_list_count, event_list_ptr, GIMME_V != G_VOID ? &ev : 0));
570 534
571 if (ev) 535 if (ev)
572 XPUSH_NEW_OBJ ("OpenCL::Event", ev); 536 XPUSH_NEW_OBJ ("OpenCL::Event", ev);
573}
574 537
575void 538void
576enqueue_nd_range_kernel (OpenCL::Queue this, OpenCL::Kernel kernel, SV *global_work_offset, SV *global_work_size, SV *local_work_size = &PL_sv_undef, ...) 539enqueue_nd_range_kernel (OpenCL::Queue this, OpenCL::Kernel kernel, SV *global_work_offset, SV *global_work_size, SV *local_work_size = &PL_sv_undef, ...)
577 PPCODE: 540 PPCODE:
578{
579 cl_event ev = 0; 541 cl_event ev = 0;
580 size_t *gwo = 0, *gws, *lws = 0; 542 size_t *gwo = 0, *gws, *lws = 0;
581 int gws_len; 543 int gws_len;
582 size_t *lists; 544 size_t *lists;
583 int i; 545 int i;
584 EVENT_LIST (2, items - 2); 546 EVENT_LIST (5, items - 5);
585 547
586 if (!SvROK (global_work_size) || SvTYPE (SvRV (global_work_size)) != SVt_PVAV) 548 if (!SvROK (global_work_size) || SvTYPE (SvRV (global_work_size)) != SVt_PVAV)
587 croak ("clEnqueueNDRangeKernel: global_work_size must be an array reference"); 549 croak ("clEnqueueNDRangeKernel: global_work_size must be an array reference");
588 550
589 gws_len = AvFILLp (SvRV (global_work_size)) + 1; 551 gws_len = AvFILLp (SvRV (global_work_size)) + 1;
622 584
623 NEED_SUCCESS (EnqueueNDRangeKernel, (this, kernel, gws_len, gwo, gws, lws, event_list_count, event_list_ptr, GIMME_V != G_VOID ? &ev : 0)); 585 NEED_SUCCESS (EnqueueNDRangeKernel, (this, kernel, gws_len, gwo, gws, lws, event_list_count, event_list_ptr, GIMME_V != G_VOID ? &ev : 0));
624 586
625 if (ev) 587 if (ev)
626 XPUSH_NEW_OBJ ("OpenCL::Event", ev); 588 XPUSH_NEW_OBJ ("OpenCL::Event", ev);
627}
628 589
629void 590void
630enqueue_marker (OpenCL::Queue this) 591enqueue_marker (OpenCL::Queue this)
631 PPCODE: 592 PPCODE:
632{
633 cl_event ev; 593 cl_event ev;
634 NEED_SUCCESS (EnqueueMarker, (this, &ev)); 594 NEED_SUCCESS (EnqueueMarker, (this, &ev));
635 XPUSH_NEW_OBJ ("OpenCL::Event", ev); 595 XPUSH_NEW_OBJ ("OpenCL::Event", ev);
636}
637 596
638void 597void
639enqueue_wait_for_events (OpenCL::Queue this, ...) 598enqueue_wait_for_events (OpenCL::Queue this, ...)
640 CODE: 599 CODE:
641{
642 EVENT_LIST (1, items - 1); 600 EVENT_LIST (1, items - 1);
643 NEED_SUCCESS (EnqueueWaitForEvents, (this, event_list_count, event_list_ptr)); 601 NEED_SUCCESS (EnqueueWaitForEvents, (this, event_list_count, event_list_ptr));
644}
645 602
646void 603void
647enqueue_barrier (OpenCL::Queue this) 604enqueue_barrier (OpenCL::Queue this)
648 CODE: 605 CODE:
649 NEED_SUCCESS (EnqueueBarrier, (this)); 606 NEED_SUCCESS (EnqueueBarrier, (this));
700 NEED_SUCCESS (BuildProgram, (this, 1, &device, SvPVbyte_nolen (options), 0, 0)); 657 NEED_SUCCESS (BuildProgram, (this, 1, &device, SvPVbyte_nolen (options), 0, 0));
701 658
702void 659void
703build_info (OpenCL::Program this, OpenCL::Device device, cl_program_build_info name) 660build_info (OpenCL::Program this, OpenCL::Device device, cl_program_build_info name)
704 PPCODE: 661 PPCODE:
705{
706 size_t size; 662 size_t size;
707 SV *sv;
708
709 NEED_SUCCESS (GetProgramBuildInfo, (this, device, name, 0, 0, &size)); 663 NEED_SUCCESS (GetProgramBuildInfo, (this, device, name, 0, 0, &size));
710 sv = sv_2mortal (newSV (size)); 664 SV *sv = sv_2mortal (newSV (size));
711 SvUPGRADE (sv, SVt_PV); 665 SvUPGRADE (sv, SVt_PV);
712 SvPOK_only (sv); 666 SvPOK_only (sv);
713 SvCUR_set (sv, size); 667 SvCUR_set (sv, size);
714 NEED_SUCCESS (GetProgramBuildInfo, (this, device, name, size, SvPVX (sv), 0)); 668 NEED_SUCCESS (GetProgramBuildInfo, (this, device, name, size, SvPVX (sv), 0));
715 XPUSHs (sv); 669 XPUSHs (sv);
716}
717 670
718void 671void
719kernel (OpenCL::Program program, SV *function) 672kernel (OpenCL::Program program, SV *function)
720 PPCODE: 673 PPCODE:
721{
722 cl_int res;
723 cl_kernel kernel = clCreateKernel (program, SvPVbyte_nolen (function), &res); 674 NEED_SUCCESS_ARG (cl_kernel kernel, CreateKernel, (program, SvPVbyte_nolen (function), &res));
724
725 if (res)
726 FAIL (CreateKernel, res);
727
728 XPUSH_NEW_OBJ ("OpenCL::Kernel", kernel); 675 XPUSH_NEW_OBJ ("OpenCL::Kernel", kernel);
729}
730 676
731MODULE = OpenCL PACKAGE = OpenCL::Kernel 677MODULE = OpenCL PACKAGE = OpenCL::Kernel
732 678
733void 679void
734DESTROY (OpenCL::Kernel this) 680DESTROY (OpenCL::Kernel this)
789set_float (OpenCL::Kernel this, cl_uint idx, cl_float value) 735set_float (OpenCL::Kernel this, cl_uint idx, cl_float value)
790 CODE: 736 CODE:
791 clSetKernelArg (this, idx, sizeof (value), &value); 737 clSetKernelArg (this, idx, sizeof (value), &value);
792 738
793void 739void
740set_double (OpenCL::Kernel this, cl_uint idx, cl_double value)
741 CODE:
742 clSetKernelArg (this, idx, sizeof (value), &value);
743
744void
794set_memory (OpenCL::Kernel this, cl_uint idx, OpenCL::Memory_ornull value) 745set_memory (OpenCL::Kernel this, cl_uint idx, OpenCL::Memory_ornull value)
795 CODE: 746 CODE:
796 clSetKernelArg (this, idx, sizeof (value), &value); 747 clSetKernelArg (this, idx, sizeof (value), &value);
797 748
798void 749void
835void 786void
836wait (OpenCL::Event this) 787wait (OpenCL::Event this)
837 CODE: 788 CODE:
838 clWaitForEvents (1, &this); 789 clWaitForEvents (1, &this);
839 790
791MODULE = OpenCL PACKAGE = OpenCL::UserEvent
792
793void
794set_status (OpenCL::UserEvent this, cl_int execution_status)
795 CODE:
796 clSetUserEventStatus (this, execution_status);
797

Diff Legend

Removed lines
+ Added lines
< Changed lines
> Changed lines