ViewVC Help
View File | Revision Log | Show Annotations | Download File
/cvs/OpenCL/OpenCL.xs
(Generate patch)

Comparing OpenCL/OpenCL.xs (file contents):
Revision 1.3 by root, Tue Nov 15 20:38:07 2011 UTC vs.
Revision 1.11 by root, Thu Nov 17 04:17:43 2011 UTC

20typedef cl_mem OpenCL__Image3D_ornull; 20typedef cl_mem OpenCL__Image3D_ornull;
21typedef cl_sampler OpenCL__Sampler; 21typedef cl_sampler OpenCL__Sampler;
22typedef cl_program OpenCL__Program; 22typedef cl_program OpenCL__Program;
23typedef cl_kernel OpenCL__Kernel; 23typedef cl_kernel OpenCL__Kernel;
24typedef cl_event OpenCL__Event; 24typedef cl_event OpenCL__Event;
25typedef cl_event OpenCL__UserEvent;
26
27typedef SV *FUTURE;
28
29/*****************************************************************************/
30
/*
 * Return a scratch buffer of at least size bytes.
 *
 * Two buffers are kept in static storage and handed out alternately, so the
 * pointers returned by the two most recent calls can be used side by side;
 * any older pointer may be recycled or freed by a later call.  The buffers
 * only grow, their contents are not preserved across growth, and the caller
 * must never free them.
 *
 * Returns a null pointer when the rounded-up size would overflow size_t or
 * when the allocation fails (and, as long as nothing was ever allocated for
 * the slot, for a size of zero).
 */
static void *
tmpbuf (size_t size)
{
  static int idx;
  static void *buf [2];
  static size_t len [2];

  idx ^= 1;

  if (len [idx] < size)
    {
      /* smallest capacity of the form k * 4096 - 32 that holds size bytes */
      size_t want = ((size + 31) & ~(size_t)4095) + 4096 - 32;

      /* old contents are never preserved, so release before allocating */
      free (buf [idx]);
      buf [idx] = 0;
      len [idx] = 0;

      /* want < size means the rounding above wrapped around */
      if (want >= size)
        buf [idx] = malloc (want);

      /* only record a capacity for memory that really exists */
      if (buf [idx])
        len [idx] = want;
    }

  return buf [idx];
}
50
51/*****************************************************************************/
25 52
26typedef struct 53typedef struct
27{ 54{
28 IV iv; 55 IV iv;
29 const char *name; 56 const char *name;
63 }; 90 };
64 91
65 return iv2str (err, errstr, sizeof (errstr) / sizeof (errstr [0]), "ERROR(%d)"); 92 return iv2str (err, errstr, sizeof (errstr) / sizeof (errstr [0]), "ERROR(%d)");
66} 93}
67 94
95/*****************************************************************************/
96
97static cl_int res;
98
68#define FAIL(name,res) \ 99#define FAIL(name) \
69 croak ("cl" # name ": %s", err2str (res)); 100 croak ("cl" # name ": %s", err2str (res));
70 101
71#define NEED_SUCCESS(name,args) \ 102#define NEED_SUCCESS(name,args) \
72 do { \ 103 do { \
73 cl_int res = cl ## name args; \ 104 res = cl ## name args; \
74 \ 105 \
75 if (res) \ 106 if (res) \
76 FAIL (name, res); \ 107 FAIL (name); \
77 } while (0) 108 } while (0)
109
110#define NEED_SUCCESS_ARG(retdecl, name, args) \
111 retdecl = cl ## name args; \
112 if (res) \
113 FAIL (name);
114
115/*****************************************************************************/
78 116
/* NEW_MORTAL_OBJ: new mortal SV made into a reference blessed into class that holds ptr */
/* XPUSH_NEW_OBJ: the same, pushed onto the Perl stack with XPUSHs */
79#define NEW_MORTAL_OBJ(class,ptr) sv_setref_pv (sv_newmortal (), class, ptr) 117#define NEW_MORTAL_OBJ(class,ptr) sv_setref_pv (sv_newmortal (), class, ptr)
80#define XPUSH_NEW_OBJ(class,ptr) XPUSHs (NEW_MORTAL_OBJ (class, ptr)) 118#define XPUSH_NEW_OBJ(class,ptr) XPUSHs (NEW_MORTAL_OBJ (class, ptr))
81 119
82/*TODO*/ 120static void *
83#define EVENT_LIST(items,count) cl_uint event_list_count = 0; cl_event *event_list_ptr = 0 121SvPTROBJ (const char *func, const char *svname, SV *sv, const char *pkg)
122{
123 if (SvROK (sv) && sv_derived_from (sv, pkg))
124 return (void *)SvIV (SvRV (sv));
125
126 croak ("%s: %s is not of type %s", func, svname, pkg);
127}
128
129/*****************************************************************************/
130
131static size_t
132img_row_pitch (cl_mem img)
133{
134 size_t res;
135 clGetImageInfo (img, CL_IMAGE_ROW_PITCH, sizeof (res), &res, 0);
136 return res;
137}
138
139static cl_event *
140event_list (SV **items, int count)
141{
142 cl_event *list = tmpbuf (sizeof (cl_event) * count);
143
144 while (count--)
145 list [count] = SvPTROBJ ("clEnqueue", "wait_events", items [count], "OpenCL::Event");
146
147 return list;
148}
149
/* declares event_list_count and event_list_ptr in the current scope: count is the */
/* number of wait events, items the index of the first one on the Perl stack */
150#define EVENT_LIST(items,count) \
151 cl_uint event_list_count = (count); \
152 cl_event *event_list_ptr = event_list (&ST (items), event_list_count)
84 153
/*
 * Body shared by the info methods: calls clGet<class>Info twice for the
 * property "name" of the object "this" (both taken from the enclosing XSUB)
 * and pushes the raw result bytes as a mortal string.
 */
#define INFO(class) \
{ \
  size_t info_len; \
  SV *info_sv; \
  \
  /* a zero-sized query only reports how many bytes the value needs */ \
  NEED_SUCCESS (Get ## class ## Info, (this, name, 0, 0, &info_len)); \
  \
  info_sv = sv_2mortal (newSV (info_len)); \
  SvUPGRADE (info_sv, SVt_PV); \
  SvPOK_only (info_sv); \
  SvCUR_set (info_sv, info_len); \
  \
  /* second query fills the string buffer in place */ \
  NEED_SUCCESS (Get ## class ## Info, (this, name, info_len, SvPVX (info_sv), 0)); \
  XPUSHs (info_sv); \
}
98 165
/* revision 1.3 position of SvPTROBJ: returns the pointer stored in the scalar that */
/* sv references when sv is a reference derived from pkg, and croaks otherwise; */
/* func and svname only appear in the error message */
99static void *
100SvPTROBJ (const char *func, const char *svname, SV *sv, const char *pkg)
101{
102 if (SvROK (sv) && sv_derived_from (sv, pkg))
103 return (void *)SvIV (SvRV (sv));
104
105 croak ("%s: %s is not of type %s", func, svname, pkg);
106}
107
108MODULE = OpenCL PACKAGE = OpenCL 166MODULE = OpenCL PACKAGE = OpenCL
109 167
110PROTOTYPES: ENABLE 168PROTOTYPES: ENABLE
111 169
BOOT:
{
        /* integer constants that become constant subs in package OpenCL; */
        /* constiv.h contributes further table rows */
        static const ivstr const_iv[] = {
          { sizeof (cl_char  ), "SIZEOF_CHAR"   },
          { sizeof (cl_uchar ), "SIZEOF_UCHAR"  },
          { sizeof (cl_short ), "SIZEOF_SHORT"  },
          { sizeof (cl_ushort), "SIZEOF_USHORT" },
          { sizeof (cl_int   ), "SIZEOF_INT"    },
          { sizeof (cl_uint  ), "SIZEOF_UINT"   },
          { sizeof (cl_long  ), "SIZEOF_LONG"   },
          { sizeof (cl_ulong ), "SIZEOF_ULONG"  },
          { sizeof (cl_half  ), "SIZEOF_HALF"   },
          { sizeof (cl_float ), "SIZEOF_FLOAT"  },
          { sizeof (cl_double), "SIZEOF_DOUBLE" },
#include "constiv.h"
        };
        HV *stash = gv_stashpv ("OpenCL", 1);
        size_t left = sizeof (const_iv) / sizeof (const_iv [0]);

        /* register the entries from the last table row down to the first */
        while (left--)
          newCONSTSUB (stash, (char *)const_iv [left].name, newSViv (const_iv [left].iv));
}
131 190
cl_int
errno ()
        CODE:
        /* report the status of the most recent OpenCL call made through the */
        /* NEED_SUCCESS macros; it has to go into RETVAL, not the C errno */
        RETVAL = res;
        OUTPUT:
        RETVAL
195
# err2str and enum2str have no CODE section: they are bare XS declarations
# for C functions of the same name taking one integer and returning a string.
132const char * 196const char *
133err2str (cl_int err) 197err2str (cl_int err)
134 198
135const char * 199const char *
136enum2str (cl_uint value) 200enum2str (cl_uint value)
137 201
void
platforms ()
        PPCODE:
{
        /* returns one OpenCL::Platform object per available platform */
        cl_uint count, n;
        cl_platform_id *ids;

        /* the first call only counts, the second one fetches that many ids */
        NEED_SUCCESS (GetPlatformIDs, (0, 0, &count));
        ids = tmpbuf (count * sizeof (*ids));
        NEED_SUCCESS (GetPlatformIDs, (count, ids, 0));

        EXTEND (SP, count);

        for (n = 0; n < count; n++)
          PUSHs (NEW_MORTAL_OBJ ("OpenCL::Platform", ids [n]));
}
156
void
context_from_type (FUTURE properties = 0, cl_device_type type = CL_DEVICE_TYPE_DEFAULT, FUTURE notify = 0)
        PPCODE:
{
        /* properties and notify are accepted but not passed on to OpenCL */
        cl_context ctx = clCreateContextFromType (0, type, 0, 0, &res);

        if (res)
          FAIL (CreateContextFromType);

        XPUSH_NEW_OBJ ("OpenCL::Context", ctx);
}
223void
224context (FUTURE properties, FUTURE devices, FUTURE notify = 0)
225 PPCODE:
226 /* "the pinnacle of art" - placeholder, this body contains no code yet */
169 227
void
wait_for_events (...)
        CODE:
{
        /* every argument is an event object to wait for */
        cl_uint event_list_count = items;
        cl_event *event_list_ptr = event_list (&ST (0), event_list_count);

        NEED_SUCCESS (WaitForEvents, (event_list_count, event_list_ptr));
}
177 233
178PROTOTYPES: DISABLE 234PROTOTYPES: DISABLE
179 235
180MODULE = OpenCL PACKAGE = OpenCL::Platform 236MODULE = OpenCL PACKAGE = OpenCL::Platform
181 237
185 INFO (Platform) 241 INFO (Platform)
186 242
void
devices (OpenCL::Platform this, cl_device_type type = CL_DEVICE_TYPE_ALL)
        PPCODE:
{
        /* returns one OpenCL::Device object per device of the given type */
        cl_uint count, n;
        cl_device_id *ids;

        /* the first call only counts, the second one fetches that many ids */
        NEED_SUCCESS (GetDeviceIDs, (this, type, 0, 0, &count));
        ids = tmpbuf (count * sizeof (*ids));
        NEED_SUCCESS (GetDeviceIDs, (this, type, count, ids, 0));

        EXTEND (SP, count);

        for (n = 0; n < count; n++)
          PUSHs (NEW_MORTAL_OBJ ("OpenCL::Device", ids [n]));
}
205
void
context (OpenCL::Platform this, FUTURE properties, SV *devices, FUTURE notify = 0)
        PPCODE:
{
        /*
         * Create a context for the devices in the array reference "devices" and
         * push it as an OpenCL::Context.  properties and notify are accepted but
         * not passed on; the platform object itself is not passed on either.
         */
        AV *av;
        cl_uint num_devices;
        cl_device_id *device_list;
        int i;

        if (!SvROK (devices) || SvTYPE (SvRV (devices)) != SVt_PVAV)
          croak ("OpenCL::Platform argument 'devices' must be an arrayref with device objects, in call");

        av = (AV *)SvRV (devices);
        num_devices = av_len (av) + 1;
        device_list = tmpbuf (sizeof (cl_device_id) * num_devices);

        for (i = num_devices; i--; )
          {
            /* av_fetch returns a null pointer for holes; treat those like undef */
            /* so that SvPTROBJ produces its usual type error */
            SV **elem = av_fetch (av, i, 0);

            device_list [i] = SvPTROBJ ("clCreateContext", "devices", elem ? *elem : &PL_sv_undef, "OpenCL::Device");
          }

        NEED_SUCCESS_ARG (cl_context ctx, CreateContext, (0, num_devices, device_list, 0, 0, &res));
        XPUSH_NEW_OBJ ("OpenCL::Context", ctx);
}
274
void
context_from_type (OpenCL::Platform this, FUTURE properties = 0, cl_device_type type = CL_DEVICE_TYPE_DEFAULT, FUTURE notify = 0)
        PPCODE:
{
        /* tie the context to this platform; the property list is zero-terminated. */
        /* properties and notify are accepted but not passed on to OpenCL */
        cl_context_properties props[] = { CL_CONTEXT_PLATFORM, (cl_context_properties)this, 0 };
        cl_context ctx = clCreateContextFromType (props, type, 0, 0, &res);

        if (res)
          FAIL (CreateContextFromType);

        XPUSH_NEW_OBJ ("OpenCL::Context", ctx);
}
219 281
220MODULE = OpenCL PACKAGE = OpenCL::Device 282MODULE = OpenCL PACKAGE = OpenCL::Device
221 283
222void 284void
223info (OpenCL::Device this, cl_device_info name) 285info (OpenCL::Device this, cl_device_info name)
224 PPCODE: 286 PPCODE:
 /* INFO queries clGetDeviceInfo for "name" on "this" and pushes the raw bytes as a string */
225 INFO (Device) 287 INFO (Device)
226 288
227void
228context_simple (OpenCL::Device this)
229 PPCODE:
230{
 /* revision 1.3 only: creates a context holding just this one device, with no */
 /* properties and no notify callback, and pushes it as an OpenCL::Context */
231 cl_int res;
232 cl_context ctx = clCreateContext (0, 1, &this, 0, 0, &res);
233
 /* a non-zero status is turned into a croak by FAIL */
234 if (res)
235 FAIL (CreateContext, res);
236
237 XPUSH_NEW_OBJ ("OpenCL::Context", ctx);
238}
239
240MODULE = OpenCL PACKAGE = OpenCL::Context 289MODULE = OpenCL PACKAGE = OpenCL::Context
241 290
242void 291void
243DESTROY (OpenCL::Context context) 292DESTROY (OpenCL::Context context)
244 CODE: 293 CODE:
248info (OpenCL::Context this, cl_context_info name) 297info (OpenCL::Context this, cl_context_info name)
249 PPCODE: 298 PPCODE:
250 INFO (Context) 299 INFO (Context)
251 300
void
queue (OpenCL::Context this, OpenCL::Device device, cl_command_queue_properties properties = 0)
        PPCODE:
{
        /* create a command queue for device in this context and push it as OpenCL::Queue */
        cl_command_queue queue = clCreateCommandQueue (this, device, properties, &res);

        if (res)
          FAIL (CreateCommandQueue);

        XPUSH_NEW_OBJ ("OpenCL::Queue", queue);
}
void
user_event (OpenCL::Context this)
        PPCODE:
{
        /* create a user event in this context and push it as OpenCL::UserEvent */
        cl_event ev = clCreateUserEvent (this, &res);

        if (res)
          FAIL (CreateUserEvent);

        XPUSH_NEW_OBJ ("OpenCL::UserEvent", ev);
}
264 312
void
buffer (OpenCL::Context this, cl_mem_flags flags, size_t len)
        PPCODE:
{
        /* create a buffer of len bytes without host data and push it as OpenCL::Buffer */
        cl_mem mem;

        /* the host-pointer flags make no sense here because no data is supplied */
        if (flags & (CL_MEM_USE_HOST_PTR | CL_MEM_COPY_HOST_PTR))
          croak ("clCreateBuffer: cannot use/copy host ptr when no data is given, use $context->buffer_sv instead?");

        mem = clCreateBuffer (this, flags, len, 0, &res);

        if (res)
          FAIL (CreateBuffer);

        XPUSH_NEW_OBJ ("OpenCL::Buffer", mem);
}
282 321
void
buffer_sv (OpenCL::Context this, cl_mem_flags flags, SV *data)
        PPCODE:
{
        /* create a buffer from the bytes of data and push it as OpenCL::Buffer */
        STRLEN nbytes;
        char *bytes = SvPVbyte (data, nbytes);
        cl_mem mem;

        /* with host data present, one of the host-pointer flags is mandatory */
        if (!(flags & (CL_MEM_USE_HOST_PTR | CL_MEM_COPY_HOST_PTR)))
          croak ("clCreateBuffer: have to specify use or copy host ptr when buffer data is given, use $context->buffer instead?");

        mem = clCreateBuffer (this, flags, nbytes, bytes, &res);

        if (res)
          FAIL (CreateBuffer);

        XPUSH_NEW_OBJ ("OpenCL::Buffer", mem);
}
302 333
void
image2d (OpenCL::Context this, cl_mem_flags flags, cl_channel_order channel_order, cl_channel_type channel_type, size_t width, size_t height, size_t row_pitch, SV *data)
        PPCODE:
{
        /* create a 2D image from the bytes of data and push it as OpenCL::Image2D; */
        /* the length of data is fetched but not checked against the image size */
        STRLEN nbytes;
        char *bytes = SvPVbyte (data, nbytes);
        const cl_image_format fmt = { channel_order, channel_type };
        cl_mem mem = clCreateImage2D (this, flags, &fmt, width, height, row_pitch, bytes, &res);

        if (res)
          FAIL (CreateImage2D);

        XPUSH_NEW_OBJ ("OpenCL::Image2D", mem);
}
318 342
void
image3d (OpenCL::Context this, cl_mem_flags flags, cl_channel_order channel_order, cl_channel_type channel_type, size_t width, size_t height, size_t depth, size_t row_pitch, size_t slice_pitch, SV *data)
        PPCODE:
{
        /* create a 3D image from the bytes of data and push it as OpenCL::Image3D; */
        /* the length of data is fetched but not checked against the image size */
        STRLEN nbytes;
        char *bytes = SvPVbyte (data, nbytes);
        const cl_image_format fmt = { channel_order, channel_type };
        cl_mem mem = clCreateImage3D (this, flags, &fmt, width, height, depth, row_pitch, slice_pitch, bytes, &res);

        if (res)
          FAIL (CreateImage3D);

        XPUSH_NEW_OBJ ("OpenCL::Image3D", mem);
}
335 351
336void 352void
337supported_image_formats (OpenCL::Context this, cl_mem_flags flags, cl_mem_object_type image_type) 353supported_image_formats (OpenCL::Context this, cl_mem_flags flags, cl_mem_object_type image_type)
338 PPCODE: 354 PPCODE:
339{ 355{
356} 372}
357 373
void
sampler (OpenCL::Context this, cl_bool normalized_coords, cl_addressing_mode addressing_mode, cl_filter_mode filter_mode)
        PPCODE:
{
        /* create a sampler in this context and push it as OpenCL::Sampler */
        cl_sampler sampler = clCreateSampler (this, normalized_coords, addressing_mode, filter_mode, &res);

        if (res)
          FAIL (CreateSampler);

        XPUSH_NEW_OBJ ("OpenCL::Sampler", sampler);
}
370 379
void
program_with_source (OpenCL::Context this, SV *program)
        PPCODE:
{
        /* create a program from a single source string and push it as OpenCL::Program */
        STRLEN src_len;
        const char *src = SvPVbyte (program, src_len);
        /* OpenCL wants an array of size_t lengths, hence the copy out of the STRLEN */
        size_t src_size = src_len;
        cl_program prog = clCreateProgramWithSource (this, 1, &src, &src_size, &res);

        if (res)
          FAIL (CreateProgramWithSource);

        XPUSH_NEW_OBJ ("OpenCL::Program", prog);
}
389 390
390MODULE = OpenCL PACKAGE = OpenCL::Queue 391MODULE = OpenCL PACKAGE = OpenCL::Queue
391 392
392void 393void
393DESTROY (OpenCL::Queue this) 394DESTROY (OpenCL::Queue this)
400 INFO (CommandQueue) 401 INFO (CommandQueue)
401 402
402void 403void
403enqueue_read_buffer (OpenCL::Queue this, OpenCL::Buffer mem, cl_bool blocking, size_t offset, size_t len, SV *data, ...) 404enqueue_read_buffer (OpenCL::Queue this, OpenCL::Buffer mem, cl_bool blocking, size_t offset, size_t len, SV *data, ...)
404 PPCODE: 405 PPCODE:
405{
406 cl_event ev = 0; 406 cl_event ev = 0;
407 EVENT_LIST (6, items - 6); 407 EVENT_LIST (6, items - 6);
408 408
409 SvUPGRADE (data, SVt_PV); 409 SvUPGRADE (data, SVt_PV);
410 SvGROW (data, len); 410 SvGROW (data, len);
412 SvCUR_set (data, len); 412 SvCUR_set (data, len);
413 NEED_SUCCESS (EnqueueReadBuffer, (this, mem, blocking, offset, len, SvPVX (data), event_list_count, event_list_ptr, GIMME_V != G_VOID ? &ev : 0)); 413 NEED_SUCCESS (EnqueueReadBuffer, (this, mem, blocking, offset, len, SvPVX (data), event_list_count, event_list_ptr, GIMME_V != G_VOID ? &ev : 0));
414 414
415 if (ev) 415 if (ev)
416 XPUSH_NEW_OBJ ("OpenCL::Event", ev); 416 XPUSH_NEW_OBJ ("OpenCL::Event", ev);
417}
418 417
void
enqueue_write_buffer (OpenCL::Queue this, OpenCL::Buffer mem, cl_bool blocking, size_t offset, SV *data, ...)
        PPCODE:
{
        /*
         * Queue a copy of the bytes of data into mem at byte offset "offset".
         * Arguments after data are events to wait for.  Unless called in void
         * context, the completion event is pushed as an OpenCL::Event.
         */
        cl_event ev = 0;
        STRLEN len;
        char *ptr = SvPVbyte (data, len);
        EVENT_LIST (5, items - 5);

        /* must be the write call: the read call would overwrite the Perl string */
        NEED_SUCCESS (EnqueueWriteBuffer, (this, mem, blocking, offset, len, ptr, event_list_count, event_list_ptr, GIMME_V != G_VOID ? &ev : 0));

        if (ev)
          XPUSH_NEW_OBJ ("OpenCL::Event", ev);
}
433 430
void
enqueue_copy_buffer (OpenCL::Queue this, OpenCL::Buffer src, OpenCL::Buffer dst, size_t src_offset, size_t dst_offset, size_t len, ...)
        PPCODE:
{
        /* wait events are all arguments after the six fixed ones */
        EVENT_LIST (6, items - 6);
        cl_event done = 0;
        /* only request a completion event when the caller wants a return value */
        cl_event *done_ptr = GIMME_V != G_VOID ? &done : 0;

        NEED_SUCCESS (EnqueueCopyBuffer, (this, src, dst, src_offset, dst_offset, len, event_list_count, event_list_ptr, done_ptr));

        if (done)
          XPUSH_NEW_OBJ ("OpenCL::Event", done);
}
446
447 /*TODO http://www.khronos.org/registry/cl/sdk/1.1/docs/man/xhtml/clEnqueueReadBufferRect.html */
448 /*TODO http://www.khronos.org/registry/cl/sdk/1.1/docs/man/xhtml/clEnqueueWriteBufferRect.html */
449 441
void
enqueue_read_image (OpenCL::Queue this, OpenCL::Image src, cl_bool blocking, size_t src_x, size_t src_y, size_t src_z, size_t width, size_t height, size_t depth, size_t row_pitch, size_t slice_pitch, SV *data, ...)
        PPCODE:
{
        /*
         * Queue a read of an image region into the string buffer of data, which
         * is resized to fit.  Arguments after data are events to wait for.
         */
        const size_t src_origin[3] = { src_x, src_y, src_z };
        const size_t region[3] = { width, height, depth };
        cl_event done = 0;
        size_t nbytes;
        EVENT_LIST (12, items - 12);

        /* a zero row pitch is replaced by the pitch the image itself reports */
        if (!row_pitch)
          row_pitch = img_row_pitch (src);

        /* a slice pitch is only derived when there is more than one slice */
        if (depth > 1 && !slice_pitch)
          slice_pitch = row_pitch * height;

        if (slice_pitch)
          nbytes = slice_pitch * depth;
        else
          nbytes = row_pitch * height;

        /* turn data into a plain string with room for the result */
        SvUPGRADE (data, SVt_PV);
        SvGROW (data, nbytes);
        SvPOK_only (data);
        SvCUR_set (data, nbytes);

        NEED_SUCCESS (EnqueueReadImage, (this, src, blocking, src_origin, region, row_pitch, slice_pitch, SvPVX (data), event_list_count, event_list_ptr, GIMME_V != G_VOID ? &done : 0));

        if (done)
          XPUSH_NEW_OBJ ("OpenCL::Event", done);
}
469 466
void
enqueue_write_image (OpenCL::Queue this, OpenCL::Image dst, cl_bool blocking, size_t dst_x, size_t dst_y, size_t dst_z, size_t width, size_t height, size_t depth, size_t row_pitch, size_t slice_pitch, SV *data, ...)
        PPCODE:
{
        /*
         * Queue a write of the bytes of data into an image region.  Arguments
         * after data are events to wait for.  Croaks when data is shorter than
         * the amount that the pitches say will be transferred.
         */
        cl_event ev = 0;
        const size_t dst_origin[3] = { dst_x, dst_y, dst_z };
        const size_t region[3] = { width, height, depth };
        STRLEN len;
        char *ptr = SvPVbyte (data, len);
        size_t min_len;
        EVENT_LIST (12, items - 12);

        /* a zero row pitch is replaced by the pitch the image itself reports */
        if (!row_pitch)
          row_pitch = img_row_pitch (dst);

        if (depth > 1 && !slice_pitch)
          slice_pitch = row_pitch * height;

        min_len = slice_pitch ? slice_pitch * depth : row_pitch * height;

        if (len < min_len)
          croak ("clEnqueueWriteImage: data string is shorter than what would be transferred");

        /* hand over the pointer returned by SvPVbyte: it is the one that len */
        /* describes, and it is valid even when data is not a plain string */
        NEED_SUCCESS (EnqueueWriteImage, (this, dst, blocking, dst_origin, region, row_pitch, slice_pitch, ptr, event_list_count, event_list_ptr, GIMME_V != G_VOID ? &ev : 0));

        if (ev)
          XPUSH_NEW_OBJ ("OpenCL::Event", ev);
}
487 492
void
enqueue_copy_buffer_rect (OpenCL::Queue this, OpenCL::Buffer src, OpenCL::Buffer dst, size_t src_x, size_t src_y, size_t src_z, size_t dst_x, size_t dst_y, size_t dst_z, size_t width, size_t height, size_t depth, size_t src_row_pitch, size_t src_slice_pitch, size_t dst_row_pitch, size_t dst_slice_pitch, ...)
        PPCODE:
{
        /* OpenCL takes origins and region as three-element arrays */
        const size_t region[3] = { width, height, depth };
        const size_t dst_origin[3] = { dst_x, dst_y, dst_z };
        const size_t src_origin[3] = { src_x, src_y, src_z };
        /* wait events are all arguments after the sixteen fixed ones */
        EVENT_LIST (16, items - 16);
        cl_event done = 0;
        /* only request a completion event when the caller wants a return value */
        cl_event *done_ptr = GIMME_V != G_VOID ? &done : 0;

        NEED_SUCCESS (EnqueueCopyBufferRect, (this, src, dst, src_origin, dst_origin, region, src_row_pitch, src_slice_pitch, dst_row_pitch, dst_slice_pitch, event_list_count, event_list_ptr, done_ptr));

        if (done)
          XPUSH_NEW_OBJ ("OpenCL::Event", done);
}
503 506
void
enqueue_copy_buffer_to_image (OpenCL::Queue this, OpenCL::Buffer src, OpenCL::Image dst, size_t src_offset, size_t dst_x, size_t dst_y, size_t dst_z, size_t width, size_t height, size_t depth, ...)
        PPCODE:
{
        /* OpenCL takes origin and region as three-element arrays */
        const size_t region[3] = { width, height, depth };
        const size_t dst_origin[3] = { dst_x, dst_y, dst_z };
        /* wait events are all arguments after the ten fixed ones */
        EVENT_LIST (10, items - 10);
        cl_event done = 0;
        /* only request a completion event when the caller wants a return value */
        cl_event *done_ptr = GIMME_V != G_VOID ? &done : 0;

        NEED_SUCCESS (EnqueueCopyBufferToImage, (this, src, dst, src_offset, dst_origin, region, event_list_count, event_list_ptr, done_ptr));

        if (done)
          XPUSH_NEW_OBJ ("OpenCL::Event", done);
}
518 519
void
enqueue_copy_image (OpenCL::Queue this, OpenCL::Image src, OpenCL::Image dst, size_t src_x, size_t src_y, size_t src_z, size_t dst_x, size_t dst_y, size_t dst_z, size_t width, size_t height, size_t depth, ...)
        PPCODE:
{
        /* OpenCL takes origins and region as three-element arrays */
        const size_t region[3] = { width, height, depth };
        const size_t dst_origin[3] = { dst_x, dst_y, dst_z };
        const size_t src_origin[3] = { src_x, src_y, src_z };
        /* wait events are all arguments after the twelve fixed ones */
        EVENT_LIST (12, items - 12);
        cl_event done = 0;
        /* only request a completion event when the caller wants a return value */
        cl_event *done_ptr = GIMME_V != G_VOID ? &done : 0;

        NEED_SUCCESS (EnqueueCopyImage, (this, src, dst, src_origin, dst_origin, region, event_list_count, event_list_ptr, done_ptr));

        if (done)
          XPUSH_NEW_OBJ ("OpenCL::Event", done);
}
534 533
void
enqueue_copy_image_to_buffer (OpenCL::Queue this, OpenCL::Image src, OpenCL::Buffer dst, size_t src_x, size_t src_y, size_t src_z, size_t width, size_t height, size_t depth, size_t dst_offset, ...)
        PPCODE:
{
        /* OpenCL takes origin and region as three-element arrays */
        const size_t region[3] = { width, height, depth };
        const size_t src_origin[3] = { src_x, src_y, src_z };
        /* wait events are all arguments after the ten fixed ones */
        EVENT_LIST (10, items - 10);
        cl_event done = 0;
        /* only request a completion event when the caller wants a return value */
        cl_event *done_ptr = GIMME_V != G_VOID ? &done : 0;

        NEED_SUCCESS (EnqueueCopyImageToBuffer, (this, src, dst, src_origin, region, dst_offset, event_list_count, event_list_ptr, done_ptr));

        if (done)
          XPUSH_NEW_OBJ ("OpenCL::Event", done);
}
549 546
void
enqueue_task (OpenCL::Queue this, OpenCL::Kernel kernel, ...)
        PPCODE:
{
        /* wait events are all arguments after the two fixed ones */
        EVENT_LIST (2, items - 2);
        cl_event done = 0;
        /* only request a completion event when the caller wants a return value */
        cl_event *done_ptr = GIMME_V != G_VOID ? &done : 0;

        NEED_SUCCESS (EnqueueTask, (this, kernel, event_list_count, event_list_ptr, done_ptr));

        if (done)
          XPUSH_NEW_OBJ ("OpenCL::Event", done);
}
562 557
void
enqueue_nd_range_kernel (OpenCL::Queue this, OpenCL::Kernel kernel, SV *global_work_offset, SV *global_work_size, SV *local_work_size = &PL_sv_undef, ...)
        PPCODE:
{
        /*
         * Queue kernel for execution over an N-dimensional range.
         *
         * global_work_size must be an array reference; its length is the number
         * of dimensions.  global_work_offset and local_work_size may each be
         * undef or an array reference of that same length.  Arguments after
         * local_work_size are events to wait for.  Unless called in void
         * context, the completion event is pushed as an OpenCL::Event.
         */
        cl_event ev = 0;
        size_t *gwo = 0, *gws, *lws = 0;
        size_t *lists;
        AV *av;
        SV **elem;
        int gws_len;
        int i;
        /* local_work_size is optional, so items - 5 would go negative without it */
        EVENT_LIST (5, items > 5 ? items - 5 : 0);

        if (!SvROK (global_work_size) || SvTYPE (SvRV (global_work_size)) != SVt_PVAV)
          croak ("clEnqueueNDRangeKernel: global_work_size must be an array reference");

        av = (AV *)SvRV (global_work_size);
        gws_len = av_len (av) + 1;

        /* one scratch allocation holds sizes, offsets and local sizes back to back */
        lists = tmpbuf (sizeof (size_t) * 3 * gws_len);

        gws = lists + gws_len * 0;
        for (i = 0; i < gws_len; ++i)
          {
            /* av_fetch returns a null pointer for holes; count those as 0 */
            elem = av_fetch (av, i, 0);
            gws [i] = elem ? SvIV (*elem) : 0;
          }

        if (SvOK (global_work_offset))
          {
            if (!SvROK (global_work_offset) || SvTYPE (SvRV (global_work_offset)) != SVt_PVAV)
              croak ("clEnqueueNDRangeKernel: global_work_offset must be undef or an array reference");

            av = (AV *)SvRV (global_work_offset);

            /* compare the offset array itself, not global_work_size, with the dimension count */
            if (av_len (av) + 1 != gws_len)
              croak ("clEnqueueNDRangeKernel: global_work_offset must be undef or an array of same size as global_work_size");

            gwo = lists + gws_len * 1;
            for (i = 0; i < gws_len; ++i)
              {
                elem = av_fetch (av, i, 0);
                gwo [i] = elem ? SvIV (*elem) : 0;
              }
          }

        if (SvOK (local_work_size))
          {
            if (!SvROK (local_work_size) || SvTYPE (SvRV (local_work_size)) != SVt_PVAV)
              croak ("clEnqueueNDRangeKernel: local_work_size must be undef or an array reference");

            av = (AV *)SvRV (local_work_size);

            if (av_len (av) + 1 != gws_len)
              croak ("clEnqueueNDRangeKernel: local_work_size must be undef or an array of same size as global_work_size");

            lws = lists + gws_len * 2;
            for (i = 0; i < gws_len; ++i)
              {
                elem = av_fetch (av, i, 0);
                lws [i] = elem ? SvIV (*elem) : 0;
              }
          }

        NEED_SUCCESS (EnqueueNDRangeKernel, (this, kernel, gws_len, gwo, gws, lws, event_list_count, event_list_ptr, GIMME_V != G_VOID ? &ev : 0));

        if (ev)
          XPUSH_NEW_OBJ ("OpenCL::Event", ev);
}
564 609
565void 610void
566enqueue_marker (OpenCL::Queue this) 611enqueue_marker (OpenCL::Queue this)
567 PPCODE: 612 PPCODE:
 /* Calls clEnqueueMarker on queue `this` and pushes the resulting event as class "OpenCL::Event". NEED_SUCCESS croaks if the call returns non-zero. */
 /* Unlike the other enqueue_* XSUBs shown nearby, the event is requested regardless of calling context. */
568{
569 cl_event ev; 613 cl_event ev;
570 NEED_SUCCESS (EnqueueMarker, (this, &ev)); 614 NEED_SUCCESS (EnqueueMarker, (this, &ev));
571 XPUSH_NEW_OBJ ("OpenCL::Event", ev); 615 XPUSH_NEW_OBJ ("OpenCL::Event", ev);
572}
573 616
574void 617void
575enqueue_wait_for_events (OpenCL::Queue this, ...) 618enqueue_wait_for_events (OpenCL::Queue this, ...)
576 CODE: 619 CODE:
 /* Calls clEnqueueWaitForEvents on queue `this`; NEED_SUCCESS croaks if the call returns non-zero. Nothing is returned to Perl. */
577{
 /* NOTE(review): EVENT_LIST is defined elsewhere; presumably it turns the arguments after `this` into event_list_count / event_list_ptr -- confirm. */
578 EVENT_LIST (1, items - 1); 620 EVENT_LIST (1, items - 1);
579 NEED_SUCCESS (EnqueueWaitForEvents, (this, event_list_count, event_list_ptr)); 621 NEED_SUCCESS (EnqueueWaitForEvents, (this, event_list_count, event_list_ptr));
580}
581 622
582void 623void
583enqueue_barrier (OpenCL::Queue this) 624enqueue_barrier (OpenCL::Queue this)
584 CODE: 625 CODE:
 /* Calls clEnqueueBarrier on queue `this`; NEED_SUCCESS croaks if the call returns non-zero. */
585 NEED_SUCCESS (EnqueueBarrier, (this)); 626 NEED_SUCCESS (EnqueueBarrier, (this));
636 NEED_SUCCESS (BuildProgram, (this, 1, &device, SvPVbyte_nolen (options), 0, 0)); 677 NEED_SUCCESS (BuildProgram, (this, 1, &device, SvPVbyte_nolen (options), 0, 0));
637 678
638void 679void
639build_info (OpenCL::Program this, OpenCL::Device device, cl_program_build_info name) 680build_info (OpenCL::Program this, OpenCL::Device device, cl_program_build_info name)
640 PPCODE: 681 PPCODE:
 /* Returns the raw bytes of build-info item `name` for program `this` on `device` as one mortal Perl scalar. */
 /* clGetProgramBuildInfo is called twice: first to learn the size, then to fill the buffer. Either call croaks via NEED_SUCCESS on a non-zero result. */
641{
642 size_t size; 682 size_t size;
643 SV *sv;
644
 /* first call: no buffer is passed, only the required size is queried */
645 NEED_SUCCESS (GetProgramBuildInfo, (this, device, name, 0, 0, &size)); 683 NEED_SUCCESS (GetProgramBuildInfo, (this, device, name, 0, 0, &size));
 /* the new revision declares sv at this point instead of at the top of the block */
646 sv = sv_2mortal (newSV (size)); 684 SV *sv = sv_2mortal (newSV (size));
647 SvUPGRADE (sv, SVt_PV); 685 SvUPGRADE (sv, SVt_PV);
648 SvPOK_only (sv); 686 SvPOK_only (sv);
 /* the scalar's length is set to the full reported size; nothing is trimmed */
649 SvCUR_set (sv, size); 687 SvCUR_set (sv, size);
 /* second call: OpenCL writes directly into the scalar's string buffer */
650 NEED_SUCCESS (GetProgramBuildInfo, (this, device, name, size, SvPVX (sv), 0)); 688 NEED_SUCCESS (GetProgramBuildInfo, (this, device, name, size, SvPVX (sv), 0));
651 XPUSHs (sv); 689 XPUSHs (sv);
652}
653 690
654void 691void
655kernel (OpenCL::Program program, SV *function) 692kernel (OpenCL::Program program, SV *function)
656 PPCODE: 693 PPCODE:
 /* Creates a kernel for the function named by `function` (read as a byte string) in `program` via clCreateKernel and pushes it as class "OpenCL::Kernel". */
657{
658 cl_int res;
 /* The old revision declares a local res and checks it by hand; the new revision passes the same call to NEED_SUCCESS_ARG. */
 /* NOTE(review): NEED_SUCCESS_ARG is defined elsewhere; presumably it declares `kernel`, stores the status in the file-level `res` and croaks on failure -- confirm. */
659 cl_kernel kernel = clCreateKernel (program, SvPVbyte_nolen (function), &res); 694 NEED_SUCCESS_ARG (cl_kernel kernel, CreateKernel, (program, SvPVbyte_nolen (function), &res));
660
661 if (res)
662 FAIL (CreateKernel, res);
663
664 XPUSH_NEW_OBJ ("OpenCL::Kernel", kernel); 695 XPUSH_NEW_OBJ ("OpenCL::Kernel", kernel);
665}
666 696
667MODULE = OpenCL PACKAGE = OpenCL::Kernel 697MODULE = OpenCL PACKAGE = OpenCL::Kernel
668 698
669void 699void
670DESTROY (OpenCL::Kernel this) 700DESTROY (OpenCL::Kernel this)
725set_float (OpenCL::Kernel this, cl_uint idx, cl_float value) 755set_float (OpenCL::Kernel this, cl_uint idx, cl_float value)
726 CODE: 756 CODE:
727 clSetKernelArg (this, idx, sizeof (value), &value); 757 clSetKernelArg (this, idx, sizeof (value), &value);
728 758
729void 759void
760set_double (OpenCL::Kernel this, cl_uint idx, cl_double value)
761 CODE:
 /* Sets kernel argument `idx` of `this` to the cl_double `value` via clSetKernelArg. This XSUB exists only in the new revision. */
 /* NOTE(review): the return value of clSetKernelArg is not checked, so a failure is silent here -- confirm this is intended. */
762 clSetKernelArg (this, idx, sizeof (value), &value);
763
764void
730set_memory (OpenCL::Kernel this, cl_uint idx, OpenCL::Memory_ornull value) 765set_memory (OpenCL::Kernel this, cl_uint idx, OpenCL::Memory_ornull value)
731 CODE: 766 CODE:
 /* Sets kernel argument `idx` of `this` to the memory object handle `value`; the handle itself (sizeof (value) bytes) is passed to clSetKernelArg. */
 /* NOTE(review): the _ornull type name suggests undef is accepted and passed as a null handle -- confirm against the typemap. The return value of clSetKernelArg is not checked. */
732 clSetKernelArg (this, idx, sizeof (value), &value); 767 clSetKernelArg (this, idx, sizeof (value), &value);
733 768
734void 769void
771void 806void
772wait (OpenCL::Event this) 807wait (OpenCL::Event this)
773 CODE: 808 CODE:
 /* Calls clWaitForEvents on the single event `this`. */
 /* NOTE(review): the return value of clWaitForEvents is not checked, so an error is not reported to the caller -- confirm this is intended. */
774 clWaitForEvents (1, &this); 809 clWaitForEvents (1, &this);
775 810
811MODULE = OpenCL PACKAGE = OpenCL::UserEvent
812
813void
814set_status (OpenCL::UserEvent this, cl_int execution_status)
815 CODE:
 /* Passes `execution_status` to clSetUserEventStatus for the user event `this`. This XSUB exists only in the new revision. */
 /* NOTE(review): the return value of clSetUserEventStatus is not checked, so a failure is silent here -- confirm this is intended. */
816 clSetUserEventStatus (this, execution_status);
817

Diff Legend

- Removed lines
+ Added lines
< Changed lines
> Changed lines