… | |
… | |
13 | // in addition, you cannot test for this in any future-proof way. |
13 | // in addition, you cannot test for this in any future-proof way. |
14 | // each time a new opencl version comes out, you need to make a new |
14 | // each time a new opencl version comes out, you need to make a new |
15 | // release. |
15 | // release. |
16 | #define CL_USE_DEPRECATED_OPENCL_1_2_APIS /* just guessing, you stupid idiots */ |
16 | #define CL_USE_DEPRECATED_OPENCL_1_2_APIS /* just guessing, you stupid idiots */ |
17 | |
17 | |
18 | #ifndef PREFER_1_! |
18 | #ifndef PREFER_1_1 |
19 | #define PREFER_1_1 1 |
19 | #define PREFER_1_1 1 |
20 | #endif |
20 | #endif |
21 | |
21 | |
22 | #if PREFER_1_1 |
22 | #if PREFER_1_1 |
23 | #define CL_USE_DEPRECATED_OPENCL_1_1_APIS |
23 | #define CL_USE_DEPRECATED_OPENCL_1_1_APIS |
… | |
… | |
400 | |
400 | |
401 | void |
401 | void |
402 | info (OpenCL::Platform self, cl_platform_info name) |
402 | info (OpenCL::Platform self, cl_platform_info name) |
403 | PPCODE: |
403 | PPCODE: |
404 | INFO (Platform) |
404 | INFO (Platform) |
|
|
405 | |
|
|
406 | void |
|
|
407 | unload_compiler (OpenCL::Platform self) |
|
|
408 | CODE: |
|
|
409 | #if CL_VERSION_1_2 |
|
|
410 | clUnloadPlatformCompiler (self); |
|
|
411 | #endif |
405 | |
412 | |
406 | #BEGIN:platform |
413 | #BEGIN:platform |
407 | |
414 | |
408 | void |
415 | void |
409 | profile (OpenCL::Platform self) |
416 | profile (OpenCL::Platform self) |
… | |
… | |
969 | NEED_SUCCESS (EnqueueWriteBuffer, (self, mem, blocking, offset, len, ptr, event_list_count, event_list_ptr, GIMME_V != G_VOID ? &ev : 0)); |
976 | NEED_SUCCESS (EnqueueWriteBuffer, (self, mem, blocking, offset, len, ptr, event_list_count, event_list_ptr, GIMME_V != G_VOID ? &ev : 0)); |
970 | |
977 | |
971 | if (ev) |
978 | if (ev) |
972 | XPUSH_NEW_OBJ ("OpenCL::Event", ev); |
979 | XPUSH_NEW_OBJ ("OpenCL::Event", ev); |
973 | |
980 | |
|
|
981 | #if CL_VERSION_1_2 |
|
|
982 | |
|
|
983 | void |
|
|
984 | enqueue_fill_buffer (OpenCL::Queue self, OpenCL::Buffer mem, SV *data, size_t offset, size_t size, ...) |
|
|
985 | PPCODE: |
|
|
986 | cl_event ev = 0; |
|
|
987 | STRLEN len; |
|
|
988 | char *ptr = SvPVbyte (data, len); |
|
|
989 | EVENT_LIST (5, items - 5); |
|
|
990 | |
|
|
991 | NEED_SUCCESS (EnqueueFillBuffer, (self, mem, ptr, len, offset, size, event_list_count, event_list_ptr, GIMME_V != G_VOID ? &ev : 0)); |
|
|
992 | |
|
|
993 | if (ev) |
|
|
994 | XPUSH_NEW_OBJ ("OpenCL::Event", ev); |
|
|
995 | |
|
|
996 | void |
|
|
997 | enqueue_fill_image (OpenCL::Queue self, OpenCL::Image img, NV r, NV g, NV b, NV a, size_t x, size_t y, size_t z, size_t width, size_t height, size_t depth, ...) |
|
|
998 | PPCODE: |
|
|
999 | cl_event ev = 0; |
|
|
1000 | STRLEN len; |
|
|
1001 | const size_t origin [3] = { x, y, z }; |
|
|
1002 | const size_t region [3] = { width, height, depth }; |
|
|
1003 | EVENT_LIST (12, items - 12); |
|
|
1004 | |
|
|
1005 | const cl_float c_f [4] = { r, g, b, a }; |
|
|
1006 | const cl_uint c_u [4] = { r, g, b, a }; |
|
|
1007 | const cl_int c_s [4] = { r, g, b, a }; |
|
|
1008 | const void *c_fus [3] = { &c_f, &c_u, &c_s }; |
|
|
1009 | static const char fus [] = { 0, 0, 0, 0, 0, 0, 0, 2, 2, 2, 1, 1, 1, 0, 0 }; |
|
|
1010 | cl_image_format format; |
|
|
1011 | NEED_SUCCESS (clGetImageInfo, (img, CL_IMAGE_FORMAT, sizeof (format), &format, 0)); |
|
|
1012 | assert (sizeof (fus) == CL_FLOAT + 1 - CL_SNORM_INT8); |
|
|
1013 | if (format.image_channel_data_type < CL_SNORM_INT8 || CL_FLOAT < format.image_channel_data_type) |
|
|
1014 | croak ("enqueue_fill_image: image has unsupported channel type, only opencl 1.2 channel types supported."); |
|
|
1015 | |
|
|
1016 | NEED_SUCCESS (EnqueueFillImage, (self, img, c_fus [fus [format.image_channel_data_type]], |
|
|
1017 | origin, region, event_list_count, event_list_ptr, GIMME_V != G_VOID ? &ev : 0)); |
|
|
1018 | |
|
|
1019 | if (ev) |
|
|
1020 | XPUSH_NEW_OBJ ("OpenCL::Event", ev); |
|
|
1021 | |
|
|
1022 | #endif |
|
|
1023 | |
974 | void |
1024 | void |
975 | enqueue_copy_buffer (OpenCL::Queue self, OpenCL::Buffer src, OpenCL::Buffer dst, size_t src_offset, size_t dst_offset, size_t len, ...) |
1025 | enqueue_copy_buffer (OpenCL::Queue self, OpenCL::Buffer src, OpenCL::Buffer dst, size_t src_offset, size_t dst_offset, size_t len, ...) |
976 | PPCODE: |
1026 | PPCODE: |
977 | cl_event ev = 0; |
1027 | cl_event ev = 0; |
978 | EVENT_LIST (6, items - 6); |
1028 | EVENT_LIST (6, items - 6); |
… | |
… | |
1243 | if (ev) |
1293 | if (ev) |
1244 | XPUSH_NEW_OBJ ("OpenCL::Event", ev); |
1294 | XPUSH_NEW_OBJ ("OpenCL::Event", ev); |
1245 | |
1295 | |
1246 | #endif |
1296 | #endif |
1247 | |
1297 | |
1248 | #if !CL_VERSION_1_2 || defined CL_USE_DEPRECATED_OPENCL_1_1_APIS |
|
|
1249 | |
|
|
1250 | void |
1298 | void |
1251 | enqueue_wait_for_events (OpenCL::Queue self, ...) |
1299 | enqueue_wait_for_events (OpenCL::Queue self, ...) |
1252 | CODE: |
1300 | CODE: |
1253 | EVENT_LIST (1, items - 1); |
1301 | EVENT_LIST (1, items - 1); |
|
|
1302 | #if PREFER_1_1 |
1254 | NEED_SUCCESS (EnqueueWaitForEvents, (self, event_list_count, event_list_ptr)); |
1303 | NEED_SUCCESS (EnqueueWaitForEvents, (self, event_list_count, event_list_ptr)); |
1255 | |
1304 | #else |
|
|
1305 | NEED_SUCCESS (EnqueueBarrierWithWaitList, (self, event_list_count, event_list_ptr, 0)); |
1256 | #endif |
1306 | #endif |
1257 | |
1307 | |
1258 | void |
1308 | void |
1259 | enqueue_marker (OpenCL::Queue self, ...) |
1309 | enqueue_marker (OpenCL::Queue self, ...) |
1260 | PPCODE: |
1310 | PPCODE: |
1261 | cl_event ev = 0; |
1311 | cl_event ev = 0; |
1262 | EVENT_LIST (1, items - 1); |
1312 | EVENT_LIST (1, items - 1); |
|
|
1313 | #if PREFER_1_1 |
|
|
1314 | if (!event_list_count) |
|
|
1315 | NEED_SUCCESS (EnqueueMarker, (self, GIMME_V != G_VOID ? &ev : 0)); |
|
|
1316 | else |
1263 | #if CL_VERSION_1_2 |
1317 | #if CL_VERSION_1_2 |
|
|
1318 | NEED_SUCCESS (EnqueueMarkerWithWaitList, (self, event_list_count, event_list_ptr, GIMME_V != G_VOID ? &ev : 0)); |
|
|
1319 | #else |
|
|
1320 | NEED_SUCCESS (EnqueueWaitForEvents, (self, event_list_count, event_list_ptr, GIMME_V != G_VOID ? &ev : 0)); // also a barrier |
|
|
1321 | #endif |
|
|
1322 | #else |
1264 | NEED_SUCCESS (EnqueueMarkerWithWaitList, (self, event_list_count, event_list_ptr, GIMME_V != G_VOID ? &ev : 0)); |
1323 | NEED_SUCCESS (EnqueueMarkerWithWaitList, (self, event_list_count, event_list_ptr, GIMME_V != G_VOID ? &ev : 0)); |
1265 | #else |
|
|
1266 | if (event_list_count) |
|
|
1267 | croak ("OpenCL::Queue->enqueue_marker does not support a wait list in OpenCL 1.1 - upgrade to 1.2"); |
|
|
1268 | NEED_SUCCESS (EnqueueMarker, (self, GIMME_V != G_VOID ? &ev : 0)); |
|
|
1269 | #endif |
1324 | #endif |
1270 | if (ev) |
1325 | if (ev) |
1271 | XPUSH_NEW_OBJ ("OpenCL::Event", ev); |
1326 | XPUSH_NEW_OBJ ("OpenCL::Event", ev); |
1272 | |
1327 | |
1273 | void |
1328 | void |
1274 | enqueue_barrier (OpenCL::Queue self, ...) |
1329 | enqueue_barrier (OpenCL::Queue self, ...) |
1275 | PPCODE: |
1330 | PPCODE: |
1276 | cl_event ev = 0; |
1331 | cl_event ev = 0; |
1277 | EVENT_LIST (1, items - 1); |
1332 | EVENT_LIST (1, items - 1); |
|
|
1333 | #if PREFER_1_1 |
|
|
1334 | if (!event_list_count && GIMME_V == G_VOID) |
|
|
1335 | NEED_SUCCESS (EnqueueBarrier, (self)); |
|
|
1336 | else |
1278 | #if CL_VERSION_1_2 |
1337 | #if CL_VERSION_1_2 |
1279 | NEED_SUCCESS (EnqueueBarrierWithWaitList, (self, event_list_count, event_list_ptr, &ev)); |
1338 | NEED_SUCCESS (EnqueueBarrierWithWaitList, (self, event_list_count, event_list_ptr, GIMME_V != G_VOID ? &ev : 0)); |
1280 | #else |
1339 | #else |
|
|
1340 | { |
1281 | if (event_list_count) |
1341 | if (event_list_count) |
1282 | croak ("OpenCL::Queue->enqueue_barrier does not support a wait list in OpenCL 1.1 - upgrade to 1.2"); |
1342 | NEED_SUCCESS (EnqueueWaitForEvents, (self, event_list_count, event_list_ptr, GIMME_V != G_VOID ? &ev : 0)); |
|
|
1343 | |
1283 | if (GIMME_V != G_VOID) |
1344 | if (GIMME_V != G_VOID) |
1284 | croak ("OpenCL::Queue->enqueue_barrier does not return an event object in OpenCL 1.1 - upgrade to 1.2"); |
|
|
1285 | NEED_SUCCESS (EnqueueBarrier, (self)); |
1345 | NEED_SUCCESS (EnqueueMarker, (self, &ev)); |
|
|
1346 | } |
|
|
1347 | #endif |
|
|
1348 | #else |
|
|
1349 | NEED_SUCCESS (EnqueueBarrierWithWaitList, (self, event_list_count, event_list_ptr, GIMME_V != G_VOID ? &ev : 0)); |
1286 | #endif |
1350 | #endif |
1287 | if (ev) |
1351 | if (ev) |
1288 | XPUSH_NEW_OBJ ("OpenCL::Event", ev); |
1352 | XPUSH_NEW_OBJ ("OpenCL::Event", ev); |
1289 | |
1353 | |
1290 | void |
1354 | void |
… | |
… | |
1470 | void |
1534 | void |
1471 | image_info (OpenCL::Image self, cl_image_info name) |
1535 | image_info (OpenCL::Image self, cl_image_info name) |
1472 | PPCODE: |
1536 | PPCODE: |
1473 | INFO (Image) |
1537 | INFO (Image) |
1474 | |
1538 | |
|
|
1539 | void |
|
|
1540 | format (OpenCL::Image self) |
|
|
1541 | PPCODE: |
|
|
1542 | cl_image_format format; |
|
|
1543 | NEED_SUCCESS (GetImageInfo, (self, CL_IMAGE_FORMAT, sizeof (format), &format, 0)); |
|
|
1544 | EXTEND (SP, 2); |
|
|
1545 | PUSHs (sv_2mortal (newSVuv (format.image_channel_order))); |
|
|
1546 | PUSHs (sv_2mortal (newSVuv (format.image_channel_data_type))); |
|
|
1547 | |
1475 | #BEGIN:image |
1548 | #BEGIN:image |
1476 | |
1549 | |
1477 | void |
1550 | void |
1478 | element_size (OpenCL::Image self) |
1551 | element_size (OpenCL::Image self) |
1479 | ALIAS: |
1552 | ALIAS: |
… | |
… | |
1636 | void |
1709 | void |
1637 | kernel (OpenCL::Program program, SV *function) |
1710 | kernel (OpenCL::Program program, SV *function) |
1638 | PPCODE: |
1711 | PPCODE: |
1639 | NEED_SUCCESS_ARG (cl_kernel kernel, CreateKernel, (program, SvPVbyte_nolen (function), &res)); |
1712 | NEED_SUCCESS_ARG (cl_kernel kernel, CreateKernel, (program, SvPVbyte_nolen (function), &res)); |
1640 | XPUSH_NEW_OBJ ("OpenCL::Kernel", kernel); |
1713 | XPUSH_NEW_OBJ ("OpenCL::Kernel", kernel); |
|
|
1714 | |
|
|
1715 | void |
|
|
1716 | kernels_in_program (OpenCL::Program program) |
|
|
1717 | PPCODE: |
|
|
1718 | cl_uint num_kernels; |
|
|
1719 | NEED_SUCCESS (CreateKernelsInProgram, (program, 0, 0, &num_kernels)); |
|
|
1720 | cl_kernel *kernels = tmpbuf (sizeof (cl_kernel) * num_kernels); |
|
|
1721 | NEED_SUCCESS (CreateKernelsInProgram, (program, num_kernels, kernels, 0)); |
|
|
1722 | |
|
|
1723 | int i; |
|
|
1724 | EXTEND (SP, num_kernels); |
|
|
1725 | for (i = 0; i < num_kernels; ++i) |
|
|
1726 | PUSHs (NEW_MORTAL_OBJ ("OpenCL::Kernel", kernels [i])); |
1641 | |
1727 | |
1642 | void |
1728 | void |
1643 | info (OpenCL::Program self, cl_program_info name) |
1729 | info (OpenCL::Program self, cl_program_info name) |
1644 | PPCODE: |
1730 | PPCODE: |
1645 | INFO (Program) |
1731 | INFO (Program) |