… | |
… | |
157 | $id = get_global_id (0); |
157 | $id = get_global_id (0); |
158 | output [id] = input [id] * input [id]; |
158 | output [id] = input [id] * input [id]; |
159 | } |
159 | } |
160 | '; |
160 | '; |
161 | |
161 | |
162 | my $prog = $ctx->program_with_source ($src); |
162 | my $prog = $ctx->build_program ($src); |
163 | |
|
|
164 | # build croaks on compile errors, so catch it and print the compile errors |
|
|
165 | eval { $prog->build ($dev, "-cl-fast-relaxed-math"); 1 } |
|
|
166 | or die $prog->build_log; |
|
|
167 | |
|
|
168 | my $kernel = $prog->kernel ("squareit"); |
163 | my $kernel = $prog->kernel ("squareit"); |
169 | |
164 | |
170 | =head2 Create some input and output float buffers, then call the |
165 | =head2 Create some input and output float buffers, then call the |
171 | 'squareit' kernel on them. |
166 | 'squareit' kernel on them. |
172 | |
167 | |
… | |
… | |
267 | |
262 | |
268 | float3 colour = (float3)(z.x, z.y, z.x * z.y); |
263 | float3 colour = (float3)(z.x, z.y, z.x * z.y); |
269 | write_imagef (img, (int2)(get_global_id (0), get_global_id (1)), (float4)(colour * p.x * p.x, 1.)); |
264 | write_imagef (img, (int2)(get_global_id (0), get_global_id (1)), (float4)(colour * p.x * p.x, 1.)); |
270 | } |
265 | } |
271 | EOF |
266 | EOF |
|
|
267 | |
272 | my $prog = $ctx->program_with_source ($src); |
268 | my $prog = $ctx->build_program ($src); |
273 | eval { $prog->build ($dev); 1 } |
|
|
274 | or die $prog->build_log ($dev); |
|
|
275 | |
|
|
276 | my $kernel = $prog->kernel ("juliatunnel"); |
269 | my $kernel = $prog->kernel ("juliatunnel"); |
277 | |
270 | |
278 | # program compiled, kernel ready, now draw and loop |
271 | # program compiled, kernel ready, now draw and loop |
279 | |
272 | |
280 | for (my $time; ; ++$time) { |
273 | for (my $time; ; ++$time) { |
… | |
… | |
383 | |
376 | |
384 | For this to work, the OpenGL library must be loaded, a GLX context must |
377 | For this to work, the OpenGL library must be loaded, a GLX context must |
385 | have been created and be made current, and C<dlsym> must be available and |
378 | have been created and be made current, and C<dlsym> must be available and |
386 | capable of finding the function via C<RTLD_DEFAULT>. |
379 | capable of finding the function via C<RTLD_DEFAULT>. |
387 | |
380 | |
|
|
381 | =cut |
|
|
382 | |
|
|
383 | package OpenCL; |
|
|
384 | |
|
|
385 | use common::sense; |
|
|
386 | |
|
|
387 | BEGIN { |
|
|
388 | our $VERSION = '0.96'; |
|
|
389 | |
|
|
390 | require XSLoader; |
|
|
391 | XSLoader::load (__PACKAGE__, $VERSION); |
|
|
392 | |
|
|
393 | @OpenCL::Platform::ISA = |
|
|
394 | @OpenCL::Device::ISA = |
|
|
395 | @OpenCL::Context::ISA = |
|
|
396 | @OpenCL::Queue::ISA = |
|
|
397 | @OpenCL::Memory::ISA = |
|
|
398 | @OpenCL::Sampler::ISA = |
|
|
399 | @OpenCL::Program::ISA = |
|
|
400 | @OpenCL::Kernel::ISA = |
|
|
401 | @OpenCL::Event::ISA = OpenCL::Object::; |
|
|
402 | |
|
|
403 | @OpenCL::Buffer::ISA = |
|
|
404 | @OpenCL::Image::ISA = OpenCL::Memory::; |
|
|
405 | |
|
|
406 | @OpenCL::BufferObj::ISA = OpenCL::Buffer::; |
|
|
407 | |
|
|
408 | @OpenCL::Image2D::ISA = |
|
|
409 | @OpenCL::Image3D::ISA = |
|
|
410 | @OpenCL::Image2DArray::ISA = |
|
|
411 | @OpenCL::Image1D::ISA = |
|
|
412 | @OpenCL::Image1DArray::ISA = |
|
|
413 | @OpenCL::Image1DBuffer::ISA = OpenCL::Image::; |
|
|
414 | |
|
|
415 | @OpenCL::UserEvent::ISA = OpenCL::Event::; |
|
|
416 | } |
|
|
417 | |
388 | =head2 THE OpenCL PACKAGE |
418 | =head2 THE OpenCL PACKAGE |
389 | |
419 | |
390 | =over 4 |
420 | =over 4 |
391 | |
421 | |
392 | =item $int = OpenCL::errno |
422 | =item $int = OpenCL::errno |
… | |
… | |
424 | |
454 | |
425 | L<http://www.khronos.org/registry/cl/sdk/1.1/docs/man/xhtml/clWaitForEvents.html> |
455 | L<http://www.khronos.org/registry/cl/sdk/1.1/docs/man/xhtml/clWaitForEvents.html> |
426 | |
456 | |
427 | =back |
457 | =back |
428 | |
458 | |
|
|
459 | =head2 THE OpenCL::Object CLASS |
|
|
460 | |
|
|
461 | This is the base class for all objects in the OpenCL module. The only |
|
|
462 | method it implements is the C<id> method, which is only useful if you want |
|
|
463 | to interface to OpenCL on the C level. |
|
|
464 | |
|
|
465 | =over 4 |
|
|
466 | |
|
|
467 | =item $iv = $obj->id |
|
|
468 | |
|
|
469 | OpenCL objects are represented by pointers or integers on the C level. If |
|
|
470 | you want to interface to an OpenCL object directly on the C level, then |
|
|
471 | you need this value, which is returned by this method. You should use an |
|
|
472 | C<IV> type in your code and cast that to the correct type. |
|
|
473 | |
|
|
474 | =cut |
|
|
475 | |
|
|
476 | sub OpenCL::Object::id { |
|
|
477 | ${$_[0]} |
|
|
478 | } |
|
|
479 | |
|
|
480 | =back |
|
|
481 | |
429 | =head2 THE OpenCL::Platform CLASS |
482 | =head2 THE OpenCL::Platform CLASS |
430 | |
483 | |
431 | =over 4 |
484 | =over 4 |
432 | |
485 | |
433 | =item @devices = $platform->devices ($type = OpenCL::DEVICE_TYPE_ALL) |
486 | =item @devices = $platform->devices ($type = OpenCL::DEVICE_TYPE_ALL) |
… | |
… | |
456 | It's best to avoid this method and use one of the following convenience |
509 | It's best to avoid this method and use one of the following convenience |
457 | wrappers. |
510 | wrappers. |
458 | |
511 | |
459 | L<http://www.khronos.org/registry/cl/sdk/1.1/docs/man/xhtml/clGetPlatformInfo.html> |
512 | L<http://www.khronos.org/registry/cl/sdk/1.1/docs/man/xhtml/clGetPlatformInfo.html> |
460 | |
513 | |
|
|
514 | =item $platform->unload_compiler |
|
|
515 | |
|
|
516 | Attempts to unload the compiler for this platform, for endless |
|
|
517 | profit. Does nothing on OpenCL 1.1. |
|
|
518 | |
|
|
519 | L<http://www.khronos.org/registry/cl/sdk/1.2/docs/man/xhtml/clUnloadPlatformCompiler.html> |
|
|
520 | |
461 | =for gengetinfo begin platform |
521 | =for gengetinfo begin platform |
462 | |
522 | |
463 | =item $string = $platform->profile |
523 | =item $string = $platform->profile |
464 | |
524 | |
465 | Calls C<clGetPlatformInfo> with C<CL_PLATFORM_PROFILE> and returns the result. |
525 | Calls C<clGetPlatformInfo> with C<CL_PLATFORM_PROFILE> and returns the result. |
… | |
… | |
765 | =back |
825 | =back |
766 | |
826 | |
767 | =head2 THE OpenCL::Context CLASS |
827 | =head2 THE OpenCL::Context CLASS |
768 | |
828 | |
769 | =over 4 |
829 | =over 4 |
|
|
830 | |
|
|
831 | =item $prog = $ctx->build_program ($program, $options = "") |
|
|
832 | |
|
|
833 | This convenience function tries to build the program on all devices in |
|
|
834 | the context. If the build fails, then the function will C<croak> with the |
|
|
835 | build log. Otherwise it returns the program object. |
|
|
836 | |
|
|
837 | The C<$program> can either be a C<OpenCL::Program> object or a string |
|
|
838 | containing the program. In the latter case, a program object will be |
|
|
839 | created automatically. |
|
|
840 | |
|
|
841 | =cut |
|
|
842 | |
|
|
843 | sub OpenCL::Context::build_program { |
|
|
844 | my ($self, $prog, $options) = @_; |
|
|
845 | |
|
|
846 | $prog = $self->program_with_source ($prog) |
|
|
847 | unless ref $prog; |
|
|
848 | |
|
|
849 | for my $dev ($self->devices) { |
|
|
850 | eval { $prog->build ($dev, $options); 1 } |
|
|
851 | or Carp::croak "Building OpenCL program for device '" . $dev->name . "' failed:\n" |
|
|
852 | . $prog->build_log ($dev); |
|
|
853 | } |
|
|
854 | |
|
|
855 | $prog |
|
|
856 | } |
770 | |
857 | |
771 | =item $queue = $ctx->queue ($device, $properties) |
858 | =item $queue = $ctx->queue ($device, $properties) |
772 | |
859 | |
773 | Create a new OpenCL::Queue object from the context and the given device. |
860 | Create a new OpenCL::Queue object from the context and the given device. |
774 | |
861 | |
… | |
… | |
793 | |
880 | |
794 | =item $buf = $ctx->buffer_sv ($flags, $data) |
881 | =item $buf = $ctx->buffer_sv ($flags, $data) |
795 | |
882 | |
796 | Creates a new OpenCL::Buffer (actually OpenCL::BufferObj) object and |
883 | Creates a new OpenCL::Buffer (actually OpenCL::BufferObj) object and |
797 | initialise it with the given data values. |
884 | initialise it with the given data values. |
|
|
885 | |
|
|
886 | =item $img = $ctx->image ($flags, $channel_order, $channel_type, $type, $width, $height, $depth, $array_size = 0, $row_pitch = 0, $slice_pitch = 0, $num_mip_level = 0, $num_samples = 0, $data = undef) |
|
|
887 | |
|
|
888 | Creates a new OpenCL::Image object and optionally initialises it with |
|
|
889 | the given data values. |
|
|
890 | |
|
|
891 | L<http://www.khronos.org/registry/cl/sdk/1.2/docs/man/xhtml/clCreateImage.html> |
798 | |
892 | |
799 | =item $img = $ctx->image2d ($flags, $channel_order, $channel_type, $width, $height, $row_pitch = 0, $data = undef) |
893 | =item $img = $ctx->image2d ($flags, $channel_order, $channel_type, $width, $height, $row_pitch = 0, $data = undef) |
800 | |
894 | |
801 | Creates a new OpenCL::Image2D object and optionally initialises it with |
895 | Creates a new OpenCL::Image2D object and optionally initialises it with |
802 | the given data values. |
896 | the given data values. |
… | |
… | |
966 | |
1060 | |
967 | Yeah. |
1061 | Yeah. |
968 | |
1062 | |
969 | L<http://www.khronos.org/registry/cl/sdk/1.1/docs/man/xhtml/clEnqueueCopyBufferToImage.html>. |
1063 | L<http://www.khronos.org/registry/cl/sdk/1.1/docs/man/xhtml/clEnqueueCopyBufferToImage.html>. |
970 | |
1064 | |
|
|
1065 | =item $ev = $queue->enqueue_fill_buffer ($mem, $pattern, $offset, $size, ...) |
|
|
1066 | |
|
|
1067 | Fills the given buffer object with repeated applications of C<$pattern>, |
|
|
1068 | starting at C<$offset> for C<$size> octets. |
|
|
1069 | |
|
|
1070 | L<http://www.khronos.org/registry/cl/sdk/1.2/docs/man/xhtml/clEnqueueFillBuffer.html> |
|
|
1071 | |
|
|
1072 | =item $ev = $queue->enqueue_fill_image ($img, $r, $g, $b, $a, $x, $y, $z, $width, $height, $depth, ...) |
|
|
1073 | |
|
|
1074 | Fills the given image area with the given rgba colour components. The |
|
|
1075 | components are normally floating point values between C<0> and C<1>, |
|
|
1076 | except when the image channel data type is a signed or unsigned |
|
|
1077 | unnormalised format, in which case the range is determined by the format. |
|
|
1078 | |
|
|
1079 | L<http://www.khronos.org/registry/cl/sdk/1.2/docs/man/xhtml/clEnqueueFillImage.html> |
|
|
1080 | |
971 | =item $ev = $queue->enqueue_task ($kernel, $wait_events...) |
1081 | =item $ev = $queue->enqueue_task ($kernel, $wait_events...) |
972 | |
1082 | |
973 | L<http://www.khronos.org/registry/cl/sdk/1.1/docs/man/xhtml/clEnqueueTask.html> |
1083 | L<http://www.khronos.org/registry/cl/sdk/1.1/docs/man/xhtml/clEnqueueTask.html> |
974 | |
1084 | |
975 | =item $ev = $queue->enqueue_nd_range_kernel ($kernel, @$global_work_offset, @$global_work_size, @$local_work_size, $wait_events...) |
1085 | =item $ev = $queue->enqueue_nd_range_kernel ($kernel, @$global_work_offset, @$global_work_size, @$local_work_size, $wait_events...) |
… | |
… | |
1143 | OpenCL::Image1DArray, OpenCL::Image1DBuffer, OpenCL::Image2D, |
1253 | OpenCL::Image1DArray, OpenCL::Image1DBuffer, OpenCL::Image2D, |
1144 | OpenCL::Image2DArray and OpenCL::Image3D. |
1254 | OpenCL::Image2DArray and OpenCL::Image3D. |
1145 | |
1255 | |
1146 | =over 4 |
1256 | =over 4 |
1147 | |
1257 | |
1148 | =item $packed_value = $ev->image_info ($name) |
1258 | =item $packed_value = $image->image_info ($name) |
1149 | |
1259 | |
1150 | See C<< $platform->info >> for details. |
1260 | See C<< $platform->info >> for details. |
1151 | |
1261 | |
1152 | The reason this method is not called C<info> is that there already is an |
1262 | The reason this method is not called C<info> is that there already is an |
1153 | C<< ->info >> method inherited from C<OpenCL::Memory>. |
1263 | C<< ->info >> method inherited from C<OpenCL::Memory>. |
1154 | |
1264 | |
1155 | L<http://www.khronos.org/registry/cl/sdk/1.1/docs/man/xhtml/clGetImageInfo.html> |
1265 | L<http://www.khronos.org/registry/cl/sdk/1.1/docs/man/xhtml/clGetImageInfo.html> |
1156 | |
1266 | |
|
|
1267 | =item ($channel_order, $channel_data_type) = $image->format |
|
|
1268 | |
|
|
1269 | Returns the channel order and type used to create the image by calling |
|
|
1270 | C<clGetImageInfo> with C<CL_IMAGE_FORMAT>. |
|
|
1271 | |
1157 | =for gengetinfo begin image |
1272 | =for gengetinfo begin image |
1158 | |
1273 | |
1159 | =item $int = $image->element_size |
1274 | =item $int = $image->element_size |
1160 | |
1275 | |
1161 | Calls C<clGetImageInfo> with C<CL_IMAGE_ELEMENT_SIZE> and returns the result. |
1276 | Calls C<clGetImageInfo> with C<CL_IMAGE_ELEMENT_SIZE> and returns the result. |
… | |
… | |
1236 | |
1351 | |
1237 | =over 4 |
1352 | =over 4 |
1238 | |
1353 | |
1239 | =item $program->build ($device, $options = "") |
1354 | =item $program->build ($device, $options = "") |
1240 | |
1355 | |
1241 | Tries to build the program with the givne options. |
1356 | Tries to build the program with the given options. See also the |
|
|
1357 | C<< $ctx->build_program >> convenience function. |
1242 | |
1358 | |
1243 | L<http://www.khronos.org/registry/cl/sdk/1.1/docs/man/xhtml/clBuildProgram.html> |
1359 | L<http://www.khronos.org/registry/cl/sdk/1.1/docs/man/xhtml/clBuildProgram.html> |
1244 | |
1360 | |
1245 | =item $packed_value = $program->build_info ($device, $name) |
1361 | =item $packed_value = $program->build_info ($device, $name) |
1246 | |
1362 | |
… | |
… | |
1253 | |
1369 | |
1254 | Creates an OpenCL::Kernel object out of the named C<__kernel> function in |
1370 | Creates an OpenCL::Kernel object out of the named C<__kernel> function in |
1255 | the program. |
1371 | the program. |
1256 | |
1372 | |
1257 | L<http://www.khronos.org/registry/cl/sdk/1.1/docs/man/xhtml/clCreateKernel.html> |
1373 | L<http://www.khronos.org/registry/cl/sdk/1.1/docs/man/xhtml/clCreateKernel.html> |
|
|
1374 | |
|
|
1375 | =item @kernels = $program->kernels_in_program |
|
|
1376 | |
|
|
1377 | Returns all kernels successfully compiled for all devices in the program. |
|
|
1378 | |
|
|
1379 | L<http://www.khronos.org/registry/cl/sdk/1.1/docs/man/xhtml/clCreateKernelsInProgram.html> |
1258 | |
1380 | |
1259 | =for gengetinfo begin program_build |
1381 | =for gengetinfo begin program_build |
1260 | |
1382 | |
1261 | =item $build_status = $program->build_status ($device) |
1383 | =item $build_status = $program->build_status ($device) |
1262 | |
1384 | |
… | |
… | |
1398 | float and double as floating point values, memory/buffer/image2d/image3d |
1520 | float and double as floating point values, memory/buffer/image2d/image3d |
1399 | must be an object of that type or C<undef>, local-memory arguments are |
1521 | must be an object of that type or C<undef>, local-memory arguments are |
1400 | set by specifying the size, and sampler and event must be objects of that |
1522 | set by specifying the size, and sampler and event must be objects of that |
1401 | type. |
1523 | type. |
1402 | |
1524 | |
|
|
1525 | Setting an argument for a kernel does NOT keep a reference to the object - |
|
|
1526 | for example, if you set an argument to some image object, free the image, |
|
|
1527 | and call the kernel, you will run into undefined behaviour. |
|
|
1528 | |
1403 | L<http://www.khronos.org/registry/cl/sdk/1.1/docs/man/xhtml/clSetKernelArg.html> |
1529 | L<http://www.khronos.org/registry/cl/sdk/1.1/docs/man/xhtml/clSetKernelArg.html> |
1404 | |
1530 | |
1405 | =back |
1531 | =back |
1406 | |
1532 | |
1407 | =head2 THE OpenCL::Event CLASS |
1533 | =head2 THE OpenCL::Event CLASS |
… | |
… | |
1490 | |
1616 | |
1491 | =back |
1617 | =back |
1492 | |
1618 | |
1493 | =cut |
1619 | =cut |
1494 | |
1620 | |
1495 | package OpenCL; |
|
|
1496 | |
|
|
1497 | use common::sense; |
|
|
1498 | |
|
|
1499 | BEGIN { |
|
|
1500 | our $VERSION = '0.96'; |
|
|
1501 | |
|
|
1502 | require XSLoader; |
|
|
1503 | XSLoader::load (__PACKAGE__, $VERSION); |
|
|
1504 | |
|
|
1505 | @OpenCL::Buffer::ISA = |
|
|
1506 | @OpenCL::Image::ISA = OpenCL::Memory::; |
|
|
1507 | |
|
|
1508 | @OpenCL::BufferObj::ISA = OpenCL::Buffer::; |
|
|
1509 | |
|
|
1510 | @OpenCL::Image2D::ISA = |
|
|
1511 | @OpenCL::Image3D::ISA = |
|
|
1512 | @OpenCL::Image2DArray::ISA = |
|
|
1513 | @OpenCL::Image1D::ISA = |
|
|
1514 | @OpenCL::Image1DArray::ISA = |
|
|
1515 | @OpenCL::Image1DBuffer::ISA = OpenCL::Image::; |
|
|
1516 | |
|
|
1517 | @OpenCL::UserEvent::ISA = OpenCL::Event::; |
|
|
1518 | } |
|
|
1519 | |
|
|
1520 | 1; |
1621 | 1; |
1521 | |
1622 | |
1522 | =head1 AUTHOR |
1623 | =head1 AUTHOR |
1523 | |
1624 | |
1524 | Marc Lehmann <schmorp@schmorp.de> |
1625 | Marc Lehmann <schmorp@schmorp.de> |