ViewVC Help
View File | Revision Log | Show Annotations | Download File
/cvs/OpenCL/OpenCL.pm
(Generate patch)

Comparing OpenCL/OpenCL.pm (file contents):
Revision 1.36 by root, Thu Apr 19 14:34:56 2012 UTC vs.
Revision 1.49 by root, Sat Apr 21 20:48:03 2012 UTC

160 '; 160 ';
161 161
162 my $prog = $ctx->program_with_source ($src); 162 my $prog = $ctx->program_with_source ($src);
163 163
164 # build croaks on compile errors, so catch it and print the compile errors 164 # build croaks on compile errors, so catch it and print the compile errors
165 eval { $prog->build ($dev); 1 } 165 eval { $prog->build ($dev, "-cl-fast-relaxed-math"); 1 }
166 or die $prog->build_log; 166 or die $prog->build_log;
167 167
168 my $kernel = $prog->kernel ("squareit"); 168 my $kernel = $prog->kernel ("squareit");
169 169
170=head2 Create some input and output float buffers, then call the 170=head2 Create some input and output float buffers, then call the
210 # enqueue an async read 210 # enqueue an async read
211 $ev = $queue->enqueue_read_buffer ($output, 0, 0, OpenCL::SIZEOF_FLOAT * 4, my $data, $ev); 211 $ev = $queue->enqueue_read_buffer ($output, 0, 0, OpenCL::SIZEOF_FLOAT * 4, my $data, $ev);
212 212
213 # wait for the last event to complete 213 # wait for the last event to complete
214 $ev->wait; 214 $ev->wait;
215
216=head2 Use the OpenGL module to share a texture between OpenCL and OpenGL and draw some julia
217set tunnel effect.
218
219This is quite a long example to get you going.
220
221 use OpenGL ":all";
222 use OpenCL;
223
224 # open a window and create a gl texture
225 OpenGL::glpOpenWindow width => 256, height => 256;
226 my $texid = glGenTextures_p 1;
227 glBindTexture GL_TEXTURE_2D, $texid;
228 glTexImage2D_c GL_TEXTURE_2D, 0, GL_RGBA8, 256, 256, 0, GL_RGBA, GL_UNSIGNED_BYTE, 0;
229
230 # find and use the first opencl device that lets us get a shared opengl context
231 my $platform;
232 my $dev;
233 my $ctx;
234
235 for (OpenCL::platforms) {
236 $platform = $_;
237 for ($platform->devices) {
238 $dev = $_;
239 $ctx = $platform->context ([OpenCL::GLX_DISPLAY_KHR, undef, OpenCL::GL_CONTEXT_KHR, undef], [$dev])
240 and last;
241 }
242 }
243
244 $ctx
245 or die "cannot find suitable OpenCL device\n";
246
247 my $queue = $ctx->queue ($dev);
248
249 # now attach an opencl image2d object to the opengl texture
250 my $tex = $ctx->gl_texture2d (OpenCL::MEM_WRITE_ONLY, GL_TEXTURE_2D, 0, $texid);
251
252 # now the boring opencl code
253 my $src = <<EOF;
254 kernel void
255 juliatunnel (write_only image2d_t img, float time)
256 {
257 float2 p = (float2)(get_global_id (0), get_global_id (1)) / 256.f * 2.f - 1.f;
258
259 float2 m = (float2)(1.f, p.y) / fabs (p.x);
260 m.x = fabs (fmod (m.x + time * 0.05f, 4.f)) - 2.f;
261
262 float2 z = m;
263 float2 c = (float2)(sin (time * 0.05005), cos (time * 0.06001));
264
265 for (int i = 0; i < 25 && dot (z, z) < 4.f; ++i)
266 z = (float2)(z.x * z.x - z.y * z.y, 2.f * z.x * z.y) + c;
267
268 float3 colour = (float3)(z.x, z.y, z.x * z.y);
269 write_imagef (img, (int2)(get_global_id (0), get_global_id (1)), (float4)(colour * p.x * p.x, 1.));
270 }
271 EOF
272 my $prog = $ctx->program_with_source ($src);
273 eval { $prog->build ($dev); 1 }
274 or die $prog->build_log ($dev);
275
276 my $kernel = $prog->kernel ("juliatunnel");
277
278 # program compiled, kernel ready, now draw and loop
279
280 for (my $time; ; ++$time) {
281 # acquire objects from opengl
282 $queue->enqueue_acquire_gl_objects ([$tex]);
283
284 # configure and run our kernel
285 $kernel->set_image2d (0, $tex);
286 $kernel->set_float (1, $time);
287 $queue->enqueue_nd_range_kernel ($kernel, undef, [256, 256], undef);
288
289 # release objects to opengl again
290 $queue->enqueue_release_gl_objects ([$tex]);
291
292 # wait
293 $queue->finish;
294
295 # now draw the texture, the defaults should be all right
296 glTexParameterf GL_TEXTURE_2D, GL_TEXTURE_MIN_FILTER, GL_NEAREST;
297
298 glEnable GL_TEXTURE_2D;
299 glBegin GL_QUADS;
300 glTexCoord2f 0, 1; glVertex3i -1, -1, -1;
301 glTexCoord2f 0, 0; glVertex3i 1, -1, -1;
302 glTexCoord2f 1, 0; glVertex3i 1, 1, -1;
303 glTexCoord2f 1, 1; glVertex3i -1, 1, -1;
304 glEnd;
305
306 glXSwapBuffers;
307
308 select undef, undef, undef, 1/60;
309 }
215 310
216=head1 DOCUMENTATION 311=head1 DOCUMENTATION
217 312
218=head2 BASIC CONVENTIONS 313=head2 BASIC CONVENTIONS
219 314
241=item * Structures are often specified by flattening out their components 336=item * Structures are often specified by flattening out their components
242as with short vectors, and returned as arrayrefs. 337as with short vectors, and returned as arrayrefs.
243 338
244=item * When enqueuing commands, the wait list is specified by adding 339=item * When enqueuing commands, the wait list is specified by adding
245extra arguments to the function - anywhere a C<$wait_events...> argument 340extra arguments to the function - anywhere a C<$wait_events...> argument
246is documented this can be any number of event objects. 341is documented this can be any number of event objects. As an extension
342implemented by this module, C<undef> values will be ignored in the event
343list.
247 344
248=item * When enqueuing commands, if the enqueue method is called in void 345=item * When enqueuing commands, if the enqueue method is called in void
249context, no event is created. In all other contexts an event is returned 346context, no event is created. In all other contexts an event is returned
250by the method. 347by the method.
251 348
275 372
276=head2 GLX SUPPORT 373=head2 GLX SUPPORT
277 374
278Due to the sad state that OpenGL support is in in Perl (mostly the OpenGL 375Due to the sad state that OpenGL support is in in Perl (mostly the OpenGL
279module, which has little to no documentation and has little to no support 376module, which has little to no documentation and has little to no support
280for glx), this module, as a special extension, treats context creation 377for glX), this module, as a special extension, treats context creation
281properties C<OpenCL::GLX_DISPLAY_KHR> and C<OpenCL::GL_CONTEXT_KHR> 378properties C<OpenCL::GLX_DISPLAY_KHR> and C<OpenCL::GL_CONTEXT_KHR>
282specially: If either or both of these are C<undef>, then the OpenCL 379specially: If either or both of these are C<undef>, then the OpenCL
283module tries to dynamically resolve C<glxGetCurrentDisplay> and 380module tries to dynamically resolve C<glXGetCurrentDisplay> and
284C<glxGetCurrentContext>, call these functions and use their return values 381C<glXGetCurrentContext>, call these functions and use their return values
285instead. 382instead.
286 383
287For this to work, the OpenGL library must be loaded, a GLX context must 384For this to work, the OpenGL library must be loaded, a GLX context must
288have been created and be made current, and C<dlsym> must be available and 385have been created and be made current, and C<dlsym> must be available and
289capable of finding the function via C<RTLD_DEFAULT>. 386capable of finding the function via C<RTLD_DEFAULT>.
653 750
654=item @device_partition_property_exts = $device->affinity_domains_ext 751=item @device_partition_property_exts = $device->affinity_domains_ext
655 752
656Calls C<clGetDeviceInfo> with C<CL_DEVICE_AFFINITY_DOMAINS_EXT> and returns the result. 753Calls C<clGetDeviceInfo> with C<CL_DEVICE_AFFINITY_DOMAINS_EXT> and returns the result.
657 754
658=item $uint = $device->reference_count_ext 755=item $uint = $device->reference_count_ext
659 756
660Calls C<clGetDeviceInfo> with C<CL_DEVICE_REFERENCE_COUNT_EXT > and returns the result. 757Calls C<clGetDeviceInfo> with C<CL_DEVICE_REFERENCE_COUNT_EXT> and returns the result.
661 758
662=item @device_partition_property_exts = $device->partition_style_ext 759=item @device_partition_property_exts = $device->partition_style_ext
663 760
664Calls C<clGetDeviceInfo> with C<CL_DEVICE_PARTITION_STYLE_EXT> and returns the result. 761Calls C<clGetDeviceInfo> with C<CL_DEVICE_PARTITION_STYLE_EXT> and returns the result.
665 762
674=item $queue = $ctx->queue ($device, $properties) 771=item $queue = $ctx->queue ($device, $properties)
675 772
676Create a new OpenCL::Queue object from the context and the given device. 773Create a new OpenCL::Queue object from the context and the given device.
677 774
678L<http://www.khronos.org/registry/cl/sdk/1.1/docs/man/xhtml/clCreateCommandQueue.html> 775L<http://www.khronos.org/registry/cl/sdk/1.1/docs/man/xhtml/clCreateCommandQueue.html>
776
777Example: create an out-of-order queue.
778
779 $queue = $ctx->queue ($device, OpenCL::QUEUE_OUT_OF_ORDER_EXEC_MODE_ENABLE);
679 780
680=item $ev = $ctx->user_event 781=item $ev = $ctx->user_event
681 782
682Creates a new OpenCL::UserEvent object. 783Creates a new OpenCL::UserEvent object.
683 784
693=item $buf = $ctx->buffer_sv ($flags, $data) 794=item $buf = $ctx->buffer_sv ($flags, $data)
694 795
695Creates a new OpenCL::Buffer (actually OpenCL::BufferObj) object and 796Creates a new OpenCL::Buffer (actually OpenCL::BufferObj) object and
696initialise it with the given data values. 797initialise it with the given data values.
697 798
799=item $img = $ctx->image ($flags, $channel_order, $channel_type, $type, $width, $height, $depth, $array_size = 0, $row_pitch = 0, $slice_pitch = 0, $num_mip_level = 0, $num_samples = 0, $data = undef)
800
801Creates a new OpenCL::Image object and optionally initialises it with
802the given data values.
803
804L<http://www.khronos.org/registry/cl/sdk/1.2/docs/man/xhtml/clCreateImage.html>
805
698=item $img = $ctx->image2d ($flags, $channel_order, $channel_type, $width, $height, $row_pitch = 0, $data = undef) 806=item $img = $ctx->image2d ($flags, $channel_order, $channel_type, $width, $height, $row_pitch = 0, $data = undef)
699 807
700Creates a new OpenCL::Image2D object and optionally initialises it with 808Creates a new OpenCL::Image2D object and optionally initialises it with
701the given data values. 809the given data values.
702 810
714Creates a new OpenCL::Buffer (actually OpenCL::BufferObj) object that refers to the given 822Creates a new OpenCL::Buffer (actually OpenCL::BufferObj) object that refers to the given
715OpenGL buffer object. 823OpenGL buffer object.
716 824
717http://www.khronos.org/registry/cl/sdk/1.1/docs/man/xhtml/clCreateFromGLBuffer.html 825http://www.khronos.org/registry/cl/sdk/1.1/docs/man/xhtml/clCreateFromGLBuffer.html
718 826
827=item $img = $ctx->gl_texture ($flags, $target, $miplevel, $texture)
828
829Creates a new OpenCL::Image object that refers to the given OpenGL
830texture object or buffer.
831
832http://www.khronos.org/registry/cl/sdk/1.2/docs/man/xhtml/clCreateFromGLTexture.html
833
719=item $ctx->gl_texture2d ($flags, $target, $miplevel, $texture) 834=item $img = $ctx->gl_texture2d ($flags, $target, $miplevel, $texture)
720 835
721Creates a new OpenCL::Image2D object that refers to the given OpenGL 836Creates a new OpenCL::Image2D object that refers to the given OpenGL
7222D texture object. 8372D texture object.
723 838
724http://www.khronos.org/registry/cl/sdk/1.1/docs/man/xhtml/clCreateFromGLTexture2D.html 839http://www.khronos.org/registry/cl/sdk/1.1/docs/man/xhtml/clCreateFromGLTexture2D.html
725 840
726=item $ctx->gl_texture3d ($flags, $target, $miplevel, $texture) 841=item $img = $ctx->gl_texture3d ($flags, $target, $miplevel, $texture)
727 842
728Creates a new OpenCL::Image3D object that refers to the given OpenGL 843Creates a new OpenCL::Image3D object that refers to the given OpenGL
7293D texture object. 8443D texture object.
730 845
731http://www.khronos.org/registry/cl/sdk/1.1/docs/man/xhtml/clCreateFromGLTexture3D.html 846http://www.khronos.org/registry/cl/sdk/1.1/docs/man/xhtml/clCreateFromGLTexture3D.html
794for completion, unless the method is called in void context, in which case 909for completion, unless the method is called in void context, in which case
795no event object is created. 910no event object is created.
796 911
797They also allow you to specify any number of other event objects that this 912They also allow you to specify any number of other event objects that this
798request has to wait for before it starts executing, by simply passing the 913request has to wait for before it starts executing, by simply passing the
799event objects as extra parameters to the enqueue methods. 914event objects as extra parameters to the enqueue methods. To simplify
915program design, this module ignores any C<undef> values in the list of
916events. This makes it possible to code operations such as this, without
917having to put a valid event object into C<$event> first:
918
919 $event = $queue->enqueue_xxx (..., $event);
800 920
801Queues execute in-order by default, without any parallelism, so in most 921Queues execute in-order by default, without any parallelism, so in most
802cases (i.e. you use only one queue) it's not necessary to wait for or 922cases (i.e. you use only one queue) it's not necessary to wait for or
803create event objects. 923create event objects, although an out-of-order queue is often a bit
924faster.
804 925
805=over 4 926=over 4
806 927
807=item $ev = $queue->enqueue_read_buffer ($buffer, $blocking, $offset, $len, $data, $wait_events...) 928=item $ev = $queue->enqueue_read_buffer ($buffer, $blocking, $offset, $len, $data, $wait_events...)
808 929
874reference to an array of local work sizes, with the same number of 995reference to an array of local work sizes, with the same number of
875elements as @$global_work_size. 996elements as @$global_work_size.
876 997
877L<http://www.khronos.org/registry/cl/sdk/1.1/docs/man/xhtml/clEnqueueNDRangeKernel.html> 998L<http://www.khronos.org/registry/cl/sdk/1.1/docs/man/xhtml/clEnqueueNDRangeKernel.html>
878 999
879=item $ev = $queue->enqueue_marker ($wait_events...)
880
881L<http://www.khronos.org/registry/cl/sdk/1.1/docs/man/xhtml/clEnqueueMarker.html>
882
883=item $ev = $queue->enqueue_acquire_gl_objects ([object, ...], $wait_events...) 1000=item $ev = $queue->enqueue_acquire_gl_objects ([object, ...], $wait_events...)
884 1001
885Enqueues a list (an array-ref of OpenCL::Memory objects) to be acquired 1002Enqueues a list (an array-ref of OpenCL::Memory objects) to be acquired
886for subsequent OpenCL usage. 1003for subsequent OpenCL usage.
887 1004
896 1013
897=item $ev = $queue->enqueue_wait_for_events ($wait_events...) 1014=item $ev = $queue->enqueue_wait_for_events ($wait_events...)
898 1015
899L<http://www.khronos.org/registry/cl/sdk/1.1/docs/man/xhtml/clEnqueueWaitForEvents.html> 1016L<http://www.khronos.org/registry/cl/sdk/1.1/docs/man/xhtml/clEnqueueWaitForEvents.html>
900 1017
901=item $queue->enqueue_barrier 1018=item $ev = $queue->enqueue_marker ($wait_events...)
902 1019
1020L<http://www.khronos.org/registry/cl/sdk/1.2/docs/man/xhtml/clEnqueueMarkerWithWaitList.html>
1021
1022=item $ev = $queue->enqueue_barrier ($wait_events...)
1023
903L<http://www.khronos.org/registry/cl/sdk/1.1/docs/man/xhtml/clEnqueueBarrier.html> 1024L<http://www.khronos.org/registry/cl/sdk/1.2/docs/man/xhtml/clEnqueueBarrierWithWaitList.html>
904 1025
905=item $queue->flush 1026=item $queue->flush
906 1027
907L<http://www.khronos.org/registry/cl/sdk/1.1/docs/man/xhtml/clFlush.html> 1028L<http://www.khronos.org/registry/cl/sdk/1.1/docs/man/xhtml/clFlush.html>
908 1029
1023 1144
1024=back 1145=back
1025 1146
1026=head2 THE OpenCL::Image CLASS 1147=head2 THE OpenCL::Image CLASS
1027 1148
1028This is the superclass of all image objects - OpenCL::Image2D and OpenCL::Image3D. 1149This is the superclass of all image objects - OpenCL::Image1D,
1150OpenCL::Image1DArray, OpenCL::Image1DBuffer, OpenCL::Image2D,
1151OpenCL::Image2DArray and OpenCL::Image3D.
1029 1152
1030=over 4 1153=over 4
1031 1154
1032=item $packed_value = $ev->image_info ($name) 1155=item $packed_value = $ev->image_info ($name)
1033 1156
1068 1191
1069=for gengetinfo begin gl_texture 1192=for gengetinfo begin gl_texture
1070 1193
1071=item $GLenum = $gl_texture->target 1194=item $GLenum = $gl_texture->target
1072 1195
1073Calls C<clGetGlTextureInfo> with C<CL_GL_TEXTURE_TARGET> and returns the result. 1196Calls C<clGetGLTextureInfo> with C<CL_GL_TEXTURE_TARGET> and returns the result.
1074 1197
1075=item $GLint = $gl_texture->gl_mipmap_level 1198=item $GLint = $gl_texture->gl_mipmap_level
1076 1199
1077Calls C<clGetGlTextureInfo> with C<CL_GL_MIPMAP_LEVEL> and returns the result. 1200Calls C<clGetGLTextureInfo> with C<CL_GL_MIPMAP_LEVEL> and returns the result.
1078 1201
1079=for gengetinfo end gl_texture 1202=for gengetinfo end gl_texture
1080 1203
1081=back 1204=back
1082 1205
1274 1397
1275This is a family of methods to set the kernel argument with the number C<$index> to the given C<$value>. 1398This is a family of methods to set the kernel argument with the number C<$index> to the given C<$value>.
1276 1399
1277TYPE is one of C<char>, C<uchar>, C<short>, C<ushort>, C<int>, C<uint>, 1400TYPE is one of C<char>, C<uchar>, C<short>, C<ushort>, C<int>, C<uint>,
1278C<long>, C<ulong>, C<half>, C<float>, C<double>, C<memory>, C<buffer>, 1401C<long>, C<ulong>, C<half>, C<float>, C<double>, C<memory>, C<buffer>,
1279C<image2d>, C<image3d>, C<sampler> or C<event>. 1402C<image2d>, C<image3d>, C<sampler>, C<local> or C<event>.
1280 1403
1281Chars and integers (including the half type) are specified as integers, 1404Chars and integers (including the half type) are specified as integers,
1282float and double as floating point values, memory/buffer/image2d/image3d 1405float and double as floating point values, memory/buffer/image2d/image3d
1283must be an object of that type or C<undef>, and sampler and event must be 1406must be an object of that type or C<undef>, local-memory arguments are
1284objects of that type. 1407set by specifying the size, and sampler and event must be objects of that
1408type.
1285 1409
1286L<http://www.khronos.org/registry/cl/sdk/1.1/docs/man/xhtml/clSetKernelArg.html> 1410L<http://www.khronos.org/registry/cl/sdk/1.1/docs/man/xhtml/clSetKernelArg.html>
1287 1411
1288=back 1412=back
1289 1413
1378package OpenCL; 1502package OpenCL;
1379 1503
1380use common::sense; 1504use common::sense;
1381 1505
1382BEGIN { 1506BEGIN {
1383 our $VERSION = '0.92'; 1507 our $VERSION = '0.96';
1384 1508
1385 require XSLoader; 1509 require XSLoader;
1386 XSLoader::load (__PACKAGE__, $VERSION); 1510 XSLoader::load (__PACKAGE__, $VERSION);
1387 1511
1388 @OpenCL::Buffer::ISA = 1512 @OpenCL::Buffer::ISA =
1389 @OpenCL::Image::ISA = OpenCL::Memory::; 1513 @OpenCL::Image::ISA = OpenCL::Memory::;
1390 1514
1391 @OpenCL::BufferObj::ISA = OpenCL::Buffer::; 1515 @OpenCL::BufferObj::ISA = OpenCL::Buffer::;
1392 1516
1393 @OpenCL::Image2D::ISA = 1517 @OpenCL::Image2D::ISA =
1518 @OpenCL::Image3D::ISA =
1519 @OpenCL::Image2DArray::ISA =
1520 @OpenCL::Image1D::ISA =
1521 @OpenCL::Image1DArray::ISA =
1394 @OpenCL::Image3D::ISA = OpenCL::Image::; 1522 @OpenCL::Image1DBuffer::ISA = OpenCL::Image::;
1395 1523
1396 @OpenCL::UserEvent::ISA = OpenCL::Event::; 1524 @OpenCL::UserEvent::ISA = OpenCL::Event::;
1397} 1525}
1398 1526
13991; 15271;
1400 1528
1401=head1 AUTHOR 1529=head1 AUTHOR

Diff Legend

Removed lines
+ Added lines
< Changed lines
> Changed lines