ViewVC Help
View File | Revision Log | Show Annotations | Download File
/cvs/IO-AIO/AIO.pm
(Generate patch)

Comparing IO-AIO/AIO.pm (file contents):
Revision 1.52 by root, Sat Oct 21 23:06:04 2006 UTC vs.
Revision 1.61 by root, Sun Oct 22 13:52:11 2006 UTC

15 15
16 aio_read $fh, 30000, 1024, $buffer, 0, sub { 16 aio_read $fh, 30000, 1024, $buffer, 0, sub {
17 $_[0] > 0 or die "read error: $!"; 17 $_[0] > 0 or die "read error: $!";
18 }; 18 };
19 19
20 use IO::AIO 2; # version has aio objects 20 # version 2+ has request and group objects
21 use IO::AIO 2;
21 22
22 my $req = aio_unlink "/tmp/file", sub { }; 23 my $req = aio_unlink "/tmp/file", sub { };
23 $req->cancel; # cancel request if still in queue 24 $req->cancel; # cancel request if still in queue
24 25
25 # AnyEvent 26 my $grp = aio_group sub { print "all stats done\n" };
27 add $grp aio_stat "..." for ...;
28
29 # AnyEvent integration
26 open my $fh, "<&=" . IO::AIO::poll_fileno or die "$!"; 30 open my $fh, "<&=" . IO::AIO::poll_fileno or die "$!";
27 my $w = AnyEvent->io (fh => $fh, poll => 'r', cb => sub { IO::AIO::poll_cb }); 31 my $w = AnyEvent->io (fh => $fh, poll => 'r', cb => sub { IO::AIO::poll_cb });
28 32
29 # Event 33 # Event integration
30 Event->io (fd => IO::AIO::poll_fileno, 34 Event->io (fd => IO::AIO::poll_fileno,
31 poll => 'r', 35 poll => 'r',
32 cb => \&IO::AIO::poll_cb); 36 cb => \&IO::AIO::poll_cb);
33 37
34 # Glib/Gtk2 38 # Glib/Gtk2 integration
35 add_watch Glib::IO IO::AIO::poll_fileno, 39 add_watch Glib::IO IO::AIO::poll_fileno,
36 in => sub { IO::AIO::poll_cb; 1 }; 40 in => sub { IO::AIO::poll_cb; 1 };
37 41
38 # Tk 42 # Tk integration
39 Tk::Event::IO->fileevent (IO::AIO::poll_fileno, "", 43 Tk::Event::IO->fileevent (IO::AIO::poll_fileno, "",
40 readable => \&IO::AIO::poll_cb); 44 readable => \&IO::AIO::poll_cb);
41 45
42 # Danga::Socket 46 # Danga::Socket integration
43 Danga::Socket->AddOtherFds (IO::AIO::poll_fileno => 47 Danga::Socket->AddOtherFds (IO::AIO::poll_fileno =>
44 \&IO::AIO::poll_cb); 48 \&IO::AIO::poll_cb);
45
46 49
47=head1 DESCRIPTION 50=head1 DESCRIPTION
48 51
49This module implements asynchronous I/O using whatever means your 52This module implements asynchronous I/O using whatever means your
50operating system supports. 53operating system supports.
71use strict 'vars'; 74use strict 'vars';
72 75
73use base 'Exporter'; 76use base 'Exporter';
74 77
75BEGIN { 78BEGIN {
76 our $VERSION = '1.8'; 79 our $VERSION = '2.0';
77 80
78 our @EXPORT = qw(aio_sendfile aio_read aio_write aio_open aio_close aio_stat 81 our @EXPORT = qw(aio_sendfile aio_read aio_write aio_open aio_close aio_stat
79 aio_lstat aio_unlink aio_rmdir aio_readdir aio_scandir aio_symlink 82 aio_lstat aio_unlink aio_rmdir aio_readdir aio_scandir aio_symlink
80 aio_fsync aio_fdatasync aio_readahead aio_rename aio_link aio_move); 83 aio_fsync aio_fdatasync aio_readahead aio_rename aio_link aio_move
84 aio_group);
81 our @EXPORT_OK = qw(poll_fileno poll_cb min_parallel max_parallel max_outstanding nreqs); 85 our @EXPORT_OK = qw(poll_fileno poll_cb min_parallel max_parallel max_outstanding nreqs);
86
87 @IO::AIO::GRP::ISA = 'IO::AIO::REQ';
82 88
83 require XSLoader; 89 require XSLoader;
84 XSLoader::load ("IO::AIO", $VERSION); 90 XSLoader::load ("IO::AIO", $VERSION);
85} 91}
86 92
97syscall has been executed asynchronously. 103syscall has been executed asynchronously.
98 104
99All functions expecting a filehandle keep a copy of the filehandle 105All functions expecting a filehandle keep a copy of the filehandle
100internally until the request has finished. 106internally until the request has finished.
101 107
102All non-composite requests (requests that are not broken down into
103multiple requests) return objects of type L<IO::AIO::REQ> that allow 108All requests return objects of type L<IO::AIO::REQ> that allow further
104further manipulation of running requests. 109manipulation of those requests while they are in-flight.
105 110
106The pathnames you pass to these routines I<must> be absolute and 111The pathnames you pass to these routines I<must> be absolute and
107encoded in byte form. The reason for the former is that at the time the 112encoded in byte form. The reason for the former is that at the time the
108request is being executed, the current working directory could have 113request is being executed, the current working directory could have
109changed. Alternatively, you can make sure that you never change the 114changed. Alternatively, you can make sure that you never change the
177 print "read $_[0] bytes: <$buffer>\n"; 182 print "read $_[0] bytes: <$buffer>\n";
178 }; 183 };
179 184
180=item aio_move $srcpath, $dstpath, $callback->($status) 185=item aio_move $srcpath, $dstpath, $callback->($status)
181 186
187[EXPERIMENTAL due to internal aio_group use]
188
182Try to move the I<file> (directories not supported as either source or 189Try to move the I<file> (directories not supported as either source or
183destination) from C<$srcpath> to C<$dstpath> and call the callback with 190destination) from C<$srcpath> to C<$dstpath> and call the callback with
184the C<0> (error) or C<-1> ok. 191the C<0> (error) or C<-1> ok.
185 192
186This is a composite request that tries to rename(2) the file first. If 193This is a composite request that tries to rename(2) the file first. If
196=cut 203=cut
197 204
198sub aio_move($$$) { 205sub aio_move($$$) {
199 my ($src, $dst, $cb) = @_; 206 my ($src, $dst, $cb) = @_;
200 207
208 my $grp = aio_group $cb;
209
201 aio_rename $src, $dst, sub { 210 add $grp aio_rename $src, $dst, sub {
202 if ($_[0] && $! == EXDEV) { 211 if ($_[0] && $! == EXDEV) {
203 aio_open $src, O_RDONLY, 0, sub { 212 add $grp aio_open $src, O_RDONLY, 0, sub {
204 if (my $src_fh = $_[0]) { 213 if (my $src_fh = $_[0]) {
205 my @stat = stat $src_fh; 214 my @stat = stat $src_fh;
206 215
207 aio_open $dst, O_WRONLY, 0200, sub { 216 add $grp aio_open $dst, O_WRONLY, 0200, sub {
208 if (my $dst_fh = $_[0]) { 217 if (my $dst_fh = $_[0]) {
209 aio_sendfile $dst_fh, $src_fh, 0, $stat[7], sub { 218 add $grp aio_sendfile $dst_fh, $src_fh, 0, $stat[7], sub {
210 close $src_fh; 219 close $src_fh;
211 220
212 if ($_[0] == $stat[7]) { 221 if ($_[0] == $stat[7]) {
213 utime $stat[8], $stat[9], $dst; 222 utime $stat[8], $stat[9], $dst;
214 chmod $stat[2] & 07777, $dst_fh; 223 chmod $stat[2] & 07777, $dst_fh;
215 chown $stat[4], $stat[5], $dst_fh; 224 chown $stat[4], $stat[5], $dst_fh;
216 close $dst_fh; 225 close $dst_fh;
217 226
218 aio_unlink $src, sub { 227 add $grp aio_unlink $src, sub {
219 $cb->($_[0]); 228 $grp->result ($_[0]);
220 }; 229 };
221 } else { 230 } else {
222 my $errno = $!; 231 my $errno = $!;
223 aio_unlink $dst, sub { 232 add $grp aio_unlink $dst, sub {
224 $! = $errno; 233 $! = $errno;
225 $cb->(-1); 234 $grp->result (-1);
226 }; 235 };
227 } 236 }
228 }; 237 };
229 } else { 238 } else {
230 $cb->(-1); 239 $grp->result (-1);
231 } 240 }
232 }, 241 },
233 242
234 } else { 243 } else {
235 $cb->(-1); 244 $grp->result (-1);
236 } 245 }
237 }; 246 };
238 } else { 247 } else {
239 $cb->($_[0]); 248 $grp->result ($_[0]);
240 } 249 }
241 }; 250 };
251
252 $grp
242} 253}
243 254
244=item aio_sendfile $out_fh, $in_fh, $in_offset, $length, $callback->($retval) 255=item aio_sendfile $out_fh, $in_fh, $in_offset, $length, $callback->($retval)
245 256
246Tries to copy C<$length> bytes from C<$in_fh> to C<$out_fh>. It starts 257Tries to copy C<$length> bytes from C<$in_fh> to C<$out_fh>. It starts
334The callback a single argument which is either C<undef> or an array-ref 345The callback a single argument which is either C<undef> or an array-ref
335with the filenames. 346with the filenames.
336 347
337=item aio_scandir $path, $maxreq, $callback->($dirs, $nondirs) 348=item aio_scandir $path, $maxreq, $callback->($dirs, $nondirs)
338 349
350[EXPERIMENTAL due to internal aio_group use]
351
339Scans a directory (similar to C<aio_readdir>) but additionally tries to 352Scans a directory (similar to C<aio_readdir>) but additionally tries to
340separate the entries of directory C<$path> into two sets of names, ones 353separate the entries of directory C<$path> into two sets of names, ones
341you can recurse into (directories or links to them), and ones you cannot 354you can recurse into (directories or links to them), and ones you cannot
342recurse into (everything else). 355recurse into (everything else).
343 356
344C<aio_scandir> is a composite request that consists of many sub 357C<aio_scandir> is a composite request that creates of many sub requests_
345requests. C<$maxreq> specifies the maximum number of outstanding aio 358C<$maxreq> specifies the maximum number of outstanding aio requests that
346requests that this function generates. If it is C<< <= 0 >>, then a 359this function generates. If it is C<< <= 0 >>, then a suitable default
347suitable default will be chosen (currently 8). 360will be chosen (currently 6).
348 361
349On error, the callback is called without arguments, otherwise it receives 362On error, the callback is called without arguments, otherwise it receives
350two array-refs with path-relative entry names. 363two array-refs with path-relative entry names.
351 364
352Example: 365Example:
389=cut 402=cut
390 403
391sub aio_scandir($$$) { 404sub aio_scandir($$$) {
392 my ($path, $maxreq, $cb) = @_; 405 my ($path, $maxreq, $cb) = @_;
393 406
407 my $grp = aio_group $cb;
408
394 $maxreq = 8 if $maxreq <= 0; 409 $maxreq = 6 if $maxreq <= 0;
395 410
396 # stat once 411 # stat once
397 aio_stat $path, sub { 412 add $grp aio_stat $path, sub {
398 return $cb->() if $_[0]; 413 return $grp->result () if $_[0];
399 my $now = time; 414 my $now = time;
400 my $hash1 = join ":", (stat _)[0,1,3,7,9]; 415 my $hash1 = join ":", (stat _)[0,1,3,7,9];
401 416
402 # read the directory entries 417 # read the directory entries
403 aio_readdir $path, sub { 418 add $grp aio_readdir $path, sub {
404 my $entries = shift 419 my $entries = shift
405 or return $cb->(); 420 or return $grp->result ();
406 421
407 # stat the dir another time 422 # stat the dir another time
408 aio_stat $path, sub { 423 add $grp aio_stat $path, sub {
409 my $hash2 = join ":", (stat _)[0,1,3,7,9]; 424 my $hash2 = join ":", (stat _)[0,1,3,7,9];
410 425
411 my $ndirs; 426 my $ndirs;
412 427
413 # take the slow route if anything looks fishy 428 # take the slow route if anything looks fishy
415 $ndirs = -1; 430 $ndirs = -1;
416 } else { 431 } else {
417 # if nlink == 2, we are finished 432 # if nlink == 2, we are finished
418 # on non-posix-fs's, we rely on nlink < 2 433 # on non-posix-fs's, we rely on nlink < 2
419 $ndirs = (stat _)[3] - 2 434 $ndirs = (stat _)[3] - 2
420 or return $cb->([], $entries); 435 or return $grp->result ([], $entries);
421 } 436 }
422 437
423 # sort into likely dirs and likely nondirs 438 # sort into likely dirs and likely nondirs
424 # dirs == files without ".", short entries first 439 # dirs == files without ".", short entries first
425 $entries = [map $_->[0], 440 $entries = [map $_->[0],
430 my (@dirs, @nondirs); 445 my (@dirs, @nondirs);
431 446
432 my ($statcb, $schedcb); 447 my ($statcb, $schedcb);
433 my $nreq = 0; 448 my $nreq = 0;
434 449
450 my $statgrp = add $grp aio_group;
451
435 $schedcb = sub { 452 $schedcb = sub {
436 if (@$entries) { 453 if (@$entries) {
437 if ($nreq < $maxreq) { 454 if ($nreq < $maxreq) {
438 my $ent = pop @$entries; 455 my $ent = pop @$entries;
439 $nreq++; 456 $nreq++;
440 aio_stat "$path/$ent/.", sub { $statcb->($_[0], $ent) }; 457 add $statgrp aio_stat "$path/$ent/.", sub { $statcb->($_[0], $ent) };
441 } 458 }
442 } elsif (!$nreq) { 459 } elsif (!$nreq) {
443 # finished 460 # finished
461 $statgrp->cancel;
444 undef $statcb; 462 undef $statcb;
445 undef $schedcb; 463 undef $schedcb;
446 $cb->(\@dirs, \@nondirs) if $cb; 464 $grp->result (\@dirs, \@nondirs);
447 undef $cb;
448 } 465 }
449 }; 466 };
450 $statcb = sub { 467 $statcb = sub {
451 my ($status, $entry) = @_; 468 my ($status, $entry) = @_;
452 469
454 $nreq--; 471 $nreq--;
455 push @nondirs, $entry; 472 push @nondirs, $entry;
456 &$schedcb; 473 &$schedcb;
457 } else { 474 } else {
458 # need to check for real directory 475 # need to check for real directory
459 aio_lstat "$path/$entry", sub { 476 add $grp aio_lstat "$path/$entry", sub {
460 $nreq--; 477 $nreq--;
461 478
462 if (-d _) { 479 if (-d _) {
463 push @dirs, $entry; 480 push @dirs, $entry;
464 481
477 494
478 &$schedcb while @$entries && $nreq < $maxreq; 495 &$schedcb while @$entries && $nreq < $maxreq;
479 }; 496 };
480 }; 497 };
481 }; 498 };
499
500 $grp
482} 501}
483 502
484=item aio_fsync $fh, $callback->($status) 503=item aio_fsync $fh, $callback->($status)
485 504
486Asynchronously call fsync on the given filehandle and call the callback 505Asynchronously call fsync on the given filehandle and call the callback
492callback with the fdatasync result code. 511callback with the fdatasync result code.
493 512
494If this call isn't available because your OS lacks it or it couldn't be 513If this call isn't available because your OS lacks it or it couldn't be
495detected, it will be emulated by calling C<fsync> instead. 514detected, it will be emulated by calling C<fsync> instead.
496 515
516=item aio_group $callback->(...)
517
518[EXPERIMENTAL]
519
520This is a very special aio request: Instead of doing something, it is a
521container for other aio requests, which is useful if you want to bundle
522many requests into a single, composite, request.
523
524Returns an object of class L<IO::AIO::GRP>. See its documentation below
525for more info.
526
527Example:
528
529 my $grp = aio_group sub {
530 print "all stats done\n";
531 };
532
533 add $grp
534 (aio_stat ...),
535 (aio_stat ...),
536 ...;
537
538=item IO::AIO::aio_sleep $fractional_seconds, $callback->() *NOT EXPORTED*
539
540Mainly used for debugging and benchmarking, this aio request puts one of
541the request workers to sleep for the given time.
542
543While it is theoretically handy to have simple I/O scheduling requests
544like sleep and file handle readable/writable, the overhead this creates
545is immense, so do not use this function except to put your application
546under artificial I/O pressure.
547
497=back 548=back
498 549
499=head2 IO::AIO::CB CLASS 550=head2 IO::AIO::REQ CLASS
500 551
501All non-aggregate C<aio_*> functions return an object of this class when 552All non-aggregate C<aio_*> functions return an object of this class when
502called in non-void context. 553called in non-void context.
503 554
504A request always moves through the following five states in its lifetime, 555A request always moves through the following five states in its lifetime,
519untouched. That means that requests that currently execute will not be 570untouched. That means that requests that currently execute will not be
520stopped and resources held by the request will not be freed prematurely. 571stopped and resources held by the request will not be freed prematurely.
521 572
522=back 573=back
523 574
575=head2 IO::AIO::GRP CLASS
576
577This class is a subclass of L<IO::AIO::REQ>, so all its methods apply to
578objects of this class, too.
579
580A IO::AIO::GRP object is a special request that can contain multiple other
581aio requests.
582
583You create one by calling the C<aio_group> constructing function with a
584callback that will be called when all contained requests have entered the
585C<done> state:
586
587 my $grp = aio_group sub {
588 print "all requests are done\n";
589 };
590
591You add requests by calling the C<add> method with one or more
592C<IO::AIO::REQ> objects:
593
594 $grp->add (aio_unlink "...");
595
596 add $grp aio_stat "...", sub {
597 $_[0] or return $grp->result ("error");
598
599 # add another request dynamically, if first succeeded
600 add $grp aio_open "...", sub {
601 $grp->result ("ok");
602 };
603 };
604
605This makes it very easy to create composite requests (see the source of
606C<aio_move> for an application) that work and feel like simple requests.
607
608The IO::AIO::GRP objects will be cleaned up during calls to
609C<IO::AIO::poll_cb>, just like any other request.
610
611They can be canceled like any other request. Canceling will cancel not
612only the request itself, but also all requests it contains.
613
614They can also can also be added to other IO::AIO::GRP objects.
615
616You must not add requests to a group from within the group callback (or
617any later time).
618
619Their lifetime, simplified, looks like this: when they are empty, they
620will finish very quickly. If they contain only requests that are in the
621C<done> state, they will also finish. Otherwise they will continue to
622exist.
623
624That means after creating a group you have some time to add requests. And
625in the callbacks of those requests, you can add further requests to the
626group. And only when all those requests have finished will the the group
627itself finish.
628
629=over 4
630
631=item $grp->add (...)
632
633=item add $grp ...
634
635Add one or more requests to the group. Any type of L<IO::AIO::REQ> can
636be added, including other groups, as long as you do not create circular
637dependencies.
638
639Returns all its arguments.
640
641=item $grp->result (...)
642
643Set the result value(s) that will be passed to the group callback when all
644subrequests have finished. By default, no argument will be passed.
645
646=item $grp->set_feeder ($callback->($grp))
647
648[VERY EXPERIMENTAL]
649
650Sets a feeder/generator on this group: every group can have an attached
651generator that generates requests if idle. The idea behind this is that,
652although you could just queue as many requests as you want in a group,
653this might starve other requests for a potentially long time. For
654example, C<aio_scandir> might generate hundreds of thousands C<aio_stat>
655requests, delaying any later requests for a long time.
656
657To avoid this, and allow incremental generation of requests, you can
658instead a group and set a feeder on it that generates those requests. The
659feeder will be called whenever there are few enough (see C<feeder_limit>,
660below) requests active in the group itself and is expected to queue more
661requests.
662
663The feeder can queue as many requests as it likes (i.e. C<add> does not
664impose any limits).
665
666If the feeder does not queue more requests when called, it will be
667automatically removed from the group.
668
669If the feeder limit is C<0>, it will be set to C<2> automatically.
670
671Example:
672
673 # stat all files in @files, but only ever use four aio requests concurrently:
674
675 my $grp = aio_group sub { print "finished\n" };
676 $grp->feeder_limit (4);
677 $grp->set_feeder (sub {
678 my $file = pop @files
679 or return;
680
681 add $grp aio_stat $file, sub { ... };
682 });
683
684=item $grp->feeder_limit ($num)
685
686Sets the feeder limit for the group: The feeder will be called whenever
687the group contains less than this many requests.
688
689Setting the limit to C<0> will pause the feeding process.
690
691=back
692
524=head2 SUPPORT FUNCTIONS 693=head2 SUPPORT FUNCTIONS
525 694
526=over 4 695=over 4
527 696
528=item $fileno = IO::AIO::poll_fileno 697=item $fileno = IO::AIO::poll_fileno
583 IO::AIO::poll_wait, IO::AIO::poll_cb 752 IO::AIO::poll_wait, IO::AIO::poll_cb
584 if IO::AIO::nreqs; 753 if IO::AIO::nreqs;
585 754
586=item IO::AIO::min_parallel $nthreads 755=item IO::AIO::min_parallel $nthreads
587 756
588Set the minimum number of AIO threads to C<$nthreads>. The current default 757Set the minimum number of AIO threads to C<$nthreads>. The current
589is C<4>, which means four asynchronous operations can be done at one time 758default is C<8>, which means eight asynchronous operations can execute
590(the number of outstanding operations, however, is unlimited). 759concurrently at any one time (the number of outstanding requests,
760however, is unlimited).
591 761
592IO::AIO starts threads only on demand, when an AIO request is queued and 762IO::AIO starts threads only on demand, when an AIO request is queued and
593no free thread exists. 763no free thread exists.
594 764
595It is recommended to keep the number of threads low, as some Linux 765It is recommended to keep the number of threads relatively low, as some
596kernel versions will scale negatively with the number of threads (higher 766Linux kernel versions will scale negatively with the number of threads
597parallelity => MUCH higher latency). With current Linux 2.6 versions, 4-32 767(higher parallelity => MUCH higher latency). With current Linux 2.6
598threads should be fine. 768versions, 4-32 threads should be fine.
599 769
600Under most circumstances you don't need to call this function, as the 770Under most circumstances you don't need to call this function, as the
601module selects a default that is suitable for low to moderate load. 771module selects a default that is suitable for low to moderate load.
602 772
603=item IO::AIO::max_parallel $nthreads 773=item IO::AIO::max_parallel $nthreads
644 or return undef; 814 or return undef;
645 815
646 *$sym 816 *$sym
647} 817}
648 818
649min_parallel 4; 819min_parallel 8;
650 820
651END { 821END {
652 max_parallel 0; 822 max_parallel 0;
653} 823}
654 824
668 838
669In short: the parent will, after a short pause, continue as if fork had 839In short: the parent will, after a short pause, continue as if fork had
670not been called, while the child will act as if IO::AIO has not been used 840not been called, while the child will act as if IO::AIO has not been used
671yet. 841yet.
672 842
843=head2 MEMORY USAGE
844
845Each aio request uses - depending on your architecture - around 128 bytes
846of memory. In addition, stat requests need a stat buffer (possibly a few
847hundred bytes). Perl scalars and other data passed into aio requests will
848also be locked.
849
850This is now awfully much, so queuing lots of requests is not usually a
851problem.
852
853Each thread needs a stack area which is usually around 16k, sometimes much
854larger, depending on the OS.
855
673=head1 SEE ALSO 856=head1 SEE ALSO
674 857
675L<Coro>, L<Linux::AIO> (obsolete). 858L<Coro>, L<Linux::AIO> (obsolete).
676 859
677=head1 AUTHOR 860=head1 AUTHOR

Diff Legend

Removed lines
+ Added lines
< Changed lines
> Changed lines