… | |
… | |
79 | our $VERSION = '2.0'; |
79 | our $VERSION = '2.0'; |
80 | |
80 | |
81 | our @EXPORT = qw(aio_sendfile aio_read aio_write aio_open aio_close aio_stat |
81 | our @EXPORT = qw(aio_sendfile aio_read aio_write aio_open aio_close aio_stat |
82 | aio_lstat aio_unlink aio_rmdir aio_readdir aio_scandir aio_symlink |
82 | aio_lstat aio_unlink aio_rmdir aio_readdir aio_scandir aio_symlink |
83 | aio_fsync aio_fdatasync aio_readahead aio_rename aio_link aio_move |
83 | aio_fsync aio_fdatasync aio_readahead aio_rename aio_link aio_move |
84 | aio_group); |
84 | aio_group aio_nop); |
85 | our @EXPORT_OK = qw(poll_fileno poll_cb min_parallel max_parallel max_outstanding nreqs); |
85 | our @EXPORT_OK = qw(poll_fileno poll_cb min_parallel max_parallel max_outstanding nreqs); |
86 | |
86 | |
87 | @IO::AIO::GRP::ISA = 'IO::AIO::REQ'; |
87 | @IO::AIO::GRP::ISA = 'IO::AIO::REQ'; |
88 | |
88 | |
89 | require XSLoader; |
89 | require XSLoader; |
… | |
… | |
352 | Scans a directory (similar to C<aio_readdir>) but additionally tries to |
352 | Scans a directory (similar to C<aio_readdir>) but additionally tries to |
353 | separate the entries of directory C<$path> into two sets of names, ones |
353 | separate the entries of directory C<$path> into two sets of names, ones |
354 | you can recurse into (directories or links to them), and ones you cannot |
354 | you can recurse into (directories or links to them), and ones you cannot |
355 | recurse into (everything else). |
355 | recurse into (everything else). |
356 | |
356 | |
357 | C<aio_scandir> is a composite request that consists of many sub |
357 | C<aio_scandir> is a composite request that creates many sub requests. |
358 | requests. C<$maxreq> specifies the maximum number of outstanding aio |
358 | C<$maxreq> specifies the maximum number of outstanding aio requests that |
359 | requests that this function generates. If it is C<< <= 0 >>, then a |
359 | this function generates. If it is C<< <= 0 >>, then a suitable default |
360 | suitable default will be chosen (currently 8). |
360 | will be chosen (currently 6). |
361 | |
361 | |
362 | On error, the callback is called without arguments, otherwise it receives |
362 | On error, the callback is called without arguments, otherwise it receives |
363 | two array-refs with path-relative entry names. |
363 | two array-refs with path-relative entry names. |
364 | |
364 | |
365 | Example: |
365 | Example: |
… | |
… | |
404 | sub aio_scandir($$$) { |
404 | sub aio_scandir($$$) { |
405 | my ($path, $maxreq, $cb) = @_; |
405 | my ($path, $maxreq, $cb) = @_; |
406 | |
406 | |
407 | my $grp = aio_group $cb; |
407 | my $grp = aio_group $cb; |
408 | |
408 | |
409 | $maxreq = 8 if $maxreq <= 0; |
409 | $maxreq = 6 if $maxreq <= 0; |
410 | |
410 | |
411 | # stat once |
411 | # stat once |
412 | add $grp aio_stat $path, sub { |
412 | add $grp aio_stat $path, sub { |
413 | return $grp->result () if $_[0]; |
413 | return $grp->result () if $_[0]; |
414 | my $now = time; |
414 | my $now = time; |
… | |
… | |
445 | my (@dirs, @nondirs); |
445 | my (@dirs, @nondirs); |
446 | |
446 | |
447 | my ($statcb, $schedcb); |
447 | my ($statcb, $schedcb); |
448 | my $nreq = 0; |
448 | my $nreq = 0; |
449 | |
449 | |
|
|
450 | my $statgrp = add $grp aio_group; |
|
|
451 | |
450 | $schedcb = sub { |
452 | $schedcb = sub { |
451 | if (@$entries) { |
453 | if (@$entries) { |
452 | if ($nreq < $maxreq) { |
454 | if ($nreq < $maxreq) { |
453 | my $ent = pop @$entries; |
455 | my $ent = pop @$entries; |
454 | $nreq++; |
456 | $nreq++; |
455 | add $grp aio_stat "$path/$ent/.", sub { $statcb->($_[0], $ent) }; |
457 | add $statgrp aio_stat "$path/$ent/.", sub { $statcb->($_[0], $ent) }; |
456 | } |
458 | } |
457 | } elsif (!$nreq) { |
459 | } elsif (!$nreq) { |
458 | # finished |
460 | # finished |
|
|
461 | $statgrp->cancel; |
459 | undef $statcb; |
462 | undef $statcb; |
460 | undef $schedcb; |
463 | undef $schedcb; |
461 | $grp->result (\@dirs, \@nondirs) if $cb; |
464 | $grp->result (\@dirs, \@nondirs); |
462 | undef $cb; |
|
|
463 | } |
465 | } |
464 | }; |
466 | }; |
465 | $statcb = sub { |
467 | $statcb = sub { |
466 | my ($status, $entry) = @_; |
468 | my ($status, $entry) = @_; |
467 | |
469 | |
… | |
… | |
531 | add $grp |
533 | add $grp |
532 | (aio_stat ...), |
534 | (aio_stat ...), |
533 | (aio_stat ...), |
535 | (aio_stat ...), |
534 | ...; |
536 | ...; |
535 | |
537 | |
|
|
538 | =item aio_nop $callback->() |
|
|
539 | |
|
|
540 | This is a special request - it does nothing in itself and is only used for |
|
|
541 | side effects, such as when you want to add a dummy request to a group so |
|
|
542 | that finishing the requests in the group depends on executing the given |
|
|
543 | code. |
|
|
544 | |
536 | =item IO::AIO::aio_sleep $fractional_seconds, $callback->() *NOT EXPORTED* |
545 | =item IO::AIO::aio_sleep $fractional_seconds, $callback->() *NOT EXPORTED* |
537 | |
546 | |
538 | Mainly used for debugging and benchmarking, this aio request puts one of |
547 | Mainly used for debugging and benchmarking, this aio request puts one of |
539 | the request workers to sleep for the given time. |
548 | the request workers to sleep for the given time. |
540 | |
549 | |
… | |
… | |
601 | }; |
610 | }; |
602 | |
611 | |
603 | This makes it very easy to create composite requests (see the source of |
612 | This makes it very easy to create composite requests (see the source of |
604 | C<aio_move> for an application) that work and feel like simple requests. |
613 | C<aio_move> for an application) that work and feel like simple requests. |
605 | |
614 | |
|
|
615 | =over 4 |
|
|
616 | |
606 | The IO::AIO::GRP objects will be cleaned up during calls to |
617 | =item * The IO::AIO::GRP objects will be cleaned up during calls to |
607 | C<IO::AIO::poll_cb>, just like any other request. |
618 | C<IO::AIO::poll_cb>, just like any other request. |
608 | |
619 | |
609 | They can be canceled like any other request. Canceling will cancel not |
620 | =item * They can be canceled like any other request. Canceling will cancel not |
610 | only the request itself, but also all requests it contains. |
621 | only the request itself, but also all requests it contains. |
611 | |
622 | |
612 | They can also be added to other IO::AIO::GRP objects. |
623 | =item * They can also be added to other IO::AIO::GRP objects. |
|
|
624 | |
|
|
625 | =item * You must not add requests to a group from within the group callback (or |
|
|
626 | any later time). |
|
|
627 | |
|
|
628 | =item * This does not harmonise well with C<max_outstanding>, so you should |
|
|
629 | not combine C<aio_group> with it. Groups and feeders are recommended for |
|
|
630 | this kind of concurrency-limiting. |
|
|
631 | |
|
|
632 | =back |
613 | |
633 | |
614 | Their lifetime, simplified, looks like this: when they are empty, they |
634 | Their lifetime, simplified, looks like this: when they are empty, they |
615 | will finish very quickly. If they contain only requests that are in the |
635 | will finish very quickly. If they contain only requests that are in the |
616 | C<done> state, they will also finish. Otherwise they will continue to |
636 | C<done> state, they will also finish. Otherwise they will continue to |
617 | exist. |
637 | exist. |
… | |
… | |
636 | =item $grp->result (...) |
656 | =item $grp->result (...) |
637 | |
657 | |
638 | Set the result value(s) that will be passed to the group callback when all |
658 | Set the result value(s) that will be passed to the group callback when all |
639 | subrequests have finished. By default, no argument will be passed. |
659 | subrequests have finished. By default, no argument will be passed. |
640 | |
660 | |
|
|
661 | =item $grp->set_feeder ($callback->($grp)) |
|
|
662 | |
|
|
663 | [VERY EXPERIMENTAL] |
|
|
664 | |
|
|
665 | Sets a feeder/generator on this group: every group can have an attached |
|
|
666 | generator that generates requests if idle. The idea behind this is that, |
|
|
667 | although you could just queue as many requests as you want in a group, |
|
|
668 | this might starve other requests for a potentially long time. For |
|
|
669 | example, C<aio_scandir> might generate hundreds of thousands of C<aio_stat> |
|
|
670 | requests, delaying any later requests for a long time. |
|
|
671 | |
|
|
672 | To avoid this, and allow incremental generation of requests, you can |
|
|
673 | instead create a group and set a feeder on it that generates those requests. The |
|
|
674 | feeder will be called whenever there are few enough (see C<feeder_limit>, |
|
|
675 | below) requests active in the group itself and is expected to queue more |
|
|
676 | requests. |
|
|
677 | |
|
|
678 | The feeder can queue as many requests as it likes (i.e. C<add> does not |
|
|
679 | impose any limits). |
|
|
680 | |
|
|
681 | If the feeder does not queue more requests when called, it will be |
|
|
682 | automatically removed from the group. |
|
|
683 | |
|
|
684 | If the feeder limit is C<0>, it will be set to C<2> automatically. |
|
|
685 | |
|
|
686 | Example: |
|
|
687 | |
|
|
688 | # stat all files in @files, but only ever use four aio requests concurrently: |
|
|
689 | |
|
|
690 | my $grp = aio_group sub { print "finished\n" }; |
|
|
691 | $grp->feeder_limit (4); |
|
|
692 | $grp->set_feeder (sub { |
|
|
693 | my $file = pop @files |
|
|
694 | or return; |
|
|
695 | |
|
|
696 | add $grp aio_stat $file, sub { ... }; |
|
|
697 | }); |
|
|
698 | |
|
|
699 | =item $grp->feeder_limit ($num) |
|
|
700 | |
|
|
701 | Sets the feeder limit for the group: The feeder will be called whenever |
|
|
702 | the group contains fewer than this many requests. |
|
|
703 | |
|
|
704 | Setting the limit to C<0> will pause the feeding process. |
|
|
705 | |
641 | =back |
706 | =back |
642 | |
707 | |
643 | =head2 SUPPORT FUNCTIONS |
708 | =head2 SUPPORT FUNCTIONS |
644 | |
709 | |
645 | =over 4 |
710 | =over 4 |
… | |
… | |
702 | IO::AIO::poll_wait, IO::AIO::poll_cb |
767 | IO::AIO::poll_wait, IO::AIO::poll_cb |
703 | if IO::AIO::nreqs; |
768 | if IO::AIO::nreqs; |
704 | |
769 | |
705 | =item IO::AIO::min_parallel $nthreads |
770 | =item IO::AIO::min_parallel $nthreads |
706 | |
771 | |
707 | Set the minimum number of AIO threads to C<$nthreads>. The current default |
772 | Set the minimum number of AIO threads to C<$nthreads>. The current |
708 | is C<4>, which means four asynchronous operations can be done at one time |
773 | default is C<8>, which means eight asynchronous operations can execute |
709 | (the number of outstanding operations, however, is unlimited). |
774 | concurrently at any one time (the number of outstanding requests, |
|
|
775 | however, is unlimited). |
710 | |
776 | |
711 | IO::AIO starts threads only on demand, when an AIO request is queued and |
777 | IO::AIO starts threads only on demand, when an AIO request is queued and |
712 | no free thread exists. |
778 | no free thread exists. |
713 | |
779 | |
714 | It is recommended to keep the number of threads low, as some Linux |
780 | It is recommended to keep the number of threads relatively low, as some |
715 | kernel versions will scale negatively with the number of threads (higher |
781 | Linux kernel versions will scale negatively with the number of threads |
716 | parallelity => MUCH higher latency). With current Linux 2.6 versions, 4-32 |
782 | (higher parallelity => MUCH higher latency). With current Linux 2.6 |
717 | threads should be fine. |
783 | versions, 4-32 threads should be fine. |
718 | |
784 | |
719 | Under most circumstances you don't need to call this function, as the |
785 | Under most circumstances you don't need to call this function, as the |
720 | module selects a default that is suitable for low to moderate load. |
786 | module selects a default that is suitable for low to moderate load. |
721 | |
787 | |
722 | =item IO::AIO::max_parallel $nthreads |
788 | =item IO::AIO::max_parallel $nthreads |
… | |
… | |
733 | |
799 | |
734 | Under normal circumstances you don't need to call this function. |
800 | Under normal circumstances you don't need to call this function. |
735 | |
801 | |
736 | =item $oldnreqs = IO::AIO::max_outstanding $nreqs |
802 | =item $oldnreqs = IO::AIO::max_outstanding $nreqs |
737 | |
803 | |
|
|
804 | [DEPRECATED] |
|
|
805 | |
738 | Sets the maximum number of outstanding requests to C<$nreqs>. If you |
806 | Sets the maximum number of outstanding requests to C<$nreqs>. If you |
739 | try to queue up more than this number of requests, the caller will block until |
807 | try to queue up more than this number of requests, the caller will block until |
740 | some requests have been handled. |
808 | some requests have been handled. |
741 | |
809 | |
742 | The default is very large, so normally there is no practical limit. If you |
810 | The default is very large, so normally there is no practical limit. If you |
743 | queue up many requests in a loop it often improves speed if you set |
811 | queue up many requests in a loop it often improves speed if you set |
744 | this to a relatively low number, such as C<100>. |
812 | this to a relatively low number, such as C<100>. |
|
|
813 | |
|
|
814 | This function does not work well together with C<aio_group>'s, and their |
|
|
815 | feeder interface is better suited to limiting concurrency, so do not use |
|
|
816 | this function. |
745 | |
817 | |
746 | Under normal circumstances you don't need to call this function. |
818 | Under normal circumstances you don't need to call this function. |
747 | |
819 | |
748 | =back |
820 | =back |
749 | |
821 | |
… | |
… | |
763 | or return undef; |
835 | or return undef; |
764 | |
836 | |
765 | *$sym |
837 | *$sym |
766 | } |
838 | } |
767 | |
839 | |
768 | min_parallel 4; |
840 | min_parallel 8; |
769 | |
841 | |
770 | END { |
842 | END { |
771 | max_parallel 0; |
843 | max_parallel 0; |
772 | } |
844 | } |
773 | |
845 | |
… | |
… | |
787 | |
859 | |
788 | In short: the parent will, after a short pause, continue as if fork had |
860 | In short: the parent will, after a short pause, continue as if fork had |
789 | not been called, while the child will act as if IO::AIO has not been used |
861 | not been called, while the child will act as if IO::AIO has not been used |
790 | yet. |
862 | yet. |
791 | |
863 | |
|
|
864 | =head2 MEMORY USAGE |
|
|
865 | |
|
|
866 | Each aio request uses - depending on your architecture - around 128 bytes |
|
|
867 | of memory. In addition, stat requests need a stat buffer (possibly a few |
|
|
868 | hundred bytes). Perl scalars and other data passed into aio requests will |
|
|
869 | also be locked. |
|
|
870 | |
|
|
871 | This is not awfully much, so queuing lots of requests is not usually a |
|
|
872 | problem. |
|
|
873 | |
|
|
874 | Each thread needs a stack area which is usually around 16k, sometimes much |
|
|
875 | larger, depending on the OS. |
|
|
876 | |
792 | =head1 SEE ALSO |
877 | =head1 SEE ALSO |
793 | |
878 | |
794 | L<Coro>, L<Linux::AIO> (obsolete). |
879 | L<Coro>, L<Linux::AIO> (obsolete). |
795 | |
880 | |
796 | =head1 AUTHOR |
881 | =head1 AUTHOR |