… | |
… | |
168 | use common::sense; |
168 | use common::sense; |
169 | |
169 | |
170 | use base 'Exporter'; |
170 | use base 'Exporter'; |
171 | |
171 | |
172 | BEGIN { |
172 | BEGIN { |
173 | our $VERSION = '3.72'; |
173 | our $VERSION = '3.93'; |
174 | |
174 | |
175 | our @AIO_REQ = qw(aio_sendfile aio_read aio_write aio_open aio_close |
175 | our @AIO_REQ = qw(aio_sendfile aio_read aio_write aio_open aio_close |
176 | aio_stat aio_lstat aio_unlink aio_rmdir aio_readdir aio_readdirx |
176 | aio_stat aio_lstat aio_unlink aio_rmdir aio_readdir aio_readdirx |
177 | aio_scandir aio_symlink aio_readlink aio_sync aio_fsync |
177 | aio_scandir aio_symlink aio_readlink aio_realpath aio_sync aio_fsync |
178 | aio_fdatasync aio_sync_file_range aio_pathsync aio_readahead |
178 | aio_fdatasync aio_sync_file_range aio_fallocate |
|
|
179 | aio_pathsync aio_readahead |
179 | aio_rename aio_link aio_move aio_copy aio_group |
180 | aio_rename aio_link aio_move aio_copy aio_group |
180 | aio_nop aio_mknod aio_load aio_rmtree aio_mkdir aio_chown |
181 | aio_nop aio_mknod aio_load aio_rmtree aio_mkdir aio_chown |
181 | aio_chmod aio_utime aio_truncate |
182 | aio_chmod aio_utime aio_truncate |
182 | aio_msync aio_mtouch aio_mlock aio_mlockall |
183 | aio_msync aio_mtouch aio_mlock aio_mlockall |
183 | aio_statvfs); |
184 | aio_statvfs); |
… | |
… | |
222 | aio_unlink $pathname, $callback->($status) |
223 | aio_unlink $pathname, $callback->($status) |
223 | aio_mknod $path, $mode, $dev, $callback->($status) |
224 | aio_mknod $path, $mode, $dev, $callback->($status) |
224 | aio_link $srcpath, $dstpath, $callback->($status) |
225 | aio_link $srcpath, $dstpath, $callback->($status) |
225 | aio_symlink $srcpath, $dstpath, $callback->($status) |
226 | aio_symlink $srcpath, $dstpath, $callback->($status) |
226 | aio_readlink $path, $callback->($link) |
227 | aio_readlink $path, $callback->($link) |
|
|
228 | aio_realpath $path, $callback->($link) |
227 | aio_rename $srcpath, $dstpath, $callback->($status) |
229 | aio_rename $srcpath, $dstpath, $callback->($status) |
228 | aio_mkdir $pathname, $mode, $callback->($status) |
230 | aio_mkdir $pathname, $mode, $callback->($status) |
229 | aio_rmdir $pathname, $callback->($status) |
231 | aio_rmdir $pathname, $callback->($status) |
230 | aio_readdir $pathname, $callback->($entries) |
232 | aio_readdir $pathname, $callback->($entries) |
231 | aio_readdirx $pathname, $flags, $callback->($entries, $flags) |
233 | aio_readdirx $pathname, $flags, $callback->($entries, $flags) |
… | |
… | |
368 | } else { |
370 | } else { |
369 | die "open failed: $!\n"; |
371 | die "open failed: $!\n"; |
370 | } |
372 | } |
371 | }; |
373 | }; |
372 | |
374 | |
|
|
375 | In addition to all the common open modes/flags (C<O_RDONLY>, C<O_WRONLY>, |
|
|
376 | C<O_RDWR>, C<O_CREAT>, C<O_TRUNC>, C<O_EXCL> and C<O_APPEND>), the |
|
|
377 | following POSIX and non-POSIX constants are available (missing ones on |
|
|
378 | your system are, as usual, C<0>): |
|
|
379 | |
|
|
380 | C<O_ASYNC>, C<O_DIRECT>, C<O_NOATIME>, C<O_CLOEXEC>, C<O_NOCTTY>, C<O_NOFOLLOW>, |
|
|
381 | C<O_NONBLOCK>, C<O_EXEC>, C<O_SEARCH>, C<O_DIRECTORY>, C<O_DSYNC>, |
|
|
382 | C<O_RSYNC>, C<O_SYNC> and C<O_TTY_INIT>. |
|
|
383 | |
373 | |
384 | |
374 | =item aio_close $fh, $callback->($status) |
385 | =item aio_close $fh, $callback->($status) |
375 | |
386 | |
376 | Asynchronously close a file and call the callback with the result |
387 | Asynchronously close a file and call the callback with the result |
377 | code. |
388 | code. |
… | |
… | |
427 | |
438 | |
428 | Tries to copy C<$length> bytes from C<$in_fh> to C<$out_fh>. It starts |
439 | Tries to copy C<$length> bytes from C<$in_fh> to C<$out_fh>. It starts |
429 | reading at byte offset C<$in_offset>, and starts writing at the current |
440 | reading at byte offset C<$in_offset>, and starts writing at the current |
430 | file offset of C<$out_fh>. Because of that, it is not safe to issue more |
441 | file offset of C<$out_fh>. Because of that, it is not safe to issue more |
431 | than one C<aio_sendfile> per C<$out_fh>, as they will interfere with each |
442 | than one C<aio_sendfile> per C<$out_fh>, as they will interfere with each |
432 | other. |
443 | other. The same C<$in_fh> works fine though, as this function does not |
|
|
444 | move or use the file offset of C<$in_fh>. |
433 | |
445 | |
434 | Please note that C<aio_sendfile> can read more bytes from C<$in_fh> than |
446 | Please note that C<aio_sendfile> can read more bytes from C<$in_fh> than |
435 | are written, and there is no way to find out how many bytes have been read |
447 | are written, and there is no way to find out how many more bytes have been |
436 | from C<aio_sendfile> alone, as C<aio_sendfile> only provides the number of |
448 | read from C<aio_sendfile> alone, as C<aio_sendfile> only provides the |
437 | bytes written to C<$out_fh>. Only if the result value equals C<$length> |
449 | number of bytes written to C<$out_fh>. Only if the result value equals |
438 | one can assume that C<$length> bytes have been read. |
450 | C<$length> one can assume that C<$length> bytes have been read. |
439 | |
451 | |
440 | Unlike with other C<aio_> functions, it makes a lot of sense to use |
452 | Unlike with other C<aio_> functions, it makes a lot of sense to use |
441 | C<aio_sendfile> on non-blocking sockets, as long as one end (typically |
453 | C<aio_sendfile> on non-blocking sockets, as long as one end (typically |
442 | the C<$in_fh>) is a file - the file I/O will then be asynchronous, while |
454 | the C<$in_fh>) is a file - the file I/O will then be asynchronous, while |
443 | the socket I/O will be non-blocking. Note, however, that you can run into |
455 | the socket I/O will be non-blocking. Note, however, that you can run |
444 | a trap where C<aio_sendfile> reads some data with readahead, then fails |
456 | into a trap where C<aio_sendfile> reads some data with readahead, then |
445 | to write all data, and when the socket is ready the next time, the data |
457 | fails to write all data, and when the socket is ready the next time, the |
446 | in the cache is already lost, forcing C<aio_sendfile> to again hit the |
458 | data in the cache is already lost, forcing C<aio_sendfile> to again hit |
447 | disk. Explicit C<aio_read> + C<aio_write> lets you control resource usage |
459 | the disk. Explicit C<aio_read> + C<aio_write> lets you better control |
448 | much better. |
460 | resource usage. |
449 | |
461 | |
450 | This call tries to make use of a native C<sendfile> syscall to provide |
462 | This call tries to make use of a native C<sendfile>-like syscall to |
451 | zero-copy operation. For this to work, C<$out_fh> should refer to a |
463 | provide zero-copy operation. For this to work, C<$out_fh> should refer to |
452 | socket, and C<$in_fh> should refer to an mmap'able file. |
464 | a socket, and C<$in_fh> should refer to an mmap'able file. |
453 | |
465 | |
454 | If a native sendfile cannot be found or it fails with C<ENOSYS>, |
466 | If a native sendfile cannot be found or it fails with C<ENOSYS>, |
455 | C<ENOTSUP>, C<EOPNOTSUPP>, C<EAFNOSUPPORT>, C<EPROTOTYPE> or C<ENOTSOCK>, |
467 | C<EINVAL>, C<ENOTSUP>, C<EOPNOTSUPP>, C<EAFNOSUPPORT>, C<EPROTOTYPE> or |
456 | it will be emulated, so you can call C<aio_sendfile> on any type of |
468 | C<ENOTSOCK>, it will be emulated, so you can call C<aio_sendfile> on any |
457 | filehandle regardless of the limitations of the operating system. |
469 | type of filehandle regardless of the limitations of the operating system. |
|
|
470 | |
|
|
471 | As native sendfile syscalls (as practically any non-POSIX interface hacked |
|
|
472 | together in a hurry to improve benchmark numbers) tend to be rather buggy |
|
|
473 | on many systems, this implementation tries to work around some known bugs |
|
|
474 | in Linux and FreeBSD kernels (probably others, too), but that might fail, |
|
|
475 | so you really really should check the return value of C<aio_sendfile> - |
|
|
476 | fewer bytes than expected might have been transferred. |
458 | |
477 | |
459 | |
478 | |
460 | =item aio_readahead $fh,$offset,$length, $callback->($retval) |
479 | =item aio_readahead $fh,$offset,$length, $callback->($retval) |
461 | |
480 | |
462 | C<aio_readahead> populates the page cache with data from a file so that |
481 | C<aio_readahead> populates the page cache with data from a file so that |
… | |
… | |
626 | Asynchronously read the symlink specified by C<$path> and pass it to |
645 | Asynchronously read the symlink specified by C<$path> and pass it to |
627 | the callback. If an error occurs, nothing or undef gets passed to the |
646 | the callback. If an error occurs, nothing or undef gets passed to the |
628 | callback. |
647 | callback. |
629 | |
648 | |
630 | |
649 | |
|
|
650 | =item aio_realpath $path, $callback->($path) |
|
|
651 | |
|
|
652 | Asynchronously make the path absolute and resolve any symlinks in |
|
|
653 | C<$path>. The resulting path only consists of directories (Same as |
|
|
654 | L<Cwd::realpath>). |
|
|
655 | |
|
|
656 | This request can be used to get the absolute path of the current working |
|
|
657 | directory by passing it a path of F<.> (a single dot). |
|
|
658 | |
|
|
659 | |
631 | =item aio_rename $srcpath, $dstpath, $callback->($status) |
660 | =item aio_rename $srcpath, $dstpath, $callback->($status) |
632 | |
661 | |
633 | Asynchronously rename the object at C<$srcpath> to C<$dstpath>, just as |
662 | Asynchronously rename the object at C<$srcpath> to C<$dstpath>, just as |
634 | rename(2) and call the callback with the result code. |
663 | rename(2) and call the callback with the result code. |
635 | |
664 | |
… | |
… | |
668 | |
697 | |
669 | =over 4 |
698 | =over 4 |
670 | |
699 | |
671 | =item IO::AIO::READDIR_DENTS |
700 | =item IO::AIO::READDIR_DENTS |
672 | |
701 | |
673 | When this flag is off, then the callback gets an arrayref of names |
702 | When this flag is off, then the callback gets an arrayref consisting of |
674 | only (as with C<aio_readdir>), otherwise it gets an arrayref with |
703 | names only (as with C<aio_readdir>), otherwise it gets an arrayref with |
675 | C<[$name, $type, $inode]> arrayrefs, each describing a single directory |
704 | C<[$name, $type, $inode]> arrayrefs, each describing a single directory |
676 | entry in more detail. |
705 | entry in more detail. |
677 | |
706 | |
678 | C<$name> is the name of the entry. |
707 | C<$name> is the name of the entry. |
679 | |
708 | |
… | |
… | |
692 | systems that do not deliver the inode information. |
721 | systems that do not deliver the inode information. |
693 | |
722 | |
694 | =item IO::AIO::READDIR_DIRS_FIRST |
723 | =item IO::AIO::READDIR_DIRS_FIRST |
695 | |
724 | |
696 | When this flag is set, then the names will be returned in an order where |
725 | When this flag is set, then the names will be returned in an order where |
697 | likely directories come first. This is useful when you need to quickly |
726 | likely directories come first, in optimal stat order. This is useful when |
698 | find directories, or you want to find all directories while avoiding to |
727 | you need to quickly find directories, or you want to find all directories |
699 | stat() each entry. |
728 | while avoiding having to stat() each entry. |
700 | |
729 | |
701 | If the system returns type information in readdir, then this is used |
730 | If the system returns type information in readdir, then this is used |
702 | to find directories directly. Otherwise, likely directories are files |
731 | to find directories directly. Otherwise, likely directories are names |
703 | beginning with ".", or otherwise files with no dots, of which files with |
732 | beginning with ".", or otherwise names with no dots, of which names with |
704 | short names are tried first. |
733 | short names are tried first. |
705 | |
734 | |
706 | =item IO::AIO::READDIR_STAT_ORDER |
735 | =item IO::AIO::READDIR_STAT_ORDER |
707 | |
736 | |
708 | When this flag is set, then the names will be returned in an order |
737 | When this flag is set, then the names will be returned in an order |
… | |
… | |
853 | if ($_[0] && $! == EXDEV) { |
882 | if ($_[0] && $! == EXDEV) { |
854 | aioreq_pri $pri; |
883 | aioreq_pri $pri; |
855 | add $grp aio_copy $src, $dst, sub { |
884 | add $grp aio_copy $src, $dst, sub { |
856 | $grp->result ($_[0]); |
885 | $grp->result ($_[0]); |
857 | |
886 | |
858 | if (!$_[0]) { |
887 | unless ($_[0]) { |
859 | aioreq_pri $pri; |
888 | aioreq_pri $pri; |
860 | add $grp aio_unlink $src; |
889 | add $grp aio_unlink $src; |
861 | } |
890 | } |
862 | }; |
891 | }; |
863 | } else { |
892 | } else { |
… | |
… | |
1406 | |
1435 | |
1407 | See C<poll_cb> for an example. |
1436 | See C<poll_cb> for an example. |
1408 | |
1437 | |
1409 | =item IO::AIO::poll_cb |
1438 | =item IO::AIO::poll_cb |
1410 | |
1439 | |
1411 | Process some outstanding events on the result pipe. You have to call this |
1440 | Process some outstanding events on the result pipe. You have to call |
1412 | regularly. Returns C<0> if all events could be processed, or C<-1> if it |
1441 | this regularly. Returns C<0> if all events could be processed (or there |
1413 | returned earlier for whatever reason. Returns immediately when no events |
1442 | were no events to process), or C<-1> if it returned earlier for whatever |
1414 | are outstanding. The amount of events processed depends on the settings of |
1443 | reason. Returns immediately when no events are outstanding. The amount of |
1415 | C<IO::AIO::max_poll_req> and C<IO::AIO::max_poll_time>. |
1444 | events processed depends on the settings of C<IO::AIO::max_poll_req> and |
|
|
1445 | C<IO::AIO::max_poll_time>. |
1416 | |
1446 | |
1417 | If not all requests were processed for whatever reason, the filehandle |
1447 | If not all requests were processed for whatever reason, the filehandle |
1418 | will still be ready when C<poll_cb> returns, so normally you don't have to |
1448 | will still be ready when C<poll_cb> returns, so normally you don't have to |
1419 | do anything special to have it called later. |
1449 | do anything special to have it called later. |
|
|
1450 | |
|
|
1451 | Apart from calling C<IO::AIO::poll_cb> when the event filehandle becomes |
|
|
1452 | ready, it can be beneficial to call this function from loops which submit |
|
|
1453 | a lot of requests, to make sure the results get processed when they become |
|
|
1454 | available and not just when the loop is finished and the event loop takes |
|
|
1455 | over again. This function returns very fast when there are no outstanding |
|
|
1456 | requests. |
1420 | |
1457 | |
1421 | Example: Install an Event watcher that automatically calls |
1458 | Example: Install an Event watcher that automatically calls |
1422 | IO::AIO::poll_cb with high priority (more examples can be found in the |
1459 | IO::AIO::poll_cb with high priority (more examples can be found in the |
1423 | SYNOPSIS section, at the top of this document): |
1460 | SYNOPSIS section, at the top of this document): |
1424 | |
1461 | |
… | |
… | |
1547 | Sets the minimum idle timeout (default 10) after which worker threads are |
1584 | Sets the minimum idle timeout (default 10) after which worker threads are |
1548 | allowed to exit. See C<IO::AIO::max_idle>. |
1585 | allowed to exit. See C<IO::AIO::max_idle>. |
1549 | |
1586 | |
1550 | =item IO::AIO::max_outstanding $maxreqs |
1587 | =item IO::AIO::max_outstanding $maxreqs |
1551 | |
1588 | |
|
|
1589 | Sets the maximum number of outstanding requests to C<$maxreqs>. If |
|
|
1590 | you do queue up more than this number of requests, the next call to |
|
|
1591 | C<IO::AIO::poll_cb> (and other functions calling C<poll_cb>, such as |
|
|
1592 | C<IO::AIO::flush> or C<IO::AIO::poll>) will block until the limit is no |
|
|
1593 | longer exceeded. |
|
|
1594 | |
|
|
1595 | In other words, this setting does not enforce a queue limit, but can be |
|
|
1596 | used to make poll functions block if the limit is exceeded. |
|
|
1597 | |
1552 | This is a very bad function to use in interactive programs because it |
1598 | This is a very bad function to use in interactive programs because it |
1553 | blocks, and a bad way to reduce concurrency because it is inexact: Better |
1599 | blocks, and a bad way to reduce concurrency because it is inexact: Better |
1554 | use an C<aio_group> together with a feed callback. |
1600 | use an C<aio_group> together with a feed callback. |
1555 | |
1601 | |
1556 | Sets the maximum number of outstanding requests to C<$maxreqs>. If you |
1602 | Its main use is in scripts without an event loop - when you want to stat |
1557 | do queue up more than this number of requests, the next call to the |
1603 | a lot of files, you can write something like this: |
1558 | C<poll_cb> (and C<poll_some> and other functions calling C<poll_cb>) |
|
|
1559 | function will block until the limit is no longer exceeded. |
|
|
1560 | |
1604 | |
1561 | The default value is very large, so there is no practical limit on the |
1605 | IO::AIO::max_outstanding 32; |
1562 | number of outstanding requests. |
|
|
1563 | |
1606 | |
1564 | You can still queue as many requests as you want. Therefore, |
1607 | for my $path (...) { |
1565 | C<max_outstanding> is mainly useful in simple scripts (with low values) or |
1608 | aio_stat $path , ...; |
1566 | as a stop gap to shield against fatal memory overflow (with large values). |
1609 | IO::AIO::poll_cb; |
|
|
1610 | } |
|
|
1611 | |
|
|
1612 | IO::AIO::flush; |
|
|
1613 | |
|
|
1614 | The call to C<poll_cb> inside the loop will normally return instantly, but |
|
|
1615 | as soon as more than C<32> requests are in-flight, it will block until |
|
|
1616 | some requests have been handled. This keeps the loop from pushing a large |
|
|
1617 | number of C<aio_stat> requests onto the queue. |
|
|
1618 | |
|
|
1619 | The default value for C<max_outstanding> is very large, so there is no |
|
|
1620 | practical limit on the number of outstanding requests. |
1567 | |
1621 | |
1568 | =back |
1622 | =back |
1569 | |
1623 | |
1570 | =head3 STATISTICAL INFORMATION |
1624 | =head3 STATISTICAL INFORMATION |
1571 | |
1625 | |
… | |
… | |
1747 | Danga::Socket->AddOtherFds (IO::AIO::poll_fileno => |
1801 | Danga::Socket->AddOtherFds (IO::AIO::poll_fileno => |
1748 | \&IO::AIO::poll_cb); |
1802 | \&IO::AIO::poll_cb); |
1749 | |
1803 | |
1750 | =head2 FORK BEHAVIOUR |
1804 | =head2 FORK BEHAVIOUR |
1751 | |
1805 | |
1752 | This module should do "the right thing" when the process using it forks: |
1806 | Usage of pthreads in a program changes the semantics of fork |
|
|
1807 | considerably. Specifically, only async-safe functions can be called after |
|
|
1808 | fork. Perl doesn't know about this, so in general, you cannot call fork |
|
|
1809 | with defined behaviour in perl. IO::AIO uses pthreads, so this applies to |


1810 | it, but many other extensions and (for inexplicable reasons) perl itself |


1811 | are often linked against pthreads as well, so it applies to them, too. |
1753 | |
1812 | |
1754 | Before the fork, IO::AIO enters a quiescent state where no requests |
1813 | Some operating systems have extensions that allow safe use of fork, and |
1755 | can be added in other threads and no results will be processed. After |
1814 | this module should do "the right thing" on those, and tries on others. At |
1756 | the fork the parent simply leaves the quiescent state and continues |
1815 | the time of this writing (2011) only GNU/Linux supports these extensions |
1757 | request/result processing, while the child frees the request/result queue |
1816 | to POSIX. |
1758 | (so that the requests started before the fork will only be handled in the |
|
|
1759 | parent). Threads will be started on demand until the limit set in the |
|
|
1760 | parent process has been reached again. |
|
|
1761 | |
|
|
1762 | In short: the parent will, after a short pause, continue as if fork had |
|
|
1763 | not been called, while the child will act as if IO::AIO has not been used |
|
|
1764 | yet. |
|
|
1765 | |
1817 | |
1766 | =head2 MEMORY USAGE |
1818 | =head2 MEMORY USAGE |
1767 | |
1819 | |
1768 | Per-request usage: |
1820 | Per-request usage: |
1769 | |
1821 | |