… | |
… | |
193 | use strict 'vars'; |
193 | use strict 'vars'; |
194 | |
194 | |
195 | use base 'Exporter'; |
195 | use base 'Exporter'; |
196 | |
196 | |
197 | BEGIN { |
197 | BEGIN { |
198 | our $VERSION = '3.19'; |
198 | our $VERSION = '3.2'; |
199 | |
199 | |
200 | our @AIO_REQ = qw(aio_sendfile aio_read aio_write aio_open aio_close |
200 | our @AIO_REQ = qw(aio_sendfile aio_read aio_write aio_open aio_close |
201 | aio_stat aio_lstat aio_unlink aio_rmdir aio_readdir |
201 | aio_stat aio_lstat aio_unlink aio_rmdir aio_readdir aio_readdirx |
202 | aio_scandir aio_symlink aio_readlink aio_sync aio_fsync |
202 | aio_scandir aio_symlink aio_readlink aio_sync aio_fsync |
203 | aio_fdatasync aio_sync_file_range aio_pathsync aio_readahead |
203 | aio_fdatasync aio_sync_file_range aio_pathsync aio_readahead |
204 | aio_rename aio_link aio_move aio_copy aio_group |
204 | aio_rename aio_link aio_move aio_copy aio_group |
205 | aio_nop aio_mknod aio_load aio_rmtree aio_mkdir aio_chown |
205 | aio_nop aio_mknod aio_load aio_rmtree aio_mkdir aio_chown |
206 | aio_chmod aio_utime aio_truncate); |
206 | aio_chmod aio_utime aio_truncate); |
… | |
… | |
533 | |
533 | |
534 | Unlike the POSIX call of the same name, C<aio_readdir> reads an entire |
534 | Unlike the POSIX call of the same name, C<aio_readdir> reads an entire |
535 | directory (i.e. opendir + readdir + closedir). The entries will not be |
535 | directory (i.e. opendir + readdir + closedir). The entries will not be |
536 | sorted, and will B<NOT> include the C<.> and C<..> entries. |
536 | sorted, and will B<NOT> include the C<.> and C<..> entries. |
537 | |
537 | |
538 | The callback a single argument which is either C<undef> or an array-ref |
538 | The callback is passed a single argument which is either C<undef> or an |
539 | with the filenames. |
539 | array-ref with the filenames. |
|
|
540 | |
|
|
541 | |
|
|
542 | =item aio_readdirx $pathname, $flags, $callback->($entries, $flags) |
|
|
543 | |
|
|
544 | Quite similar to C<aio_readdir>, but the C<$flags> argument allows to tune |
|
|
545 | behaviour and output format. In case of an error, C<$entries> will be |
|
|
546 | C<undef>. |
|
|
547 | |
|
|
548 | The flags are a combination of the following constants, ORed together (the |
|
|
549 | flags will also be passed to the callback, possibly modified): |
|
|
550 | |
|
|
551 | =over 4 |
|
|
552 | |
|
|
553 | =item AIO::READDIR_DENTS |
|
|
554 | |
|
|
555 | When this flag is off, then the callback gets an arrayref with of names |
|
|
556 | only (as with C<aio_readdir>), otherwise it gets an arrayref with |
|
|
557 | C<[$name, $inode, $type]> arrayrefs, each describing a single directory |
|
|
558 | entry in more detail. |
|
|
559 | |
|
|
560 | C<$name> is the name of the entry. |
|
|
561 | |
|
|
562 | C<$inode> is the inode number (which might not be exact on systems with 64 |
|
|
563 | bit inode numbers and 32 bit perls). On systems that do not deliver the |
|
|
564 | inode information, this will always be zero. |
|
|
565 | |
|
|
566 | C<$type> is one of the C<AIO::DT_xxx> constants: |
|
|
567 | |
|
|
568 | C<AIO::DT_UNKNOWN>, C<AIO::DT_FIFO>, C<AIO::DT_CHR>, C<AIO::DT_DIR>, |
|
|
569 | C<AIO::DT_BLK>, C<AIO::DT_REG>, C<AIO::DT_LNK>, C<AIO::DT_SOCK>, |
|
|
570 | C<AIO::DT_WHT>. |
|
|
571 | |
|
|
572 | C<AIO::DT_UNKNOWN> means just that: readdir does not know. If you need to |
|
|
573 | know, you have to run stat yourself. Also, for speed reasons, the C<$type> |
|
|
574 | scalars are read-only: you can not modify them. |
|
|
575 | |
|
|
576 | =item AIO::READDIR_DIRS_FIRST |
|
|
577 | |
|
|
578 | When this flag is set, then the names will be returned in an order where |
|
|
579 | likely directories come first. This is useful when you need to quickly |
|
|
580 | find directories, or you want to find all directories while avoiding to |
|
|
581 | stat() each entry. |
|
|
582 | |
|
|
583 | If the system returns type information in readdir, then this is used |
|
|
584 | to find directories directly. Otherwise, likely directories are files |
|
|
585 | beginning with ".", or otherwise files with no dots, of which files with |
|
|
586 | short names are tried first. |
|
|
587 | |
|
|
588 | =item AIO::READDIR_STAT_ORDER |
|
|
589 | |
|
|
590 | When this flag is set, then the names will be returned in an order |
|
|
591 | suitable for stat()'ing each one. That is, when you plan to stat() |
|
|
592 | all files in the given directory, then the returned order will likely |
|
|
593 | be fastest. |
|
|
594 | |
|
|
595 | If both this flag and IO::READDIR_DIRS_FIRST are specified, then the |
|
|
596 | likely dirs come first, resulting in a less optimal stat order. |
|
|
597 | |
|
|
598 | =item AIO::READDIR_FOUND_UNKNOWN |
|
|
599 | |
|
|
600 | This flag should not be set when calling C<aio_readdirx>. Instead, it |
|
|
601 | is being set by C<aio_readdirx>, when any of the C<$type>'s found were |
|
|
602 | C<AIO::DT_UNKNOWN>. The absense of this flag therefore indicates that all |
|
|
603 | C<$type>'s are known, which can be used to speed up some algorithms. |
|
|
604 | |
|
|
605 | =back |
540 | |
606 | |
541 | |
607 | |
542 | =item aio_load $path, $data, $callback->($status) |
608 | =item aio_load $path, $data, $callback->($status) |
543 | |
609 | |
544 | This is a composite request that tries to fully load the given file into |
610 | This is a composite request that tries to fully load the given file into |
… | |
… | |
709 | |
775 | |
710 | Implementation notes. |
776 | Implementation notes. |
711 | |
777 | |
712 | The C<aio_readdir> cannot be avoided, but C<stat()>'ing every entry can. |
778 | The C<aio_readdir> cannot be avoided, but C<stat()>'ing every entry can. |
713 | |
779 | |
|
|
780 | If readdir returns file type information, then this is used directly to |
|
|
781 | find directories. |
|
|
782 | |
714 | After reading the directory, the modification time, size etc. of the |
783 | Otherwise, after reading the directory, the modification time, size etc. |
715 | directory before and after the readdir is checked, and if they match (and |
784 | of the directory before and after the readdir is checked, and if they |
716 | isn't the current time), the link count will be used to decide how many |
785 | match (and isn't the current time), the link count will be used to decide |
717 | entries are directories (if >= 2). Otherwise, no knowledge of the number |
786 | how many entries are directories (if >= 2). Otherwise, no knowledge of the |
718 | of subdirectories will be assumed. |
787 | number of subdirectories will be assumed. |
719 | |
788 | |
720 | Then entries will be sorted into likely directories (everything without |
789 | Then entries will be sorted into likely directories a non-initial dot |
721 | a non-initial dot currently) and likely non-directories (everything |
790 | currently) and likely non-directories (see C<aio_readdirx>). Then every |
722 | else). Then every entry plus an appended C</.> will be C<stat>'ed, |
791 | entry plus an appended C</.> will be C<stat>'ed, likely directories first, |
723 | likely directories first. If that succeeds, it assumes that the entry |
792 | in order of their inode numbers. If that succeeds, it assumes that the |
724 | is a directory or a symlink to directory (which will be checked |
793 | entry is a directory or a symlink to directory (which will be checked |
725 | seperately). This is often faster than stat'ing the entry itself because |
794 | seperately). This is often faster than stat'ing the entry itself because |
726 | filesystems might detect the type of the entry without reading the inode |
795 | filesystems might detect the type of the entry without reading the inode |
727 | data (e.g. ext2fs filetype feature). |
796 | data (e.g. ext2fs filetype feature), even on systems that cannot return |
|
|
797 | the filetype information on readdir. |
728 | |
798 | |
729 | If the known number of directories (link count - 2) has been reached, the |
799 | If the known number of directories (link count - 2) has been reached, the |
730 | rest of the entries is assumed to be non-directories. |
800 | rest of the entries is assumed to be non-directories. |
731 | |
801 | |
732 | This only works with certainty on POSIX (= UNIX) filesystems, which |
802 | This only works with certainty on POSIX (= UNIX) filesystems, which |
… | |
… | |
754 | my $now = time; |
824 | my $now = time; |
755 | my $hash1 = join ":", (stat _)[0,1,3,7,9]; |
825 | my $hash1 = join ":", (stat _)[0,1,3,7,9]; |
756 | |
826 | |
757 | # read the directory entries |
827 | # read the directory entries |
758 | aioreq_pri $pri; |
828 | aioreq_pri $pri; |
759 | add $grp aio_readdir $path, sub { |
829 | add $grp aio_readdirx $path, READDIR_DIRS_FIRST, sub { |
760 | my $entries = shift |
830 | my $entries = shift |
761 | or return $grp->result (); |
831 | or return $grp->result (); |
762 | |
832 | |
763 | # stat the dir another time |
833 | # stat the dir another time |
764 | aioreq_pri $pri; |
834 | aioreq_pri $pri; |
… | |
… | |
774 | # if nlink == 2, we are finished |
844 | # if nlink == 2, we are finished |
775 | # on non-posix-fs's, we rely on nlink < 2 |
845 | # on non-posix-fs's, we rely on nlink < 2 |
776 | $ndirs = (stat _)[3] - 2 |
846 | $ndirs = (stat _)[3] - 2 |
777 | or return $grp->result ([], $entries); |
847 | or return $grp->result ([], $entries); |
778 | } |
848 | } |
779 | |
|
|
780 | # sort into likely dirs and likely nondirs |
|
|
781 | # dirs == files without ".", short entries first |
|
|
782 | $entries = [map $_->[0], |
|
|
783 | sort { $b->[1] cmp $a->[1] } |
|
|
784 | map [$_, sprintf "%s%04d", (/.\./ ? "1" : "0"), length], |
|
|
785 | @$entries]; |
|
|
786 | |
849 | |
787 | my (@dirs, @nondirs); |
850 | my (@dirs, @nondirs); |
788 | |
851 | |
789 | my $statgrp = add $grp aio_group sub { |
852 | my $statgrp = add $grp aio_group sub { |
790 | $grp->result (\@dirs, \@nondirs); |
853 | $grp->result (\@dirs, \@nondirs); |