package AnyEvent::Handle; no warnings; use strict; use AnyEvent (); use AnyEvent::Util (); use Scalar::Util (); use Carp (); use Fcntl (); use Errno qw/EAGAIN EINTR/; =head1 NAME AnyEvent::Handle - non-blocking I/O on filehandles via AnyEvent =cut our $VERSION = '0.02'; =head1 SYNOPSIS use AnyEvent; use AnyEvent::Handle; my $cv = AnyEvent->condvar; my $ae_fh = AnyEvent::Handle->new (fh => \*STDIN); #TODO # or use the constructor to pass the callback: my $ae_fh2 = AnyEvent::Handle->new ( fh => \*STDIN, on_eof => sub { $cv->broadcast; }, #TODO ); $cv->wait; =head1 DESCRIPTION This module is a helper module to make it easier to do event-based I/O on filehandles (and sockets, see L for an easy way to make non-blocking resolves and connects). In the following, when the documentation refers to of "bytes" then this means characters. As sysread and syswrite are used for all I/O, their treatment of characters applies to this module as well. All callbacks will be invoked with the handle object as their first argument. =head1 METHODS =over 4 =item B The constructor supports these arguments (all as key => value pairs). =over 4 =item fh => $filehandle [MANDATORY] The filehandle this L object will operate on. NOTE: The filehandle will be set to non-blocking (using AnyEvent::Util::fh_nonblocking). =item on_eof => $cb->($self) [MANDATORY] Set the callback to be called on EOF. =item on_error => $cb->($self) This is the fatal error callback, that is called when, well, a fatal error ocurs, such as not being able to resolve the hostname, failure to connect or a read error. The object will not be in a usable state when this callback has been called. On callback entrance, the value of C<$!> contains the operating system error (or C or C). While not mandatory, it is I recommended to set this callback, as you will not be notified of errors otherwise. The default simply calls die. =item on_read => $cb->($self) This sets the default read callback, which is called when data arrives and no read request is in the queue. To access (and remove data from) the read buffer, use the C<< ->rbuf >> method or acces sthe C<$self->{rbuf}> member directly. When an EOF condition is detected then AnyEvent::Handle will first try to feed all the remaining data to the queued callbacks and C before calling the C callback. If no progress can be made, then a fatal error will be raised (with C<$!> set to C). =item on_drain => $cb->() This sets the callback that is called when the write buffer becomes empty (or when the callback is set and the buffer is empty already). To append to the write buffer, use the C<< ->push_write >> method. =item rbuf_max => If defined, then a fatal error will be raised (with C<$!> set to C) when the read buffer ever (strictly) exceeds this size. This is useful to avoid denial-of-service attacks. For example, a server accepting connections from untrusted sources should be configured to accept only so-and-so much data that it cannot act on (for example, when expecting a line, an attacker could send an unlimited amount of data without a callback ever being called as long as the line isn't finished). =item read_size => The default read block size (the amount of bytes this module will try to read on each [loop iteration). Default: C<4096>. =item low_water_mark => Sets the amount of bytes (default: C<0>) that make up an "empty" write buffer: If the write reaches this size or gets even samller it is considered empty. =back =cut sub new { my $class = shift; my $self = bless { @_ }, $class; $self->{fh} or Carp::croak "mandatory argument fh is missing"; AnyEvent::Util::fh_nonblocking $self->{fh}, 1; $self->on_eof ((delete $self->{on_eof} ) or Carp::croak "mandatory argument on_eof is missing"); $self->on_error (delete $self->{on_error}) if $self->{on_error}; $self->on_drain (delete $self->{on_drain}) if $self->{on_drain}; $self->on_read (delete $self->{on_read} ) if $self->{on_read}; $self->start_read; $self } sub _shutdown { my ($self) = @_; delete $self->{rw}; delete $self->{ww}; delete $self->{fh}; } sub error { my ($self) = @_; { local $!; $self->_shutdown; } if ($self->{on_error}) { $self->{on_error}($self); } else { die "AnyEvent::Handle uncaught fatal error: $!"; } } =item $fh = $handle->fh This method returns the filehandle of the L object. =cut sub fh { $_[0]->{fh} } =item $handle->on_error ($cb) Replace the current C callback (see the C constructor argument). =cut sub on_error { $_[0]{on_error} = $_[1]; } =item $handle->on_eof ($cb) Replace the current C callback (see the C constructor argument). =cut sub on_eof { $_[0]{on_eof} = $_[1]; } ############################################################################# =back =head2 WRITE QUEUE AnyEvent::Handle manages two queues per handle, one for writing and one for reading. The write queue is very simple: you can add data to its end, and AnyEvent::Handle will automatically try to get rid of it for you. When data could be writtena nd the write buffer is shorter then the low water mark, the C callback will be invoked. =over 4 =item $handle->on_drain ($cb) Sets the C callback or clears it (see the description of C in the constructor). =cut sub on_drain { my ($self, $cb) = @_; $self->{on_drain} = $cb; $cb->($self) if $cb && $self->{low_water_mark} >= length $self->{wbuf}; } =item $handle->push_write ($data) Queues the given scalar to be written. You can push as much data as you want (only limited by the available memory), as C buffers it independently of the kernel. =cut sub push_write { my ($self, $data) = @_; $self->{wbuf} .= $data; unless ($self->{ww}) { Scalar::Util::weaken $self; my $cb = sub { my $len = syswrite $self->{fh}, $self->{wbuf}; if ($len > 0) { substr $self->{wbuf}, 0, $len, ""; $self->{on_drain}($self) if $self->{low_water_mark} >= length $self->{wbuf} && $self->{on_drain}; delete $self->{ww} unless length $self->{wbuf}; } elsif ($! != EAGAIN && $! != EINTR) { $self->error; } }; $self->{ww} = AnyEvent->io (fh => $self->{fh}, poll => "w", cb => $cb); $cb->($self); }; } ############################################################################# =back =head2 READ QUEUE AnyEvent::Handle manages two queues per handle, one for writing and one for reading. The read queue is more complex than the write queue. It can be used in two ways, the "simple" way, using only C and the "complex" way, using a queue. In the simple case, you just install an C callback and whenever new data arrives, it will be called. You can then remove some data (if enough is there) from the read buffer (C<< $handle->rbuf >>) if you want or not. In the more complex case, you want to queue multiple callbacks. In this case, AnyEvent::Handle will call the first queued callback each time new data arrives and removes it when it has done its job (see C, below). This way you can, for example, push three line-reads, followed by reading a chunk of data, and AnyEvent::Handle will execute them in order. Example 1: EPP protocol parser. EPP sends 4 byte length info, followed by the specified number of bytes which give an XML datagram. # in the default state, expect some header bytes $handle->on_read (sub { # some data is here, now queue the length-header-read (4 octets) shift->unshift_read_chunk (4, sub { # header arrived, decode my $len = unpack "N", $_[1]; # now read the payload shift->unshift_read_chunk ($len, sub { my $xml = $_[1]; # handle xml }); }); }); Example 2: Implement a client for a protocol that replies either with "OK" and another line or "ERROR" for one request, and 64 bytes for the second request. Due tot he availability of a full queue, we can just pipeline sending both requests and manipulate the queue as necessary in the callbacks: # request one $handle->push_write ("request 1\015\012"); # we expect "ERROR" or "OK" as response, so push a line read $handle->push_read_line (sub { # if we got an "OK", we have to _prepend_ another line, # so it will be read before the second request reads its 64 bytes # which are already in the queue when this callback is called # we don't do this in case we got an error if ($_[1] eq "OK") { $_[0]->unshift_read_line (sub { my $response = $_[1]; ... }); } }); # request two $handle->push_write ("request 2\015\012"); # simply read 64 bytes, always $handle->push_read_chunk (64, sub { my $response = $_[1]; ... }); =over 4 =cut sub _drain_rbuf { my ($self) = @_; return if exists $self->{in_drain}; local $self->{in_drain} = 1; while (my $len = length $self->{rbuf}) { no strict 'refs'; if (my $cb = shift @{ $self->{queue} }) { if (!$cb->($self)) { if ($self->{eof}) { # no progress can be made (not enough data and no data forthcoming) $! = &Errno::EPIPE; return $self->error; } unshift @{ $self->{queue} }, $cb; return; } } elsif ($self->{on_read}) { $self->{on_read}($self); if ( $self->{eof} # if no further data will arrive && $len == length $self->{rbuf} # and no data has been consumed && !@{ $self->{queue} } # and the queue is still empty && $self->{on_read} # and we still want to read data ) { # then no progress can be made $! = &Errno::EPIPE; return $self->error; } } else { # read side becomes idle delete $self->{rw}; return; } } if ($self->{eof}) { $self->_shutdown; $self->{on_eof}($self); } } =item $handle->on_read ($cb) This replaces the currently set C callback, or clears it (when the new callback is C). See the description of C in the constructor. =cut sub on_read { my ($self, $cb) = @_; $self->{on_read} = $cb; } =item $handle->rbuf Returns the read buffer (as a modifiable lvalue). You can access the read buffer directly as the C<< ->{rbuf} >> member, if you want. NOTE: The read buffer should only be used or modified if the C, C or C methods are used. The other read methods automatically manage the read buffer. =cut sub rbuf : lvalue { $_[0]{rbuf} } =item $handle->push_read ($cb) =item $handle->unshift_read ($cb) Append the given callback to the end of the queue (C) or prepend it (C). The callback is called each time some additional read data arrives. It must check wether enough data is in the read buffer already. If not enough data is available, it must return the empty list or a false value, in which case it will be called repeatedly until enough data is available (or an error condition is detected). If enough data was available, then the callback must remove all data it is interested in (which can be none at all) and return a true value. After returning true, it will be removed from the queue. =cut sub push_read { my ($self, $cb) = @_; push @{ $self->{queue} }, $cb; $self->_drain_rbuf; } sub unshift_read { my ($self, $cb) = @_; push @{ $self->{queue} }, $cb; $self->_drain_rbuf; } =item $handle->push_read_chunk ($len, $cb->($self, $data)) =item $handle->unshift_read_chunk ($len, $cb->($self, $data)) Append the given callback to the end of the queue (C) or prepend it (C). The callback will be called only once C<$len> bytes have been read, and these C<$len> bytes will be passed to the callback. =cut sub _read_chunk($$) { my ($self, $len, $cb) = @_; sub { $len <= length $_[0]{rbuf} or return; $cb->($self, $_[0], substr $_[0]{rbuf}, 0, $len, ""); 1 } } sub push_read_chunk { $_[0]->push_read (&_read_chunk); } sub unshift_read_chunk { $_[0]->unshift_read (&_read_chunk); } =item $handle->push_read_line ([$eol, ]$cb->($self, $line, $eol)) =item $handle->unshift_read_line ([$eol, ]$cb->($self, $line, $eol)) Append the given callback to the end of the queue (C) or prepend it (C). The callback will be called only once a full line (including the end of line marker, C<$eol>) has been read. This line (excluding the end of line marker) will be passed to the callback as second argument (C<$line>), and the end of line marker as the third argument (C<$eol>). The end of line marker, C<$eol>, can be either a string, in which case it will be interpreted as a fixed record end marker, or it can be a regex object (e.g. created by C), in which case it is interpreted as a regular expression. The end of line marker argument C<$eol> is optional, if it is missing (NOT undef), then C is used (which is good for most internet protocols). Partial lines at the end of the stream will never be returned, as they are not marked by the end of line marker. =cut sub _read_line($$) { my $self = shift; my $cb = pop; my $eol = @_ ? shift : qr|(\015?\012)|; my $pos; $eol = qr|(\Q$eol\E)| unless ref $eol; $eol = qr|^(.*?)($eol)|; sub { $_[0]{rbuf} =~ s/$eol// or return; $cb->($self, $1, $2); 1 } } sub push_read_line { $_[0]->push_read (&_read_line); } sub unshift_read_line { $_[0]->unshift_read (&_read_line); } =item $handle->stop_read =item $handle->start_read In rare cases you actually do not want to read anything form the socket. In this case you can call C. Neither C no any queued callbacks will be executed then. To start readign again, call C. =cut sub stop_read { my ($self) = @_; delete $self->{rw}; } sub start_read { my ($self) = @_; unless ($self->{rw} || $self->{eof}) { Scalar::Util::weaken $self; $self->{rw} = AnyEvent->io (fh => $self->{fh}, poll => "r", cb => sub { my $len = sysread $self->{fh}, $self->{rbuf}, $self->{read_size} || 8192, length $self->{rbuf}; if ($len > 0) { if (exists $self->{rbuf_max}) { if ($self->{rbuf_max} < length $self->{rbuf}) { $! = &Errno::ENOSPC; return $self->error; } } } elsif (defined $len) { $self->{eof} = 1; delete $self->{rw}; } elsif ($! != EAGAIN && $! != EINTR) { return $self->error; } $self->_drain_rbuf; }); } } =back =head1 AUTHOR Robin Redeker C<< >>, Marc Lehmann . =cut 1; # End of AnyEvent::Handle