ViewVC Help
View File | Revision Log | Show Annotations | Download File
/cvs/AnyEvent/lib/AnyEvent/Handle.pm
(Generate patch)

Comparing AnyEvent/lib/AnyEvent/Handle.pm (file contents):
Revision 1.6 by elmex, Mon Apr 28 09:27:47 2008 UTC vs.
Revision 1.42 by root, Tue May 27 06:23:15 2008 UTC

1package AnyEvent::Handle; 1package AnyEvent::Handle;
2 2
3no warnings; 3no warnings;
4use strict; 4use strict;
5 5
6use AnyEvent; 6use AnyEvent ();
7use IO::Handle; 7use AnyEvent::Util qw(WSAEWOULDBLOCK);
8use Scalar::Util ();
9use Carp ();
10use Fcntl ();
8use Errno qw/EAGAIN EINTR/; 11use Errno qw/EAGAIN EINTR/;
9 12
10=head1 NAME 13=head1 NAME
11 14
12AnyEvent::Handle - non-blocking I/O on filehandles via AnyEvent 15AnyEvent::Handle - non-blocking I/O on file handles via AnyEvent
13 16
14=head1 VERSION
15
16Version 0.01
17
18=cut 17=cut
19 18
20our $VERSION = '0.01'; 19our $VERSION = '0.04';
21 20
22=head1 SYNOPSIS 21=head1 SYNOPSIS
23 22
24 use AnyEvent; 23 use AnyEvent;
25 use AnyEvent::Handle; 24 use AnyEvent::Handle;
26 25
27 my $cv = AnyEvent->condvar; 26 my $cv = AnyEvent->condvar;
28 27
29 my $ae_fh = AnyEvent::Handle->new (fh => \*STDIN); 28 my $handle =
30
31 $ae_fh->on_eof (sub { $cv->broadcast });
32
33 $ae_fh->readlines (sub {
34 my ($ae_fh, @lines) = @_;
35 for (@lines) {
36 chomp;
37 print "Line: $_";
38 }
39 });
40
41 # or use the constructor to pass the callback:
42
43 my $ae_fh2 =
44 AnyEvent::Handle->new ( 29 AnyEvent::Handle->new (
45 fh => \*STDIN, 30 fh => \*STDIN,
46 on_eof => sub { 31 on_eof => sub {
47 $cv->broadcast; 32 $cv->broadcast;
48 }, 33 },
49 on_readline => sub { 34 );
35
36 # send some request line
37 $handle->push_write ("getinfo\015\012");
38
39 # read the response line
40 $handle->push_read (line => sub {
50 my ($ae_fh, @lines) = @_; 41 my ($handle, $line) = @_;
51 for (@lines) { 42 warn "read line <$line>\n";
52 chomp; 43 $cv->send;
53 print "Line: $_"; 44 });
45
46 $cv->recv;
47
48=head1 DESCRIPTION
49
50This module is a helper module to make it easier to do event-based I/O on
51filehandles. For utility functions for doing non-blocking connects and accepts
52on sockets see L<AnyEvent::Util>.
53
54In the following, when the documentation refers to of "bytes" then this
55means characters. As sysread and syswrite are used for all I/O, their
56treatment of characters applies to this module as well.
57
58All callbacks will be invoked with the handle object as their first
59argument.
60
61=head1 METHODS
62
63=over 4
64
65=item B<new (%args)>
66
67The constructor supports these arguments (all as key => value pairs).
68
69=over 4
70
71=item fh => $filehandle [MANDATORY]
72
73The filehandle this L<AnyEvent::Handle> object will operate on.
74
75NOTE: The filehandle will be set to non-blocking (using
76AnyEvent::Util::fh_nonblocking).
77
78=item on_eof => $cb->($handle)
79
80Set the callback to be called on EOF.
81
82While not mandatory, it is highly recommended to set an eof callback,
83otherwise you might end up with a closed socket while you are still
84waiting for data.
85
86=item on_error => $cb->($handle)
87
88This is the fatal error callback, that is called when, well, a fatal error
89occurs, such as not being able to resolve the hostname, failure to connect
90or a read error.
91
92The object will not be in a usable state when this callback has been
93called.
94
95On callback entrance, the value of C<$!> contains the operating system
96error (or C<ENOSPC>, C<EPIPE> or C<EBADMSG>).
97
98The callback should throw an exception. If it returns, then
99AnyEvent::Handle will C<croak> for you.
100
101While not mandatory, it is I<highly> recommended to set this callback, as
102you will not be notified of errors otherwise. The default simply calls
103die.
104
105=item on_read => $cb->($handle)
106
107This sets the default read callback, which is called when data arrives
108and no read request is in the queue.
109
110To access (and remove data from) the read buffer, use the C<< ->rbuf >>
111method or access the C<$handle->{rbuf}> member directly.
112
113When an EOF condition is detected then AnyEvent::Handle will first try to
114feed all the remaining data to the queued callbacks and C<on_read> before
115calling the C<on_eof> callback. If no progress can be made, then a fatal
116error will be raised (with C<$!> set to C<EPIPE>).
117
118=item on_drain => $cb->($handle)
119
120This sets the callback that is called when the write buffer becomes empty
121(or when the callback is set and the buffer is empty already).
122
123To append to the write buffer, use the C<< ->push_write >> method.
124
125=item rbuf_max => <bytes>
126
127If defined, then a fatal error will be raised (with C<$!> set to C<ENOSPC>)
128when the read buffer ever (strictly) exceeds this size. This is useful to
129avoid denial-of-service attacks.
130
131For example, a server accepting connections from untrusted sources should
132be configured to accept only so-and-so much data that it cannot act on
133(for example, when expecting a line, an attacker could send an unlimited
134amount of data without a callback ever being called as long as the line
135isn't finished).
136
137=item read_size => <bytes>
138
139The default read block size (the amount of bytes this module will try to read
140on each [loop iteration). Default: C<4096>.
141
142=item low_water_mark => <bytes>
143
144Sets the amount of bytes (default: C<0>) that make up an "empty" write
145buffer: If the write reaches this size or gets even samller it is
146considered empty.
147
148=item tls => "accept" | "connect" | Net::SSLeay::SSL object
149
150When this parameter is given, it enables TLS (SSL) mode, that means it
151will start making tls handshake and will transparently encrypt/decrypt
152data.
153
154TLS mode requires Net::SSLeay to be installed (it will be loaded
155automatically when you try to create a TLS handle).
156
157For the TLS server side, use C<accept>, and for the TLS client side of a
158connection, use C<connect> mode.
159
160You can also provide your own TLS connection object, but you have
161to make sure that you call either C<Net::SSLeay::set_connect_state>
162or C<Net::SSLeay::set_accept_state> on it before you pass it to
163AnyEvent::Handle.
164
165See the C<starttls> method if you need to start TLs negotiation later.
166
167=item tls_ctx => $ssl_ctx
168
169Use the given Net::SSLeay::CTX object to create the new TLS connection
170(unless a connection object was specified directly). If this parameter is
171missing, then AnyEvent::Handle will use C<AnyEvent::Handle::TLS_CTX>.
172
173=item json => JSON or JSON::XS object
174
175This is the json coder object used by the C<json> read and write types.
176
177If you don't supply it, then AnyEvent::Handle will create and use a
178suitable one, which will write and expect UTF-8 encoded JSON texts.
179
180Note that you are responsible to depend on the JSON module if you want to
181use this functionality, as AnyEvent does not have a dependency itself.
182
183=item filter_r => $cb
184
185=item filter_w => $cb
186
187These exist, but are undocumented at this time.
188
189=back
190
191=cut
192
193sub new {
194 my $class = shift;
195
196 my $self = bless { @_ }, $class;
197
198 $self->{fh} or Carp::croak "mandatory argument fh is missing";
199
200 AnyEvent::Util::fh_nonblocking $self->{fh}, 1;
201
202 if ($self->{tls}) {
203 require Net::SSLeay;
204 $self->starttls (delete $self->{tls}, delete $self->{tls_ctx});
205 }
206
207 $self->on_eof (delete $self->{on_eof} ) if $self->{on_eof};
208 $self->on_error (delete $self->{on_error}) if $self->{on_error};
209 $self->on_drain (delete $self->{on_drain}) if $self->{on_drain};
210 $self->on_read (delete $self->{on_read} ) if $self->{on_read};
211
212 $self->start_read;
213
214 $self
215}
216
217sub _shutdown {
218 my ($self) = @_;
219
220 delete $self->{_rw};
221 delete $self->{_ww};
222 delete $self->{fh};
223}
224
225sub error {
226 my ($self) = @_;
227
228 {
229 local $!;
230 $self->_shutdown;
231 }
232
233 $self->{on_error}($self)
234 if $self->{on_error};
235
236 Carp::croak "AnyEvent::Handle uncaught fatal error: $!";
237}
238
239=item $fh = $handle->fh
240
241This method returns the file handle of the L<AnyEvent::Handle> object.
242
243=cut
244
245sub fh { $_[0]{fh} }
246
247=item $handle->on_error ($cb)
248
249Replace the current C<on_error> callback (see the C<on_error> constructor argument).
250
251=cut
252
253sub on_error {
254 $_[0]{on_error} = $_[1];
255}
256
257=item $handle->on_eof ($cb)
258
259Replace the current C<on_eof> callback (see the C<on_eof> constructor argument).
260
261=cut
262
263sub on_eof {
264 $_[0]{on_eof} = $_[1];
265}
266
267#############################################################################
268
269=back
270
271=head2 WRITE QUEUE
272
273AnyEvent::Handle manages two queues per handle, one for writing and one
274for reading.
275
276The write queue is very simple: you can add data to its end, and
277AnyEvent::Handle will automatically try to get rid of it for you.
278
279When data could be written and the write buffer is shorter then the low
280water mark, the C<on_drain> callback will be invoked.
281
282=over 4
283
284=item $handle->on_drain ($cb)
285
286Sets the C<on_drain> callback or clears it (see the description of
287C<on_drain> in the constructor).
288
289=cut
290
291sub on_drain {
292 my ($self, $cb) = @_;
293
294 $self->{on_drain} = $cb;
295
296 $cb->($self)
297 if $cb && $self->{low_water_mark} >= length $self->{wbuf};
298}
299
300=item $handle->push_write ($data)
301
302Queues the given scalar to be written. You can push as much data as you
303want (only limited by the available memory), as C<AnyEvent::Handle>
304buffers it independently of the kernel.
305
306=cut
307
308sub _drain_wbuf {
309 my ($self) = @_;
310
311 if (!$self->{_ww} && length $self->{wbuf}) {
312
313 Scalar::Util::weaken $self;
314
315 my $cb = sub {
316 my $len = syswrite $self->{fh}, $self->{wbuf};
317
318 if ($len >= 0) {
319 substr $self->{wbuf}, 0, $len, "";
320
321 $self->{on_drain}($self)
322 if $self->{low_water_mark} >= length $self->{wbuf}
323 && $self->{on_drain};
324
325 delete $self->{_ww} unless length $self->{wbuf};
326 } elsif ($! != EAGAIN && $! != EINTR && $! != WSAEWOULDBLOCK) {
327 $self->error;
328 }
329 };
330
331 # try to write data immediately
332 $cb->();
333
334 # if still data left in wbuf, we need to poll
335 $self->{_ww} = AnyEvent->io (fh => $self->{fh}, poll => "w", cb => $cb)
336 if length $self->{wbuf};
337 };
338}
339
340our %WH;
341
342sub register_write_type($$) {
343 $WH{$_[0]} = $_[1];
344}
345
346sub push_write {
347 my $self = shift;
348
349 if (@_ > 1) {
350 my $type = shift;
351
352 @_ = ($WH{$type} or Carp::croak "unsupported type passed to AnyEvent::Handle::push_write")
353 ->($self, @_);
354 }
355
356 if ($self->{filter_w}) {
357 $self->{filter_w}->($self, \$_[0]);
358 } else {
359 $self->{wbuf} .= $_[0];
360 $self->_drain_wbuf;
361 }
362}
363
364=item $handle->push_write (type => @args)
365
366=item $handle->unshift_write (type => @args)
367
368Instead of formatting your data yourself, you can also let this module do
369the job by specifying a type and type-specific arguments.
370
371Predefined types are (if you have ideas for additional types, feel free to
372drop by and tell us):
373
374=over 4
375
376=item netstring => $string
377
378Formats the given value as netstring
379(http://cr.yp.to/proto/netstrings.txt, this is not a recommendation to use them).
380
381=back
382
383=cut
384
385register_write_type netstring => sub {
386 my ($self, $string) = @_;
387
388 sprintf "%d:%s,", (length $string), $string
389};
390
391=item json => $array_or_hashref
392
393Encodes the given hash or array reference into a JSON object. Unless you
394provide your own JSON object, this means it will be encoded to JSON text
395in UTF-8.
396
397JSON objects (and arrays) are self-delimiting, so you can write JSON at
398one end of a handle and read them at the other end without using any
399additional framing.
400
401The generated JSON text is guaranteed not to contain any newlines: While
402this module doesn't need delimiters after or between JSON texts to be
403able to read them, many other languages depend on that.
404
405A simple RPC protocol that interoperates easily with others is to send
406JSON arrays (or objects, although arrays are usually the better choice as
407they mimic how function argument passing works) and a newline after each
408JSON text:
409
410 $handle->push_write (json => ["method", "arg1", "arg2"]); # whatever
411 $handle->push_write ("\012");
412
413An AnyEvent::Handle receiver would simply use the C<json> read type and
414rely on the fact that the newline will be skipped as leading whitespace:
415
416 $handle->push_read (json => sub { my $array = $_[1]; ... });
417
418Other languages could read single lines terminated by a newline and pass
419this line into their JSON decoder of choice.
420
421=cut
422
423register_write_type json => sub {
424 my ($self, $ref) = @_;
425
426 require JSON;
427
428 $self->{json} ? $self->{json}->encode ($ref)
429 : JSON::encode_json ($ref)
430};
431
432=item AnyEvent::Handle::register_write_type type => $coderef->($handle, @args)
433
434This function (not method) lets you add your own types to C<push_write>.
435Whenever the given C<type> is used, C<push_write> will invoke the code
436reference with the handle object and the remaining arguments.
437
438The code reference is supposed to return a single octet string that will
439be appended to the write buffer.
440
441Note that this is a function, and all types registered this way will be
442global, so try to use unique names.
443
444=cut
445
446#############################################################################
447
448=back
449
450=head2 READ QUEUE
451
452AnyEvent::Handle manages two queues per handle, one for writing and one
453for reading.
454
455The read queue is more complex than the write queue. It can be used in two
456ways, the "simple" way, using only C<on_read> and the "complex" way, using
457a queue.
458
459In the simple case, you just install an C<on_read> callback and whenever
460new data arrives, it will be called. You can then remove some data (if
461enough is there) from the read buffer (C<< $handle->rbuf >>) if you want
462or not.
463
464In the more complex case, you want to queue multiple callbacks. In this
465case, AnyEvent::Handle will call the first queued callback each time new
466data arrives and removes it when it has done its job (see C<push_read>,
467below).
468
469This way you can, for example, push three line-reads, followed by reading
470a chunk of data, and AnyEvent::Handle will execute them in order.
471
472Example 1: EPP protocol parser. EPP sends 4 byte length info, followed by
473the specified number of bytes which give an XML datagram.
474
475 # in the default state, expect some header bytes
476 $handle->on_read (sub {
477 # some data is here, now queue the length-header-read (4 octets)
478 shift->unshift_read_chunk (4, sub {
479 # header arrived, decode
480 my $len = unpack "N", $_[1];
481
482 # now read the payload
483 shift->unshift_read_chunk ($len, sub {
484 my $xml = $_[1];
485 # handle xml
486 });
487 });
488 });
489
490Example 2: Implement a client for a protocol that replies either with
491"OK" and another line or "ERROR" for one request, and 64 bytes for the
492second request. Due tot he availability of a full queue, we can just
493pipeline sending both requests and manipulate the queue as necessary in
494the callbacks:
495
496 # request one
497 $handle->push_write ("request 1\015\012");
498
499 # we expect "ERROR" or "OK" as response, so push a line read
500 $handle->push_read_line (sub {
501 # if we got an "OK", we have to _prepend_ another line,
502 # so it will be read before the second request reads its 64 bytes
503 # which are already in the queue when this callback is called
504 # we don't do this in case we got an error
505 if ($_[1] eq "OK") {
506 $_[0]->unshift_read_line (sub {
507 my $response = $_[1];
508 ...
509 });
510 }
511 });
512
513 # request two
514 $handle->push_write ("request 2\015\012");
515
516 # simply read 64 bytes, always
517 $handle->push_read_chunk (64, sub {
518 my $response = $_[1];
519 ...
520 });
521
522=over 4
523
524=cut
525
526sub _drain_rbuf {
527 my ($self) = @_;
528
529 if (
530 defined $self->{rbuf_max}
531 && $self->{rbuf_max} < length $self->{rbuf}
532 ) {
533 $! = &Errno::ENOSPC;
534 $self->error;
535 }
536
537 return if $self->{in_drain};
538 local $self->{in_drain} = 1;
539
540 while (my $len = length $self->{rbuf}) {
541 no strict 'refs';
542 if (my $cb = shift @{ $self->{_queue} }) {
543 unless ($cb->($self)) {
544 if ($self->{_eof}) {
545 # no progress can be made (not enough data and no data forthcoming)
546 $! = &Errno::EPIPE;
547 $self->error;
54 } 548 }
549
550 unshift @{ $self->{_queue} }, $cb;
551 return;
55 } 552 }
56 );
57
58 $cv->wait;
59
60=head1 DESCRIPTION
61
62This module is a helper module to make it easier to do non-blocking I/O
63on filehandles (and sockets, see L<AnyEvent::Socket>).
64
65The event loop is provided by L<AnyEvent>.
66
67=head1 METHODS
68
69=over 4
70
71=item B<new (%args)>
72
73The constructor has these arguments:
74
75=over 4
76
77=item fh => $filehandle
78
79The filehandle this L<AnyEvent::Handle> object will operate on.
80
81NOTE: The filehandle will be set to non-blocking.
82
83=item read_block_size => $size
84
85The default read block size use for reads via the C<on_read>
86method.
87
88=item on_read => $cb
89
90=item on_eof => $cb
91
92=item on_error => $cb
93
94These are shortcuts, that will call the corresponding method and set the callback to C<$cb>.
95
96=item on_readline => $cb
97
98The C<readlines> method is called with the default seperator and C<$cb> as callback
99for you.
100
101=back
102
103=cut
104
105sub new {
106 my $this = shift;
107 my $class = ref($this) || $this;
108 my $self = {
109 read_block_size => 4096,
110 rbuf => '',
111 @_
112 };
113 bless $self, $class;
114
115 $self->{fh}->blocking (0) if $self->{fh};
116
117 if ($self->{on_read}) {
118 $self->on_read ($self->{on_read});
119
120 } elsif ($self->{on_readline}) { 553 } elsif ($self->{on_read}) {
121 $self->readlines ($self->{on_readline}); 554 $self->{on_read}($self);
122 555
556 if (
557 $self->{_eof} # if no further data will arrive
558 && $len == length $self->{rbuf} # and no data has been consumed
559 && !@{ $self->{_queue} } # and the queue is still empty
560 && $self->{on_read} # and we still want to read data
561 ) {
562 # then no progress can be made
563 $! = &Errno::EPIPE;
564 $self->error;
565 }
566 } else {
567 # read side becomes idle
568 delete $self->{_rw};
569 return;
570 }
571 }
572
123 } elsif ($self->{on_eof}) { 573 if ($self->{_eof}) {
124 $self->on_eof ($self->{on_eof}); 574 $self->_shutdown;
125 575 $self->{on_eof}($self)
126 } elsif ($self->{on_error}) { 576 if $self->{on_eof};
127 $self->on_eof ($self->{on_error});
128 } 577 }
129
130 return $self
131} 578}
132 579
133=item B<fh> 580=item $handle->on_read ($cb)
134 581
135This method returns the filehandle of the L<AnyEvent::Handle> object. 582This replaces the currently set C<on_read> callback, or clears it (when
136 583the new callback is C<undef>). See the description of C<on_read> in the
137=cut 584constructor.
138
139sub fh { $_[0]->{fh} }
140
141=item B<on_read ($callback)>
142
143This method installs a C<$callback> that will be called
144when new data arrived. You can access the read buffer via the C<rbuf>
145method (see below).
146
147The first argument of the C<$callback> will be the L<AnyEvent::Handle> object.
148 585
149=cut 586=cut
150 587
151sub on_read { 588sub on_read {
152 my ($self, $cb) = @_; 589 my ($self, $cb) = @_;
590
153 $self->{on_read} = $cb; 591 $self->{on_read} = $cb;
592}
154 593
155 unless (defined $self->{on_read}) { 594=item $handle->rbuf
156 delete $self->{on_read_w}; 595
157 return; 596Returns the read buffer (as a modifiable lvalue).
597
598You can access the read buffer directly as the C<< ->{rbuf} >> member, if
599you want.
600
601NOTE: The read buffer should only be used or modified if the C<on_read>,
602C<push_read> or C<unshift_read> methods are used. The other read methods
603automatically manage the read buffer.
604
605=cut
606
607sub rbuf : lvalue {
608 $_[0]{rbuf}
609}
610
611=item $handle->push_read ($cb)
612
613=item $handle->unshift_read ($cb)
614
615Append the given callback to the end of the queue (C<push_read>) or
616prepend it (C<unshift_read>).
617
618The callback is called each time some additional read data arrives.
619
620It must check whether enough data is in the read buffer already.
621
622If not enough data is available, it must return the empty list or a false
623value, in which case it will be called repeatedly until enough data is
624available (or an error condition is detected).
625
626If enough data was available, then the callback must remove all data it is
627interested in (which can be none at all) and return a true value. After returning
628true, it will be removed from the queue.
629
630=cut
631
632our %RH;
633
634sub register_read_type($$) {
635 $RH{$_[0]} = $_[1];
636}
637
638sub push_read {
639 my $self = shift;
640 my $cb = pop;
641
642 if (@_) {
643 my $type = shift;
644
645 $cb = ($RH{$type} or Carp::croak "unsupported type passed to AnyEvent::Handle::push_read")
646 ->($self, $cb, @_);
647 }
648
649 push @{ $self->{_queue} }, $cb;
650 $self->_drain_rbuf;
651}
652
653sub unshift_read {
654 my $self = shift;
655 my $cb = pop;
656
657 if (@_) {
658 my $type = shift;
659
660 $cb = ($RH{$type} or Carp::croak "unsupported type passed to AnyEvent::Handle::unshift_read")
661 ->($self, $cb, @_);
662 }
663
664
665 unshift @{ $self->{_queue} }, $cb;
666 $self->_drain_rbuf;
667}
668
669=item $handle->push_read (type => @args, $cb)
670
671=item $handle->unshift_read (type => @args, $cb)
672
673Instead of providing a callback that parses the data itself you can chose
674between a number of predefined parsing formats, for chunks of data, lines
675etc.
676
677Predefined types are (if you have ideas for additional types, feel free to
678drop by and tell us):
679
680=over 4
681
682=item chunk => $octets, $cb->($handle, $data)
683
684Invoke the callback only once C<$octets> bytes have been read. Pass the
685data read to the callback. The callback will never be called with less
686data.
687
688Example: read 2 bytes.
689
690 $handle->push_read (chunk => 2, sub {
691 warn "yay ", unpack "H*", $_[1];
158 } 692 });
159 693
160 $self->{on_read_w} = 694=cut
161 AnyEvent->io (poll => 'r', fh => $self->{fh}, cb => sub { 695
162 #d# warn "READ:[$self->{read_size}] $self->{read_block_size} : ".length ($self->{rbuf})."\n"; 696register_read_type chunk => sub {
163 my $rbuf_len = length $self->{rbuf}; 697 my ($self, $cb, $len) = @_;
164 my $l; 698
165 if (defined $self->{read_size}) { 699 sub {
166 $l = sysread $self->{fh}, $self->{rbuf}, 700 $len <= length $_[0]{rbuf} or return;
167 ($self->{read_size} - $rbuf_len), $rbuf_len; 701 $cb->($_[0], substr $_[0]{rbuf}, 0, $len, "");
168 } else { 702 1
169 $l = sysread $self->{fh}, $self->{rbuf}, $self->{read_block_size}, $rbuf_len; 703 }
704};
705
706# compatibility with older API
707sub push_read_chunk {
708 $_[0]->push_read (chunk => $_[1], $_[2]);
709}
710
711sub unshift_read_chunk {
712 $_[0]->unshift_read (chunk => $_[1], $_[2]);
713}
714
715=item line => [$eol, ]$cb->($handle, $line, $eol)
716
717The callback will be called only once a full line (including the end of
718line marker, C<$eol>) has been read. This line (excluding the end of line
719marker) will be passed to the callback as second argument (C<$line>), and
720the end of line marker as the third argument (C<$eol>).
721
722The end of line marker, C<$eol>, can be either a string, in which case it
723will be interpreted as a fixed record end marker, or it can be a regex
724object (e.g. created by C<qr>), in which case it is interpreted as a
725regular expression.
726
727The end of line marker argument C<$eol> is optional, if it is missing (NOT
728undef), then C<qr|\015?\012|> is used (which is good for most internet
729protocols).
730
731Partial lines at the end of the stream will never be returned, as they are
732not marked by the end of line marker.
733
734=cut
735
736register_read_type line => sub {
737 my ($self, $cb, $eol) = @_;
738
739 $eol = qr|(\015?\012)| if @_ < 3;
740 $eol = quotemeta $eol unless ref $eol;
741 $eol = qr|^(.*?)($eol)|s;
742
743 sub {
744 $_[0]{rbuf} =~ s/$eol// or return;
745
746 $cb->($_[0], $1, $2);
747 1
748 }
749};
750
751# compatibility with older API
752sub push_read_line {
753 my $self = shift;
754 $self->push_read (line => @_);
755}
756
757sub unshift_read_line {
758 my $self = shift;
759 $self->unshift_read (line => @_);
760}
761
762=item netstring => $cb->($handle, $string)
763
764A netstring (http://cr.yp.to/proto/netstrings.txt, this is not an endorsement).
765
766Throws an error with C<$!> set to EBADMSG on format violations.
767
768=cut
769
770register_read_type netstring => sub {
771 my ($self, $cb) = @_;
772
773 sub {
774 unless ($_[0]{rbuf} =~ s/^(0|[1-9][0-9]*)://) {
775 if ($_[0]{rbuf} =~ /[^0-9]/) {
776 $! = &Errno::EBADMSG;
777 $self->error;
170 } 778 }
171 #d# warn "READL $l [$self->{rbuf}]\n"; 779 return;
780 }
172 781
173 if (not defined $l) { 782 my $len = $1;
174 return if $! == EAGAIN || $! == EINTR;
175 $self->{on_error}->($self) if $self->{on_error};
176 delete $self->{on_read_w};
177 783
178 } elsif ($l == 0) { 784 $self->unshift_read (chunk => $len, sub {
179 $self->{on_eof}->($self) if $self->{on_eof}; 785 my $string = $_[1];
180 delete $self->{on_read_w}; 786 $_[0]->unshift_read (chunk => 1, sub {
181 787 if ($_[1] eq ",") {
788 $cb->($_[0], $string);
182 } else { 789 } else {
183 $self->{on_read}->($self); 790 $! = &Errno::EBADMSG;
791 $self->error;
792 }
793 });
794 });
795
796 1
797 }
798};
799
800=item regex => $accept[, $reject[, $skip], $cb->($handle, $data)
801
802Makes a regex match against the regex object C<$accept> and returns
803everything up to and including the match.
804
805Example: read a single line terminated by '\n'.
806
807 $handle->push_read (regex => qr<\n>, sub { ... });
808
809If C<$reject> is given and not undef, then it determines when the data is
810to be rejected: it is matched against the data when the C<$accept> regex
811does not match and generates an C<EBADMSG> error when it matches. This is
812useful to quickly reject wrong data (to avoid waiting for a timeout or a
813receive buffer overflow).
814
815Example: expect a single decimal number followed by whitespace, reject
816anything else (not the use of an anchor).
817
818 $handle->push_read (regex => qr<^[0-9]+\s>, qr<[^0-9]>, sub { ... });
819
820If C<$skip> is given and not C<undef>, then it will be matched against
821the receive buffer when neither C<$accept> nor C<$reject> match,
822and everything preceding and including the match will be accepted
823unconditionally. This is useful to skip large amounts of data that you
824know cannot be matched, so that the C<$accept> or C<$reject> regex do not
825have to start matching from the beginning. This is purely an optimisation
826and is usually worth only when you expect more than a few kilobytes.
827
828Example: expect a http header, which ends at C<\015\012\015\012>. Since we
829expect the header to be very large (it isn't in practise, but...), we use
830a skip regex to skip initial portions. The skip regex is tricky in that
831it only accepts something not ending in either \015 or \012, as these are
832required for the accept regex.
833
834 $handle->push_read (regex =>
835 qr<\015\012\015\012>,
836 undef, # no reject
837 qr<^.*[^\015\012]>,
838 sub { ... });
839
840=cut
841
842register_read_type regex => sub {
843 my ($self, $cb, $accept, $reject, $skip) = @_;
844
845 my $data;
846 my $rbuf = \$self->{rbuf};
847
848 sub {
849 # accept
850 if ($$rbuf =~ $accept) {
851 $data .= substr $$rbuf, 0, $+[0], "";
852 $cb->($self, $data);
853 return 1;
854 }
855
856 # reject
857 if ($reject && $$rbuf =~ $reject) {
858 $! = &Errno::EBADMSG;
859 $self->error;
860 }
861
862 # skip
863 if ($skip && $$rbuf =~ $skip) {
864 $data .= substr $$rbuf, 0, $+[0], "";
865 }
866
867 ()
868 }
869};
870
871=item json => $cb->($handle, $hash_or_arrayref)
872
873Reads a JSON object or array, decodes it and passes it to the callback.
874
875If a C<json> object was passed to the constructor, then that will be used
876for the final decode, otherwise it will create a JSON coder expecting UTF-8.
877
878This read type uses the incremental parser available with JSON version
8792.09 (and JSON::XS version 2.2) and above. You have to provide a
880dependency on your own: this module will load the JSON module, but
881AnyEvent does not depend on it itself.
882
883Since JSON texts are fully self-delimiting, the C<json> read and write
884types are an ideal simple RPC protocol: just exchange JSON datagrams. See
885the C<json> write type description, above, for an actual example.
886
887=cut
888
889register_read_type json => sub {
890 my ($self, $cb, $accept, $reject, $skip) = @_;
891
892 require JSON;
893
894 my $data;
895 my $rbuf = \$self->{rbuf};
896
897 my $json = $self->{json} ||= JSON->new->utf8;
898
899 sub {
900 my $ref = $json->incr_parse ($self->{rbuf});
901
902 if ($ref) {
903 $self->{rbuf} = $json->incr_text;
904 $json->incr_text = "";
905 $cb->($self, $ref);
906
907 1
908 } else {
909 $self->{rbuf} = "";
910 ()
911 }
912 }
913};
914
915=back
916
917=item AnyEvent::Handle::register_read_type type => $coderef->($handle, $cb, @args)
918
919This function (not method) lets you add your own types to C<push_read>.
920
921Whenever the given C<type> is used, C<push_read> will invoke the code
922reference with the handle object, the callback and the remaining
923arguments.
924
925The code reference is supposed to return a callback (usually a closure)
926that works as a plain read callback (see C<< ->push_read ($cb) >>).
927
928It should invoke the passed callback when it is done reading (remember to
929pass C<$handle> as first argument as all other callbacks do that).
930
931Note that this is a function, and all types registered this way will be
932global, so try to use unique names.
933
934For examples, see the source of this module (F<perldoc -m AnyEvent::Handle>,
935search for C<register_read_type>)).
936
937=item $handle->stop_read
938
939=item $handle->start_read
940
941In rare cases you actually do not want to read anything from the
942socket. In this case you can call C<stop_read>. Neither C<on_read> no
943any queued callbacks will be executed then. To start reading again, call
944C<start_read>.
945
946=cut
947
948sub stop_read {
949 my ($self) = @_;
950
951 delete $self->{_rw};
952}
953
954sub start_read {
955 my ($self) = @_;
956
957 unless ($self->{_rw} || $self->{_eof}) {
958 Scalar::Util::weaken $self;
959
960 $self->{_rw} = AnyEvent->io (fh => $self->{fh}, poll => "r", cb => sub {
961 my $rbuf = $self->{filter_r} ? \my $buf : \$self->{rbuf};
962 my $len = sysread $self->{fh}, $$rbuf, $self->{read_size} || 8192, length $$rbuf;
963
964 if ($len > 0) {
965 $self->{filter_r}
966 ? $self->{filter_r}->($self, $rbuf)
967 : $self->_drain_rbuf;
968
969 } elsif (defined $len) {
970 delete $self->{_rw};
971 $self->{_eof} = 1;
972 $self->_drain_rbuf;
973
974 } elsif ($! != EAGAIN && $! != EINTR && $! != WSAEWOULDBLOCK) {
975 return $self->error;
184 } 976 }
185 }); 977 });
978 }
186} 979}
187 980
188=item B<on_error ($callback)> 981sub _dotls {
189
190Whenever a read or write operation resulted in an error the C<$callback>
191will be called.
192
193The first argument of C<$callback> will be the L<AnyEvent::Handle> object itself.
194The error is given as errno in C<$!>.
195
196=cut
197
198sub on_error {
199 $_[0]->{on_error} = $_[1];
200}
201
202=item B<on_eof ($callback)>
203
204Installs the C<$callback> that will be called when the end of file is
205encountered in a read operation this C<$callback> will be called. The first
206argument will be the L<AnyEvent::Handle> object itself.
207
208=cut
209
210sub on_eof {
211 $_[0]->{on_eof} = $_[1];
212}
213
214=item B<rbuf>
215
216Returns a reference to the read buffer.
217
218NOTE: The read buffer should only be used or modified if the C<on_read>
219method is used directly. The C<read> and C<readlines> methods will provide
220the read data to their callbacks.
221
222=cut
223
224sub rbuf : lvalue {
225 $_[0]->{rbuf}
226}
227
228=item B<read ($len, $callback)>
229
230Will read exactly C<$len> bytes from the filehandle and call the C<$callback>
231if done so. The first argument to the C<$callback> will be the L<AnyEvent::Handle>
232object itself and the second argument the read data.
233
234NOTE: This method will override any callbacks installed via the C<on_read> method.
235
236=cut
237
238sub read {
239 my ($self, $len, $cb) = @_; 982 my ($self) = @_;
240 983
241 $self->{read_cb} = $cb; 984 if (length $self->{_tls_wbuf}) {
242 my $old_blk_size = $self->{read_block_size}; 985 while ((my $len = Net::SSLeay::write ($self->{tls}, $self->{_tls_wbuf})) > 0) {
243 $self->{read_block_size} = $len; 986 substr $self->{_tls_wbuf}, 0, $len, "";
244
245 $self->on_read (sub {
246 #d# warn "OFOFO $len || ".length($_[0]->{rbuf})."||\n";
247
248 if ($len == length $_[0]->{rbuf}) {
249 $_[0]->{read_block_size} = $old_blk_size;
250 $_[0]->on_read (undef);
251 $_[0]->{read_cb}->($_[0], (substr $self->{rbuf}, 0, $len, ''));
252 } 987 }
253 }); 988 }
254}
255 989
256=item B<readlines ($callback)> 990 if (defined (my $buf = Net::SSLeay::BIO_read ($self->{_wbio}))) {
257 991 $self->{wbuf} .= $buf;
258=item B<readlines ($sep, $callback)> 992 $self->_drain_wbuf;
259
260This method will read lines from the filehandle, seperated by C<$sep> or C<"\n">
261if C<$sep> is not provided. C<$sep> will be used as "line" seperator.
262
263The C<$callback> will be called when at least one
264line could be read. The first argument to the C<$callback> will be the L<AnyEvent::Handle>
265object itself and the rest of the arguments will be the read lines.
266
267NOTE: This method will override any callbacks installed via the C<on_read> method.
268
269=cut
270
271sub readlines {
272 my ($self, $sep, $cb) = @_;
273
274 if (ref $sep) {
275 $cb = $sep;
276 $sep = "\n";
277
278 } elsif (not defined $sep) {
279 $sep = "\n";
280 } 993 }
281 994
282 my $sep_len = length $sep; 995 while (defined (my $buf = Net::SSLeay::read ($self->{tls}))) {
996 $self->{rbuf} .= $buf;
997 $self->_drain_rbuf;
998 }
283 999
284 $self->{on_readline} = $cb; 1000 my $err = Net::SSLeay::get_error ($self->{tls}, -1);
285 1001
286 $self->on_read (sub { 1002 if ($err!= Net::SSLeay::ERROR_WANT_READ ()) {
287 my @lines; 1003 if ($err == Net::SSLeay::ERROR_SYSCALL ()) {
288 my $rb = \$_[0]->{rbuf}; 1004 $self->error;
289 my $pos; 1005 } elsif ($err == Net::SSLeay::ERROR_SSL ()) {
290 while (($pos = index ($$rb, $sep)) >= 0) { 1006 $! = &Errno::EIO;
291 push @lines, substr $$rb, 0, $pos + $sep_len, ''; 1007 $self->error;
292 } 1008 }
293 $self->{on_readline}->($_[0], @lines); 1009
1010 # all others are fine for our purposes
1011 }
1012}
1013
1014=item $handle->starttls ($tls[, $tls_ctx])
1015
1016Instead of starting TLS negotiation immediately when the AnyEvent::Handle
1017object is created, you can also do that at a later time by calling
1018C<starttls>.
1019
1020The first argument is the same as the C<tls> constructor argument (either
1021C<"connect">, C<"accept"> or an existing Net::SSLeay object).
1022
1023The second argument is the optional C<Net::SSLeay::CTX> object that is
1024used when AnyEvent::Handle has to create its own TLS connection object.
1025
1026The TLS connection object will end up in C<< $handle->{tls} >> after this
1027call and can be used or changed to your liking. Note that the handshake
1028might have already started when this function returns.
1029
1030=cut
1031
1032# TODO: maybe document...
1033sub starttls {
1034 my ($self, $ssl, $ctx) = @_;
1035
1036 $self->stoptls;
1037
1038 if ($ssl eq "accept") {
1039 $ssl = Net::SSLeay::new ($ctx || TLS_CTX ());
1040 Net::SSLeay::set_accept_state ($ssl);
1041 } elsif ($ssl eq "connect") {
1042 $ssl = Net::SSLeay::new ($ctx || TLS_CTX ());
1043 Net::SSLeay::set_connect_state ($ssl);
1044 }
1045
1046 $self->{tls} = $ssl;
1047
1048 # basically, this is deep magic (because SSL_read should have the same issues)
1049 # but the openssl maintainers basically said: "trust us, it just works".
1050 # (unfortunately, we have to hardcode constants because the abysmally misdesigned
1051 # and mismaintained ssleay-module doesn't even offer them).
1052 # http://www.mail-archive.com/openssl-dev@openssl.org/msg22420.html
1053 Net::SSLeay::CTX_set_mode ($self->{tls},
1054 (eval { local $SIG{__DIE__}; Net::SSLeay::MODE_ENABLE_PARTIAL_WRITE () } || 1)
1055 | (eval { local $SIG{__DIE__}; Net::SSLeay::MODE_ACCEPT_MOVING_WRITE_BUFFER () } || 2));
1056
1057 $self->{_rbio} = Net::SSLeay::BIO_new (Net::SSLeay::BIO_s_mem ());
1058 $self->{_wbio} = Net::SSLeay::BIO_new (Net::SSLeay::BIO_s_mem ());
1059
1060 Net::SSLeay::set_bio ($ssl, $self->{_rbio}, $self->{_wbio});
1061
1062 $self->{filter_w} = sub {
1063 $_[0]{_tls_wbuf} .= ${$_[1]};
1064 &_dotls;
294 }); 1065 };
1066 $self->{filter_r} = sub {
1067 Net::SSLeay::BIO_write ($_[0]{_rbio}, ${$_[1]});
1068 &_dotls;
1069 };
295} 1070}
296 1071
297=item B<write ($data)> 1072=item $handle->stoptls
298 1073
299=item B<write ($callback)> 1074Destroys the SSL connection, if any. Partial read or write data will be
1075lost.
300 1076
301=item B<write ($data, $callback)>
302
303This method will write C<$data> to the filehandle and call the C<$callback>
304afterwards. If only C<$callback> is provided it will be called when the
305write buffer becomes empty the next time (or immediately if it already is empty).
306
307=cut 1077=cut
308 1078
309sub write { 1079sub stoptls {
310 my ($self, $data, $cb) = @_;
311 if (ref $data) { $cb = $data; undef $data }
312 push @{$self->{write_bufs}}, [$data, $cb];
313 $self->_check_writer;
314}
315
316sub _check_writer {
317 my ($self) = @_; 1080 my ($self) = @_;
318 1081
319 if ($self->{write_w}) { 1082 Net::SSLeay::free (delete $self->{tls}) if $self->{tls};
320 unless ($self->{write_cb}) {
321 while (@{$self->{write_bufs}} && not defined $self->{write_bufs}->[0]->[1]) {
322 my $wba = shift @{$self->{write_bufs}};
323 $self->{wbuf} .= $wba->[0];
324 }
325 }
326 return;
327 }
328 1083
329 my $wba = shift @{$self->{write_bufs}} 1084 delete $self->{_rbio};
330 or return; 1085 delete $self->{_wbio};
331 1086 delete $self->{_tls_wbuf};
332 unless (defined $wba->[0]) { 1087 delete $self->{filter_r};
333 $wba->[1]->($self) if $wba->[1];
334 $self->_check_writer;
335 return;
336 }
337
338 $self->{wbuf} = $wba->[0];
339 $self->{write_cb} = $wba->[1];
340
341 $self->{write_w} =
342 AnyEvent->io (poll => 'w', fh => $self->{fh}, cb => sub {
343 my $l = syswrite $self->{fh}, $self->{wbuf}, length $self->{wbuf};
344
345 if (not defined $l) {
346 return if $! == EAGAIN || $! == EINTR;
347 delete $self->{write_w}; 1088 delete $self->{filter_w};
348 $self->{on_error}->($self) if $self->{on_error}; 1089}
349 1090
350 } else { 1091sub DESTROY {
351 substr $self->{wbuf}, 0, $l, ''; 1092 my $self = shift;
352 1093
353 if (length ($self->{wbuf}) == 0) { 1094 $self->stoptls;
354 $self->{write_cb}->($self) if $self->{write_cb}; 1095}
355 1096
356 delete $self->{write_w}; 1097=item AnyEvent::Handle::TLS_CTX
357 delete $self->{wbuf};
358 delete $self->{write_cb};
359 1098
360 $self->_check_writer; 1099This function creates and returns the Net::SSLeay::CTX object used by
361 } 1100default for TLS mode.
362 } 1101
363 }); 1102The context is created like this:
1103
1104 Net::SSLeay::load_error_strings;
1105 Net::SSLeay::SSLeay_add_ssl_algorithms;
1106 Net::SSLeay::randomize;
1107
1108 my $CTX = Net::SSLeay::CTX_new;
1109
1110 Net::SSLeay::CTX_set_options $CTX, Net::SSLeay::OP_ALL
1111
1112=cut
1113
1114our $TLS_CTX;
1115
1116sub TLS_CTX() {
1117 $TLS_CTX || do {
1118 require Net::SSLeay;
1119
1120 Net::SSLeay::load_error_strings ();
1121 Net::SSLeay::SSLeay_add_ssl_algorithms ();
1122 Net::SSLeay::randomize ();
1123
1124 $TLS_CTX = Net::SSLeay::CTX_new ();
1125
1126 Net::SSLeay::CTX_set_options ($TLS_CTX, Net::SSLeay::OP_ALL ());
1127
1128 $TLS_CTX
1129 }
364} 1130}
365 1131
366=back 1132=back
367 1133
1134=head1 SUBCLASSING AnyEvent::Handle
1135
1136In many cases, you might want to subclass AnyEvent::Handle.
1137
1138To make this easier, a given version of AnyEvent::Handle uses these
1139conventions:
1140
1141=over 4
1142
1143=item * all constructor arguments become object members.
1144
1145At least initially, when you pass a C<tls>-argument to the constructor it
1146will end up in C<< $handle->{tls} >>. Those members might be changes or
1147mutated later on (for example C<tls> will hold the TLS connection object).
1148
1149=item * other object member names are prefixed with an C<_>.
1150
1151All object members not explicitly documented (internal use) are prefixed
1152with an underscore character, so the remaining non-C<_>-namespace is free
1153for use for subclasses.
1154
1155=item * all members not documented here and not prefixed with an underscore
1156are free to use in subclasses.
1157
1158Of course, new versions of AnyEvent::Handle may introduce more "public"
1159member variables, but thats just life, at least it is documented.
1160
1161=back
1162
368=head1 AUTHOR 1163=head1 AUTHOR
369 1164
370Robin Redeker, C<< <elmex at ta-sa.org> >> 1165Robin Redeker C<< <elmex at ta-sa.org> >>, Marc Lehmann <schmorp@schmorp.de>.
371 1166
372=cut 1167=cut
373 1168
3741; # End of AnyEvent::Handle 11691; # End of AnyEvent::Handle

Diff Legend

Removed lines
+ Added lines
< Changed lines
> Changed lines