… | |
… | |
3 | use Coro::Event; |
3 | use Coro::Event; |
4 | use Coro::Socket; |
4 | use Coro::Socket; |
5 | use Coro::Signal; |
5 | use Coro::Signal; |
6 | |
6 | |
7 | use HTTP::Date; |
7 | use HTTP::Date; |
|
|
8 | use POSIX (); |
8 | |
9 | |
9 | no utf8; |
10 | no utf8; |
10 | use bytes; |
11 | use bytes; |
11 | |
12 | |
12 | # at least on my machine, this thingy serves files |
13 | # at least on my machine, this thingy serves files |
… | |
… | |
14 | # and quite a bit slower than thttpd :( |
15 | # and quite a bit slower than thttpd :( |
15 | |
16 | |
16 | $SIG{PIPE} = 'IGNORE'; |
17 | $SIG{PIPE} = 'IGNORE'; |
17 | |
18 | |
18 | our $accesslog; |
19 | our $accesslog; |
|
|
20 | our $errorlog; |
|
|
21 | |
|
|
22 | our $NOW; |
|
|
23 | our $HTTP_NOW; |
|
|
24 | |
|
|
25 | Event->timer(interval => 1, hard => 1, cb => sub { |
|
|
26 | $NOW = time; |
|
|
27 | $HTTP_NOW = time2str $NOW; |
|
|
28 | })->now; |
|
|
29 | |
|
|
30 | if ($ERROR_LOG) { |
|
|
31 | use IO::Handle; |
|
|
32 | open $errorlog, ">>$ERROR_LOG" |
|
|
33 | or die "$ERROR_LOG: $!"; |
|
|
34 | $errorlog->autoflush(1); |
|
|
35 | } |
19 | |
36 | |
20 | if ($ACCESS_LOG) { |
37 | if ($ACCESS_LOG) { |
21 | use IO::Handle; |
38 | use IO::Handle; |
22 | open $accesslog, ">>$ACCESS_LOG" |
39 | open $accesslog, ">>$ACCESS_LOG" |
23 | or die "$ACCESS_LOG: $!"; |
40 | or die "$ACCESS_LOG: $!"; |
… | |
… | |
25 | } |
42 | } |
26 | |
43 | |
27 | sub slog { |
44 | sub slog { |
28 | my $level = shift; |
45 | my $level = shift; |
29 | my $format = shift; |
46 | my $format = shift; |
|
|
47 | my $NOW = (POSIX::strftime "%Y-%m-%d %H:%M:%S", gmtime $::NOW); |
30 | printf "---: $format\n", @_; |
48 | printf "$NOW: $format\n", @_; |
|
|
49 | printf $errorlog "$NOW: $format\n", @_ if $errorlog; |
31 | } |
50 | } |
32 | |
51 | |
33 | our $connections = new Coro::Semaphore $MAX_CONNECTS || 250; |
52 | our $connections = new Coro::Semaphore $MAX_CONNECTS || 250; |
34 | our $httpevent = new Coro::Signal; |
53 | our $httpevent = new Coro::Signal; |
35 | |
54 | |
36 | our $wait_factor = 0.95; |
55 | our $queue_file = new transferqueue $MAX_TRANSFERS; |
37 | |
56 | our $queue_index = new transferqueue 10; |
38 | our @transfers = ( |
|
|
39 | [(new Coro::Semaphore $MAX_TRANSFERS_SMALL || 50), 1], |
|
|
40 | [(new Coro::Semaphore $MAX_TRANSFERS_LARGE || 50), 1], |
|
|
41 | ); |
|
|
42 | |
57 | |
43 | my @newcons; |
58 | my @newcons; |
44 | my @pool; |
59 | my @pool; |
45 | |
60 | |
46 | # one "execution thread" |
61 | # one "execution thread" |
… | |
… | |
49 | if (@newcons) { |
64 | if (@newcons) { |
50 | eval { |
65 | eval { |
51 | conn->new(@{pop @newcons})->handle; |
66 | conn->new(@{pop @newcons})->handle; |
52 | }; |
67 | }; |
53 | slog 1, "$@" if $@ && !ref $@; |
68 | slog 1, "$@" if $@ && !ref $@; |
|
|
69 | |
|
|
70 | $httpevent->broadcast; # only for testing, but doesn't matter much |
|
|
71 | |
54 | $connections->up; |
72 | $connections->up; |
55 | } else { |
73 | } else { |
56 | last if @pool >= $MAX_POOL; |
74 | last if @pool >= $MAX_POOL; |
57 | push @pool, $Coro::current; |
75 | push @pool, $Coro::current; |
58 | schedule; |
76 | schedule; |
… | |
… | |
100 | or die "unable to start server"; |
118 | or die "unable to start server"; |
101 | |
119 | |
102 | listen_on $http_port; |
120 | listen_on $http_port; |
103 | } |
121 | } |
104 | |
122 | |
105 | our $NOW; |
|
|
106 | our $HTTP_NOW; |
|
|
107 | |
|
|
108 | Event->timer(interval => 1, hard => 1, cb => sub { |
|
|
109 | $NOW = time; |
|
|
110 | $HTTP_NOW = time2str $NOW; |
|
|
111 | })->now; |
|
|
112 | |
|
|
113 | package conn; |
123 | package conn; |
114 | |
124 | |
115 | use Socket; |
125 | use Socket; |
116 | use HTTP::Date; |
126 | use HTTP::Date; |
117 | use Convert::Scalar 'weaken'; |
127 | use Convert::Scalar 'weaken'; |
… | |
… | |
149 | my $peername = shift; |
159 | my $peername = shift; |
150 | my $self = bless { fh => $fh }, $class; |
160 | my $self = bless { fh => $fh }, $class; |
151 | my (undef, $iaddr) = unpack_sockaddr_in $peername |
161 | my (undef, $iaddr) = unpack_sockaddr_in $peername |
152 | or $self->err(500, "unable to decode peername"); |
162 | or $self->err(500, "unable to decode peername"); |
153 | |
163 | |
|
|
164 | $self->{remote_addr} = |
154 | $self->{remote_addr} = inet_ntoa $iaddr; |
165 | $self->{remote_id} = inet_ntoa $iaddr; |
155 | $self->{time} = $::NOW; |
166 | $self->{time} = $::NOW; |
156 | |
167 | |
|
|
168 | weaken ($Coro::current->{conn} = $self); |
|
|
169 | |
157 | $::conns++; |
170 | $::conns++; |
|
|
171 | $::maxconns = $::conns if $::conns > $::maxconns; |
158 | |
172 | |
159 | $self; |
173 | $self; |
160 | } |
174 | } |
161 | |
175 | |
162 | sub DESTROY { |
176 | sub DESTROY { |
163 | my $self = shift; |
177 | #my $self = shift; |
164 | $::conns--; |
178 | $::conns--; |
165 | $self->eoconn; |
|
|
166 | } |
|
|
167 | |
|
|
168 | # end of connection |
|
|
169 | sub eoconn { |
|
|
170 | my $self = shift; |
|
|
171 | |
|
|
172 | # clean up hints |
|
|
173 | delete $conn{$self->{remote_id}}{$self*1}; |
|
|
174 | delete $uri{$self->{remote_id}}{$self->{uri}}{$self*1}; |
|
|
175 | |
|
|
176 | $httpevent->broadcast; |
|
|
177 | } |
179 | } |
178 | |
180 | |
179 | sub slog { |
181 | sub slog { |
180 | my $self = shift; |
182 | my $self = shift; |
181 | main::slog($_[0], ($self->{remote_id} || $self->{remote_addr}) ."> $_[1]"); |
183 | main::slog($_[0], "$self->{remote_id}> $_[1]"); |
182 | } |
184 | } |
183 | |
185 | |
184 | sub response { |
186 | sub response { |
185 | my ($self, $code, $msg, $hdr, $content) = @_; |
187 | my ($self, $code, $msg, $hdr, $content) = @_; |
186 | my $res = "HTTP/1.1 $code $msg\015\012"; |
188 | my $res = "HTTP/1.1 $code $msg\015\012"; |
… | |
… | |
206 | } |
208 | } |
207 | $res .= "\015\012"; |
209 | $res .= "\015\012"; |
208 | |
210 | |
209 | $res .= $content if defined $content and $self->{method} ne "HEAD"; |
211 | $res .= $content if defined $content and $self->{method} ne "HEAD"; |
210 | |
212 | |
211 | my $log = "$self->{remote_addr} \"$self->{uri}\" $code ".$hdr->{"Content-Length"}." \"$self->{h}{referer}\"\n"; |
213 | my $log = (POSIX::strftime "%Y-%m-%d %H:%M:%S", gmtime $NOW). |
|
|
214 | " $self->{remote_id} \"$self->{uri}\" $code ".$hdr->{"Content-Length"}. |
|
|
215 | " \"$self->{h}{referer}\"\n"; |
212 | |
216 | |
213 | print $accesslog $log if $accesslog; |
217 | print $accesslog $log if $accesslog; |
214 | print STDERR $log; |
218 | print STDERR $log; |
215 | |
219 | |
216 | $self->{written} += |
220 | $self->{written} += |
… | |
… | |
300 | $id .= "[".$self->{h}{"x-forwarded-for"}."]"; |
304 | $id .= "[".$self->{h}{"x-forwarded-for"}."]"; |
301 | } |
305 | } |
302 | |
306 | |
303 | $self->{remote_id} = $id; |
307 | $self->{remote_id} = $id; |
304 | |
308 | |
|
|
309 | weaken (local $conn{$id}{$self*1} = $self); |
|
|
310 | |
305 | if ($blocked{$id}) { |
311 | if ($blocked{$id}) { |
306 | $self->err_blocked($blocked{$id}) |
312 | $self->err_blocked |
307 | if $blocked{$id} > $::NOW; |
313 | if $blocked{$id}[0] > $::NOW; |
308 | |
314 | |
309 | delete $blocked{$id}; |
315 | delete $blocked{$id}; |
310 | } |
|
|
311 | |
|
|
312 | if (%{$conn{$id}} >= $::MAX_CONN_IP) { |
|
|
313 | my $delay = $::PER_TIMEOUT + $::NOW + 15; |
|
|
314 | while (%{$conn{$id}} >= $::MAX_CONN_IP) { |
|
|
315 | if ($delay < $::NOW) { |
|
|
316 | $self->slog(2, "blocked ip $id"); |
|
|
317 | $self->err_blocked; |
|
|
318 | } else { |
|
|
319 | $httpevent->wait; |
|
|
320 | } |
|
|
321 | } |
|
|
322 | } |
316 | } |
323 | |
317 | |
324 | # find out server name and port |
318 | # find out server name and port |
325 | if ($self->{uri} =~ s/^http:\/\/([^\/?#]*)//i) { |
319 | if ($self->{uri} =~ s/^http:\/\/([^\/?#]*)//i) { |
326 | $host = $1; |
320 | $host = $1; |
… | |
… | |
337 | $host = inet_ntoa $host; |
331 | $host = inet_ntoa $host; |
338 | } |
332 | } |
339 | |
333 | |
340 | $self->{server_name} = $host; |
334 | $self->{server_name} = $host; |
341 | |
335 | |
342 | # enter ourselves into various lists |
|
|
343 | weaken ($conn{$id}{$self*1} = $self); |
|
|
344 | weaken ($uri{$id}{$self->{uri}}{$self*1} = $self); |
336 | weaken (local $uri{$id}{$self->{uri}}{$self*1} = $self); |
345 | |
337 | |
346 | eval { |
338 | eval { |
347 | $self->map_uri; |
339 | $self->map_uri; |
348 | $self->respond; |
340 | $self->respond; |
349 | }; |
341 | }; |
350 | |
342 | |
351 | $self->eoconn; |
|
|
352 | |
|
|
353 | die if $@ && !ref $@; |
343 | die if $@ && !ref $@; |
354 | |
344 | |
355 | last if $self->{h}{connection} =~ /close/; |
345 | last if $self->{h}{connection} =~ /close/i; |
356 | |
346 | |
357 | $httpevent->broadcast; |
347 | $httpevent->broadcast; |
358 | |
348 | |
359 | $fh->timeout($::PER_TIMEOUT); |
349 | $fh->timeout($::PER_TIMEOUT); |
360 | } |
350 | } |
|
|
351 | } |
|
|
352 | |
|
|
353 | sub block { |
|
|
354 | my $self = shift; |
|
|
355 | |
|
|
356 | $blocked{$self->{remote_id}} = [$::NOW + $_[0], $_[1]]; |
|
|
357 | $self->slog(2, "blocked ip $self->{remote_id}"); |
|
|
358 | $self->err_blocked; |
361 | } |
359 | } |
362 | |
360 | |
363 | # uri => path mapping |
361 | # uri => path mapping |
364 | sub map_uri { |
362 | sub map_uri { |
365 | my $self = shift; |
363 | my $self = shift; |
… | |
… | |
412 | |
410 | |
413 | sub respond { |
411 | sub respond { |
414 | my $self = shift; |
412 | my $self = shift; |
415 | my $path = $self->{path}; |
413 | my $path = $self->{path}; |
416 | |
414 | |
417 | stat $path |
415 | if ($self->{name} =~ s%^/internal/([^/]+)%%) { |
418 | or $self->err(404, "not found"); |
416 | if ($::internal{$1}) { |
419 | |
417 | $::internal{$1}->($self); |
420 | $self->{stat} = [stat _]; |
|
|
421 | |
|
|
422 | # idiotic netscape sends idiotic headers AGAIN |
|
|
423 | my $ims = $self->{h}{"if-modified-since"} =~ /^([^;]+)/ |
|
|
424 | ? str2time $1 : 0; |
|
|
425 | |
|
|
426 | if (-d _ && -r _) { |
|
|
427 | # directory |
|
|
428 | if ($path !~ /\/$/) { |
|
|
429 | # create a redirect to get the trailing "/" |
|
|
430 | # we don't try to avoid the :80 |
|
|
431 | $self->err(301, "moved permanently", { Location => "http://".$self->server_hostport."$self->{uri}/" }); |
|
|
432 | } else { |
418 | } else { |
433 | $ims < $self->{stat}[9] |
419 | $self->err(404, "not found"); |
|
|
420 | } |
|
|
421 | } else { |
|
|
422 | |
|
|
423 | stat $path |
434 | or $self->err(304, "not modified"); |
424 | or $self->err(404, "not found"); |
435 | |
425 | |
436 | if (-r "$path/index.html") { |
426 | $self->{stat} = [stat _]; |
437 | # replace directory "size" by index.html filesize |
427 | |
438 | $self->{stat}[7] = (stat ($self->{path} .= "/index.html"))[7]; |
428 | # idiotic netscape sends idiotic headers AGAIN |
439 | $self->handle_file; |
429 | my $ims = $self->{h}{"if-modified-since"} =~ /^([^;]+)/ |
|
|
430 | ? str2time $1 : 0; |
|
|
431 | |
|
|
432 | if (-d _ && -r _) { |
|
|
433 | # directory |
|
|
434 | if ($path !~ /\/$/) { |
|
|
435 | # create a redirect to get the trailing "/" |
|
|
436 | # we don't try to avoid the :80 |
|
|
437 | $self->err(301, "moved permanently", { Location => "http://".$self->server_hostport."$self->{uri}/" }); |
440 | } else { |
438 | } else { |
|
|
439 | $ims < $self->{stat}[9] |
|
|
440 | or $self->err(304, "not modified"); |
|
|
441 | |
|
|
442 | if (-r "$path/index.html") { |
|
|
443 | # replace directory "size" by index.html filesize |
|
|
444 | $self->{stat} = [stat ($self->{path} .= "/index.html")]; |
|
|
445 | $self->handle_file($queue_index); |
|
|
446 | } else { |
441 | $self->handle_dir; |
447 | $self->handle_dir; |
442 | } |
448 | } |
443 | } |
449 | } |
444 | } elsif (-f _ && -r _) { |
450 | } elsif (-f _ && -r _) { |
445 | -x _ and $self->err(403, "forbidden"); |
451 | -x _ and $self->err(403, "forbidden"); |
|
|
452 | |
|
|
453 | if (keys %{$conn{$self->{remote_id}}} > $::MAX_TRANSFERS_IP) { |
|
|
454 | my $timeout = $::NOW + 10; |
|
|
455 | while (keys %{$conn{$self->{remote_id}}} > $::MAX_TRANSFERS_IP) { |
|
|
456 | if ($timeout < $::NOW) { |
|
|
457 | $self->block($::BLOCKTIME, "too many connections"); |
|
|
458 | } else { |
|
|
459 | $httpevent->wait; |
|
|
460 | } |
|
|
461 | } |
|
|
462 | } |
|
|
463 | |
446 | $self->handle_file; |
464 | $self->handle_file($queue_file); |
447 | } else { |
465 | } else { |
448 | $self->err(404, "not found"); |
466 | $self->err(404, "not found"); |
|
|
467 | } |
449 | } |
468 | } |
450 | } |
469 | } |
451 | |
470 | |
452 | sub handle_dir { |
471 | sub handle_dir { |
453 | my $self = shift; |
472 | my $self = shift; |
… | |
… | |
455 | |
474 | |
456 | $self->response(200, "ok", |
475 | $self->response(200, "ok", |
457 | { |
476 | { |
458 | "Content-Type" => "text/html", |
477 | "Content-Type" => "text/html", |
459 | "Content-Length" => length $idx, |
478 | "Content-Length" => length $idx, |
|
|
479 | "Last-Modified" => time2str ($self->{stat}[9]), |
460 | }, |
480 | }, |
461 | $idx); |
481 | $idx); |
462 | } |
482 | } |
463 | |
483 | |
464 | sub handle_file { |
484 | sub handle_file { |
465 | my $self = shift; |
485 | my ($self, $queue) = @_; |
466 | my $length = $self->{stat}[7]; |
486 | my $length = $self->{stat}[7]; |
467 | my $queue = $::transfers[$length >= $::TRANSFER_SMALL]; |
|
|
468 | my $hdr = { |
487 | my $hdr = { |
469 | "Last-Modified" => time2str ((stat _)[9]), |
488 | "Last-Modified" => time2str ((stat _)[9]), |
470 | }; |
489 | }; |
471 | |
490 | |
472 | my @code = (200, "ok"); |
491 | my @code = (200, "ok"); |
… | |
… | |
489 | $self->err(416, "not satisfiable", $hdr, ""); |
508 | $self->err(416, "not satisfiable", $hdr, ""); |
490 | |
509 | |
491 | satisfiable: |
510 | satisfiable: |
492 | # check for segmented downloads |
511 | # check for segmented downloads |
493 | if ($l && $::NO_SEGMENTED) { |
512 | if ($l && $::NO_SEGMENTED) { |
494 | my $delay = $::NOW + $::PER_TIMEOUT + 15; |
513 | my $timeout = $::NOW + 15; |
495 | while (%{$uri{$self->{remote_id}}{$self->{uri}}} > 1) { |
514 | while (keys %{$uri{$self->{remote_id}}{$self->{uri}}} > 1) { |
496 | if ($delay <= $::NOW) { |
515 | if ($timeout <= $::NOW) { |
|
|
516 | $self->block($::BLOCKTIME, "segmented downloads are forbidden"); |
497 | $self->err_segmented_download; |
517 | #$self->err_segmented_download; |
498 | } else { |
518 | } else { |
499 | $httpevent->wait; |
519 | $httpevent->wait; |
500 | } |
520 | } |
501 | } |
521 | } |
502 | } |
522 | } |
… | |
… | |
517 | $self->response(@code, $hdr, ""); |
537 | $self->response(@code, $hdr, ""); |
518 | |
538 | |
519 | if ($self->{method} eq "GET") { |
539 | if ($self->{method} eq "GET") { |
520 | $self->{time} = $::NOW; |
540 | $self->{time} = $::NOW; |
521 | |
541 | |
522 | my $fudge = $queue->[0]->waiters; |
542 | my $current = $Coro::current; |
523 | $fudge = $fudge ? ($fudge+1)/$fudge : 1; |
|
|
524 | |
|
|
525 | $queue->[1] *= $fudge; |
|
|
526 | my $transfer = $queue->[0]->guard; |
|
|
527 | |
|
|
528 | if ($fudge != 1) { |
|
|
529 | $queue->[1] /= $fudge; |
|
|
530 | $queue->[1] = $queue->[1] * $::wait_factor |
|
|
531 | + ($::NOW - $self->{time}) * (1 - $::wait_factor); |
|
|
532 | } |
|
|
533 | $self->{time} = $::NOW; |
|
|
534 | |
|
|
535 | $self->{fh}->writable or return; |
|
|
536 | |
543 | |
537 | my ($fh, $buf, $r); |
544 | my ($fh, $buf, $r); |
538 | my $current = $Coro::current; |
545 | |
539 | open $fh, "<", $self->{path} |
546 | open $fh, "<", $self->{path} |
540 | or die "$self->{path}: late open failure ($!)"; |
547 | or die "$self->{path}: late open failure ($!)"; |
541 | |
548 | |
542 | $h -= $l - 1; |
549 | $h -= $l - 1; |
543 | |
550 | |
544 | if (0) { |
551 | if (0) { # !AIO |
545 | if ($l) { |
552 | if ($l) { |
546 | sysseek $fh, $l, 0; |
553 | sysseek $fh, $l, 0; |
547 | } |
554 | } |
548 | } |
555 | } |
|
|
556 | |
|
|
557 | my $transfer = $queue->start_transfer($h); |
|
|
558 | my $locked; |
|
|
559 | my $bufsize = $::WAIT_BUFSIZE; # initial buffer size |
549 | |
560 | |
550 | while ($h > 0) { |
561 | while ($h > 0) { |
|
|
562 | unless ($locked) { |
|
|
563 | if ($locked ||= $transfer->try($::WAIT_INTERVAL)) { |
|
|
564 | $bufsize = $::BUFSIZE; |
|
|
565 | $self->{time} = $::NOW; |
|
|
566 | } |
|
|
567 | } |
|
|
568 | |
|
|
569 | if ($blocked{$self->{remote_id}}) { |
|
|
570 | $self->{h}{connection} = "close"; |
|
|
571 | die bless {}, err::; |
|
|
572 | } |
|
|
573 | |
551 | if (0) { |
574 | if (0) { # !AIO |
552 | sysread $fh, $buf, $h > $::BUFSIZE ? $::BUFSIZE : $h |
575 | sysread $fh, $buf, $h > $bufsize ? $bufsize : $h |
553 | or last; |
576 | or last; |
554 | } else { |
577 | } else { |
555 | aio_read($fh, $l, ($h > $::BUFSIZE ? $::BUFSIZE : $h), |
578 | aio_read($fh, $l, ($h > $bufsize ? $bufsize : $h), |
556 | $buf, 0, sub { |
579 | $buf, 0, sub { |
557 | $r = $_[0]; |
580 | $r = $_[0]; |
558 | Coro::ready($current); |
581 | Coro::ready($current); |
559 | }); |
582 | }); |
560 | &Coro::schedule; |
583 | &Coro::schedule; |