1 | use Coro; |
1 | use Coro; |
2 | use Coro::Semaphore; |
2 | use Coro::Semaphore; |
3 | use Coro::Event; |
3 | use Coro::Event; |
4 | use Coro::Socket; |
4 | use Coro::Socket; |
|
|
5 | use Coro::Signal; |
5 | |
6 | |
6 | use HTTP::Date; |
7 | use HTTP::Date; |
|
|
8 | use POSIX (); |
7 | |
9 | |
8 | no utf8; |
10 | no utf8; |
9 | use bytes; |
11 | use bytes; |
10 | |
12 | |
11 | # at least on my machine, this thingy serves files |
13 | # at least on my machine, this thingy serves files |
… | |
… | |
13 | # and quite a bit slower than thttpd :( |
15 | # and quite a bit slower than thttpd :( |
14 | |
16 | |
15 | $SIG{PIPE} = 'IGNORE'; |
17 | $SIG{PIPE} = 'IGNORE'; |
16 | |
18 | |
17 | our $accesslog; |
19 | our $accesslog; |
|
|
20 | our $errorlog; |
|
|
21 | |
|
|
22 | our $NOW; |
|
|
23 | our $HTTP_NOW; |
|
|
24 | |
|
|
25 | Event->timer(interval => 1, hard => 1, cb => sub { |
|
|
26 | $NOW = time; |
|
|
27 | $HTTP_NOW = time2str $NOW; |
|
|
28 | })->now; |
|
|
29 | |
|
|
30 | if ($ERROR_LOG) { |
|
|
31 | use IO::Handle; |
|
|
32 | open $errorlog, ">>$ERROR_LOG" |
|
|
33 | or die "$ERROR_LOG: $!"; |
|
|
34 | $errorlog->autoflush(1); |
|
|
35 | } |
18 | |
36 | |
19 | if ($ACCESS_LOG) { |
37 | if ($ACCESS_LOG) { |
20 | use IO::Handle; |
38 | use IO::Handle; |
21 | open $accesslog, ">>$ACCESS_LOG" |
39 | open $accesslog, ">>$ACCESS_LOG" |
22 | or die "$ACCESS_LOG: $!"; |
40 | or die "$ACCESS_LOG: $!"; |
… | |
… | |
24 | } |
42 | } |
25 | |
43 | |
26 | sub slog { |
44 | sub slog { |
27 | my $level = shift; |
45 | my $level = shift; |
28 | my $format = shift; |
46 | my $format = shift; |
|
|
47 | my $NOW = (POSIX::strftime "%Y-%m-%d %H:%M:%S", gmtime $::NOW); |
29 | printf "---: $format\n", @_; |
48 | printf "$NOW: $format\n", @_; |
|
|
49 | printf $errorlog "$NOW: $format\n", @_ if $errorlog; |
30 | } |
50 | } |
31 | |
51 | |
32 | our $connections = new Coro::Semaphore $MAX_CONNECTS || 250; |
52 | our $connections = new Coro::Semaphore $MAX_CONNECTS || 250; |
|
|
53 | our $httpevent = new Coro::Signal; |
33 | |
54 | |
34 | our $wait_factor = 0.95; |
55 | our $queue_file = new transferqueue $MAX_TRANSFERS; |
35 | |
56 | our $queue_index = new transferqueue 10; |
36 | our @transfers = ( |
|
|
37 | [(new Coro::Semaphore $MAX_TRANSFERS_SMALL || 50), 1], |
|
|
38 | [(new Coro::Semaphore $MAX_TRANSFERS_LARGE || 50), 1], |
|
|
39 | ); |
|
|
40 | |
57 | |
41 | my @newcons; |
58 | my @newcons; |
42 | my @pool; |
59 | my @pool; |
43 | |
60 | |
44 | # one "execution thread" |
61 | # one "execution thread" |
… | |
… | |
47 | if (@newcons) { |
64 | if (@newcons) { |
48 | eval { |
65 | eval { |
49 | conn->new(@{pop @newcons})->handle; |
66 | conn->new(@{pop @newcons})->handle; |
50 | }; |
67 | }; |
51 | slog 1, "$@" if $@ && !ref $@; |
68 | slog 1, "$@" if $@ && !ref $@; |
|
|
69 | |
|
|
70 | $httpevent->broadcast; # only for testing, but doesn't matter much |
|
|
71 | |
52 | $connections->up; |
72 | $connections->up; |
53 | } else { |
73 | } else { |
54 | last if @pool >= $MAX_POOL; |
74 | last if @pool >= $MAX_POOL; |
55 | push @pool, $Coro::current; |
75 | push @pool, $Coro::current; |
56 | schedule; |
76 | schedule; |
… | |
… | |
98 | or die "unable to start server"; |
118 | or die "unable to start server"; |
99 | |
119 | |
100 | listen_on $http_port; |
120 | listen_on $http_port; |
101 | } |
121 | } |
102 | |
122 | |
103 | our $NOW; |
|
|
104 | our $HTTP_NOW; |
|
|
105 | |
|
|
106 | Event->timer(interval => 1, hard => 1, cb => sub { |
|
|
107 | $NOW = time; |
|
|
108 | $HTTP_NOW = time2str $NOW; |
|
|
109 | })->now; |
|
|
110 | |
|
|
111 | package conn; |
123 | package conn; |
112 | |
124 | |
113 | use Socket; |
125 | use Socket; |
114 | use HTTP::Date; |
126 | use HTTP::Date; |
115 | use Convert::Scalar 'weaken'; |
127 | use Convert::Scalar 'weaken'; |
… | |
… | |
147 | my $peername = shift; |
159 | my $peername = shift; |
148 | my $self = bless { fh => $fh }, $class; |
160 | my $self = bless { fh => $fh }, $class; |
149 | my (undef, $iaddr) = unpack_sockaddr_in $peername |
161 | my (undef, $iaddr) = unpack_sockaddr_in $peername |
150 | or $self->err(500, "unable to decode peername"); |
162 | or $self->err(500, "unable to decode peername"); |
151 | |
163 | |
|
|
164 | $self->{remote_addr} = |
152 | $self->{remote_addr} = inet_ntoa $iaddr; |
165 | $self->{remote_id} = inet_ntoa $iaddr; |
|
|
166 | |
153 | $self->{time} = $::NOW; |
167 | $self->{time} = $::NOW; |
154 | |
168 | |
|
|
169 | weaken ($Coro::current->{conn} = $self); |
|
|
170 | |
155 | $::conns++; |
171 | $::conns++; |
|
|
172 | $::maxconns = $::conns if $::conns > $::maxconns; |
156 | |
173 | |
157 | $self; |
174 | $self; |
158 | } |
175 | } |
159 | |
176 | |
160 | sub DESTROY { |
177 | sub DESTROY { |
161 | my $self = shift; |
178 | #my $self = shift; |
162 | $::conns--; |
179 | $::conns--; |
163 | $self->eoconn; |
|
|
164 | } |
|
|
165 | |
|
|
166 | # end of connection |
|
|
167 | sub eoconn { |
|
|
168 | my $self = shift; |
|
|
169 | |
|
|
170 | # clean up hints |
|
|
171 | delete $conn{$self->{remote_id}}{$self*1}; |
|
|
172 | delete $uri{$self->{remote_id}}{$self->{uri}}{$self*1}; |
|
|
173 | } |
180 | } |
174 | |
181 | |
175 | sub slog { |
182 | sub slog { |
176 | my $self = shift; |
183 | my $self = shift; |
177 | main::slog($_[0], ($self->{remote_id} || $self->{remote_addr}) ."> $_[1]"); |
184 | main::slog($_[0], "$self->{remote_id}> $_[1]"); |
178 | } |
185 | } |
179 | |
186 | |
180 | sub response { |
187 | sub response { |
181 | my ($self, $code, $msg, $hdr, $content) = @_; |
188 | my ($self, $code, $msg, $hdr, $content) = @_; |
182 | my $res = "HTTP/1.1 $code $msg\015\012"; |
189 | my $res = "HTTP/1.1 $code $msg\015\012"; |
183 | |
190 | |
184 | $self->{h}{connection} = "close" if $hdr->{Connection} =~ /close/; |
191 | if (exists $hdr->{Connection}) { |
|
|
192 | if ($hdr->{Connection} =~ /close/) { |
|
|
193 | $self->{h}{connection} = "close" |
|
|
194 | } |
|
|
195 | } else { |
|
|
196 | if ($self->{version} < 1.1) { |
|
|
197 | if ($self->{h}{connection} =~ /keep-alive/i) { |
|
|
198 | $hdr->{Connection} = "Keep-Alive"; |
|
|
199 | } else { |
|
|
200 | $self->{h}{connection} = "close" |
|
|
201 | } |
|
|
202 | } |
|
|
203 | } |
185 | |
204 | |
186 | $res .= "Date: $HTTP_NOW\015\012"; |
205 | $res .= "Date: $HTTP_NOW\015\012"; |
187 | |
206 | |
188 | while (my ($h, $v) = each %$hdr) { |
207 | while (my ($h, $v) = each %$hdr) { |
189 | $res .= "$h: $v\015\012" |
208 | $res .= "$h: $v\015\012" |
190 | } |
209 | } |
191 | $res .= "\015\012"; |
210 | $res .= "\015\012"; |
192 | |
211 | |
193 | $res .= $content if defined $content and $self->{method} ne "HEAD"; |
212 | $res .= $content if defined $content and $self->{method} ne "HEAD"; |
194 | |
213 | |
195 | my $log = "$self->{remote_addr} \"$self->{uri}\" $code ".$hdr->{"Content-Length"}." \"$self->{h}{referer}\"\n"; |
214 | my $log = (POSIX::strftime "%Y-%m-%d %H:%M:%S", gmtime $NOW). |
|
|
215 | " $self->{remote_id} \"$self->{uri}\" $code ".$hdr->{"Content-Length"}. |
|
|
216 | " \"$self->{h}{referer}\"\n"; |
196 | |
217 | |
197 | print $accesslog $log if $accesslog; |
218 | print $accesslog $log if $accesslog; |
198 | print STDERR $log; |
219 | print STDERR $log; |
199 | |
220 | |
200 | $self->{written} += |
221 | $self->{written} += |
… | |
… | |
284 | $id .= "[".$self->{h}{"x-forwarded-for"}."]"; |
305 | $id .= "[".$self->{h}{"x-forwarded-for"}."]"; |
285 | } |
306 | } |
286 | |
307 | |
287 | $self->{remote_id} = $id; |
308 | $self->{remote_id} = $id; |
288 | |
309 | |
|
|
310 | weaken (local $conn{$id}{$self*1} = $self); |
|
|
311 | |
289 | if ($blocked{$id}) { |
312 | if ($blocked{$id}) { |
290 | $self->err_blocked($blocked{$id}) |
313 | $self->err_blocked |
291 | if $blocked{$id} > $::NOW; |
314 | if $blocked{$id}[0] > $::NOW; |
292 | |
315 | |
293 | delete $blocked{$id}; |
316 | delete $blocked{$id}; |
294 | } |
|
|
295 | |
|
|
296 | if (%{$conn{$id}} >= $::MAX_CONN_IP) { |
|
|
297 | my $delay = $::PER_TIMEOUT + 15; |
|
|
298 | while (%{$conn{$id}} >= $::MAX_CONN_IP) { |
|
|
299 | if ($delay <= 0) { |
|
|
300 | $self->slog(2, "blocked ip $id"); |
|
|
301 | $self->err_blocked; |
|
|
302 | } else { |
|
|
303 | Coro::Event::do_timer(after => 4); $delay -= 4; |
|
|
304 | } |
|
|
305 | } |
|
|
306 | } |
317 | } |
307 | |
318 | |
308 | # find out server name and port |
319 | # find out server name and port |
309 | if ($self->{uri} =~ s/^http:\/\/([^\/?#]*)//i) { |
320 | if ($self->{uri} =~ s/^http:\/\/([^\/?#]*)//i) { |
310 | $host = $1; |
321 | $host = $1; |
… | |
… | |
321 | $host = inet_ntoa $host; |
332 | $host = inet_ntoa $host; |
322 | } |
333 | } |
323 | |
334 | |
324 | $self->{server_name} = $host; |
335 | $self->{server_name} = $host; |
325 | |
336 | |
326 | # enter ourselves into various lists |
|
|
327 | weaken ($conn{$id}{$self*1} = $self); |
|
|
328 | weaken ($uri{$id}{$self->{uri}}{$self*1} = $self); |
337 | weaken (local $uri{$id}{$self->{uri}}{$self*1} = $self); |
329 | |
338 | |
330 | eval { |
339 | eval { |
331 | $self->map_uri; |
340 | $self->map_uri; |
332 | $self->respond; |
341 | $self->respond; |
333 | }; |
342 | }; |
334 | |
343 | |
335 | $self->eoconn; |
|
|
336 | |
|
|
337 | die if $@ && !ref $@; |
344 | die if $@ && !ref $@; |
338 | |
345 | |
339 | last if $self->{h}{connection} =~ /close/ || $self->{version} < 1.1; |
346 | last if $self->{h}{connection} =~ /close/i; |
|
|
347 | |
|
|
348 | $httpevent->broadcast; |
340 | |
349 | |
341 | $fh->timeout($::PER_TIMEOUT); |
350 | $fh->timeout($::PER_TIMEOUT); |
342 | } |
351 | } |
|
|
352 | } |
|
|
353 | |
|
|
354 | sub block { |
|
|
355 | my $self = shift; |
|
|
356 | |
|
|
357 | $blocked{$self->{remote_id}} = [$::NOW + $_[0], $_[1]]; |
|
|
358 | $self->slog(2, "blocked ip $self->{remote_id}"); |
|
|
359 | $self->err_blocked; |
343 | } |
360 | } |
344 | |
361 | |
345 | # uri => path mapping |
362 | # uri => path mapping |
346 | sub map_uri { |
363 | sub map_uri { |
347 | my $self = shift; |
364 | my $self = shift; |
… | |
… | |
394 | |
411 | |
395 | sub respond { |
412 | sub respond { |
396 | my $self = shift; |
413 | my $self = shift; |
397 | my $path = $self->{path}; |
414 | my $path = $self->{path}; |
398 | |
415 | |
399 | stat $path |
416 | if ($self->{name} =~ s%^/internal/([^/]+)%%) { |
400 | or $self->err(404, "not found"); |
417 | if ($::internal{$1}) { |
401 | |
418 | $::internal{$1}->($self); |
402 | $self->{stat} = [stat _]; |
|
|
403 | |
|
|
404 | # idiotic netscape sends idiotic headers AGAIN |
|
|
405 | my $ims = $self->{h}{"if-modified-since"} =~ /^([^;]+)/ |
|
|
406 | ? str2time $1 : 0; |
|
|
407 | |
|
|
408 | if (-d _ && -r _) { |
|
|
409 | # directory |
|
|
410 | if ($path !~ /\/$/) { |
|
|
411 | # create a redirect to get the trailing "/" |
|
|
412 | # we don't try to avoid the :80 |
|
|
413 | $self->err(301, "moved permanently", { Location => "http://".$self->server_hostport."$self->{uri}/" }); |
|
|
414 | } else { |
419 | } else { |
415 | $ims < $self->{stat}[9] |
420 | $self->err(404, "not found"); |
|
|
421 | } |
|
|
422 | } else { |
|
|
423 | |
|
|
424 | stat $path |
416 | or $self->err(304, "not modified"); |
425 | or $self->err(404, "not found"); |
417 | |
426 | |
418 | if (-r "$path/index.html") { |
427 | $self->{stat} = [stat _]; |
419 | $self->{path} .= "/index.html"; |
428 | |
420 | $self->handle_file; |
429 | # idiotic netscape sends idiotic headers AGAIN |
|
|
430 | my $ims = $self->{h}{"if-modified-since"} =~ /^([^;]+)/ |
|
|
431 | ? str2time $1 : 0; |
|
|
432 | |
|
|
433 | if (-d _ && -r _) { |
|
|
434 | # directory |
|
|
435 | if ($path !~ /\/$/) { |
|
|
436 | # create a redirect to get the trailing "/" |
|
|
437 | # we don't try to avoid the :80 |
|
|
438 | $self->err(301, "moved permanently", { Location => "http://".$self->server_hostport."$self->{uri}/" }); |
421 | } else { |
439 | } else { |
|
|
440 | $ims < $self->{stat}[9] |
|
|
441 | or $self->err(304, "not modified"); |
|
|
442 | |
|
|
443 | if (-r "$path/index.html") { |
|
|
444 | # replace directory "size" by index.html filesize |
|
|
445 | $self->{stat} = [stat ($self->{path} .= "/index.html")]; |
|
|
446 | $self->handle_file($queue_index); |
|
|
447 | } else { |
422 | $self->handle_dir; |
448 | $self->handle_dir; |
423 | } |
449 | } |
424 | } |
450 | } |
425 | } elsif (-f _ && -r _) { |
451 | } elsif (-f _ && -r _) { |
426 | -x _ and $self->err(403, "forbidden"); |
452 | -x _ and $self->err(403, "forbidden"); |
|
|
453 | |
|
|
454 | if (keys %{$conn{$self->{remote_id}}} > $::MAX_TRANSFERS_IP) { |
|
|
455 | my $timeout = $::NOW + 10; |
|
|
456 | while (keys %{$conn{$self->{remote_id}}} > $::MAX_TRANSFERS_IP) { |
|
|
457 | if ($timeout < $::NOW) { |
|
|
458 | $self->block($::BLOCKTIME, "too many connections"); |
|
|
459 | } else { |
|
|
460 | $httpevent->wait; |
|
|
461 | } |
|
|
462 | } |
|
|
463 | } |
|
|
464 | |
427 | $self->handle_file; |
465 | $self->handle_file($queue_file); |
428 | } else { |
466 | } else { |
429 | $self->err(404, "not found"); |
467 | $self->err(404, "not found"); |
|
|
468 | } |
430 | } |
469 | } |
431 | } |
470 | } |
432 | |
471 | |
433 | sub handle_dir { |
472 | sub handle_dir { |
434 | my $self = shift; |
473 | my $self = shift; |
… | |
… | |
436 | |
475 | |
437 | $self->response(200, "ok", |
476 | $self->response(200, "ok", |
438 | { |
477 | { |
439 | "Content-Type" => "text/html", |
478 | "Content-Type" => "text/html", |
440 | "Content-Length" => length $idx, |
479 | "Content-Length" => length $idx, |
|
|
480 | "Last-Modified" => time2str ($self->{stat}[9]), |
441 | }, |
481 | }, |
442 | $idx); |
482 | $idx); |
443 | } |
483 | } |
444 | |
484 | |
445 | sub handle_file { |
485 | sub handle_file { |
446 | my $self = shift; |
486 | my ($self, $queue) = @_; |
447 | my $length = $self->{stat}[7]; |
487 | my $length = $self->{stat}[7]; |
448 | my $queue = $::transfers[$length >= $::TRANSFER_SMALL]; |
|
|
449 | my $hdr = { |
488 | my $hdr = { |
450 | "Last-Modified" => time2str ((stat _)[9]), |
489 | "Last-Modified" => time2str ((stat _)[9]), |
451 | }; |
490 | }; |
452 | |
491 | |
453 | my @code = (200, "ok"); |
492 | my @code = (200, "ok"); |
… | |
… | |
470 | $self->err(416, "not satisfiable", $hdr, ""); |
509 | $self->err(416, "not satisfiable", $hdr, ""); |
471 | |
510 | |
472 | satisfiable: |
511 | satisfiable: |
473 | # check for segmented downloads |
512 | # check for segmented downloads |
474 | if ($l && $::NO_SEGMENTED) { |
513 | if ($l && $::NO_SEGMENTED) { |
475 | my $delay = $::PER_TIMEOUT + 15; |
514 | my $timeout = $::NOW + 15; |
476 | while (%{$uri{$self->{remote_id}}{$self->{uri}}} > 1) { |
515 | while (keys %{$uri{$self->{remote_id}}{$self->{uri}}} > 1) { |
477 | if ($delay <= 0) { |
516 | if ($timeout <= $::NOW) { |
|
|
517 | $self->block($::BLOCKTIME, "segmented downloads are forbidden"); |
478 | $self->err_segmented_download; |
518 | #$self->err_segmented_download; |
479 | } else { |
519 | } else { |
480 | Coro::Event::do_timer(after => 4); $delay -= 4; |
520 | $httpevent->wait; |
481 | } |
521 | } |
482 | } |
522 | } |
483 | } |
523 | } |
484 | |
524 | |
485 | $hdr->{"Content-Range"} = "bytes $l-$h/$length"; |
525 | $hdr->{"Content-Range"} = "bytes $l-$h/$length"; |
… | |
… | |
498 | $self->response(@code, $hdr, ""); |
538 | $self->response(@code, $hdr, ""); |
499 | |
539 | |
500 | if ($self->{method} eq "GET") { |
540 | if ($self->{method} eq "GET") { |
501 | $self->{time} = $::NOW; |
541 | $self->{time} = $::NOW; |
502 | |
542 | |
503 | my $fudge = $queue->[0]->waiters; |
543 | my $current = $Coro::current; |
504 | $fudge = $fudge ? ($fudge+1)/$fudge : 1; |
|
|
505 | |
|
|
506 | $queue->[1] *= $fudge; |
|
|
507 | my $transfer = $queue->[0]->guard; |
|
|
508 | |
|
|
509 | if ($fudge != 1) { |
|
|
510 | $queue->[1] /= $fudge; |
|
|
511 | $queue->[1] = $queue->[1] * $::wait_factor |
|
|
512 | + ($::NOW - $self->{time}) * (1 - $::wait_factor); |
|
|
513 | } |
|
|
514 | $self->{time} = $::NOW; |
|
|
515 | |
|
|
516 | $self->{fh}->writable or return; |
|
|
517 | |
544 | |
518 | my ($fh, $buf, $r); |
545 | my ($fh, $buf, $r); |
519 | my $current = $Coro::current; |
546 | |
520 | open $fh, "<", $self->{path} |
547 | open $fh, "<", $self->{path} |
521 | or die "$self->{path}: late open failure ($!)"; |
548 | or die "$self->{path}: late open failure ($!)"; |
522 | |
549 | |
523 | $h -= $l - 1; |
550 | $h -= $l - 1; |
524 | |
551 | |
525 | if (0) { |
552 | if (0) { # !AIO |
526 | if ($l) { |
553 | if ($l) { |
527 | sysseek $fh, $l, 0; |
554 | sysseek $fh, $l, 0; |
528 | } |
555 | } |
529 | } |
556 | } |
|
|
557 | |
|
|
558 | my $transfer = $queue->start_transfer($h); |
|
|
559 | my $locked; |
|
|
560 | my $bufsize = $::WAIT_BUFSIZE; # initial buffer size |
530 | |
561 | |
531 | while ($h > 0) { |
562 | while ($h > 0) { |
|
|
563 | unless ($locked) { |
|
|
564 | if ($locked ||= $transfer->try($::WAIT_INTERVAL)) { |
|
|
565 | $bufsize = $::BUFSIZE; |
|
|
566 | $self->{time} = $::NOW; |
|
|
567 | } |
|
|
568 | } |
|
|
569 | |
|
|
570 | if ($blocked{$self->{remote_id}}) { |
|
|
571 | $self->{h}{connection} = "close"; |
|
|
572 | die bless {}, err::; |
|
|
573 | } |
|
|
574 | |
532 | if (0) { |
575 | if (0) { # !AIO |
533 | sysread $fh, $buf, $h > $::BUFSIZE ? $::BUFSIZE : $h |
576 | sysread $fh, $buf, $h > $bufsize ? $bufsize : $h |
534 | or last; |
577 | or last; |
535 | } else { |
578 | } else { |
536 | aio_read($fh, $l, ($h > $::BUFSIZE ? $::BUFSIZE : $h), |
579 | aio_read($fh, $l, ($h > $bufsize ? $bufsize : $h), |
537 | $buf, 0, sub { |
580 | $buf, 0, sub { |
538 | $r = $_[0]; |
581 | $r = $_[0]; |
539 | Coro::ready($current); |
582 | Coro::ready($current); |
540 | }); |
583 | }); |
541 | &Coro::schedule; |
584 | &Coro::schedule; |