ViewVC Help
View File | Revision Log | Show Annotations | Download File
/cvs/cvsroot/Coro/myhttpd/httpd.pl
(Generate patch)

Comparing cvsroot/Coro/myhttpd/httpd.pl (file contents):
Revision 1.44 by root, Fri Sep 14 12:38:18 2001 UTC vs.
Revision 1.80 by root, Fri Dec 1 04:18:32 2006 UTC

1use Coro; 1use Coro;
2use Coro::Semaphore; 2use Coro::Semaphore;
3use Coro::Event; 3use Coro::Event;
4use Coro::Socket; 4use Coro::Socket;
5use Coro::Signal; 5use Coro::Signal;
6use Coro::AIO ();
6 7
7use HTTP::Date; 8use HTTP::Date;
9use POSIX ();
10
11use Compress::Zlib ();
8 12
9no utf8; 13no utf8;
10use bytes; 14use bytes;
11 15
12# at least on my machine, this thingy serves files 16# at least on my machine, this thingy serves files
14# and quite a bit slower than thttpd :( 18# and quite a bit slower than thttpd :(
15 19
16$SIG{PIPE} = 'IGNORE'; 20$SIG{PIPE} = 'IGNORE';
17 21
18our $accesslog; 22our $accesslog;
23our $errorlog;
24
25our $NOW;
26our $HTTP_NOW;
27
28our $ERROR_LOG;
29our $ACCESS_LOG;
30
31Event->timer(interval => 1, hard => 1, cb => sub {
32 $NOW = time;
33 $HTTP_NOW = time2str $NOW;
34})->now;
35
36if ($ERROR_LOG) {
37 use IO::Handle;
38 open $errorlog, ">>$ERROR_LOG"
39 or die "$ERROR_LOG: $!";
40 $errorlog->autoflush(1);
41}
19 42
20if ($ACCESS_LOG) { 43if ($ACCESS_LOG) {
21 use IO::Handle; 44 use IO::Handle;
22 open $accesslog, ">>$ACCESS_LOG" 45 open $accesslog, ">>$ACCESS_LOG"
23 or die "$ACCESS_LOG: $!"; 46 or die "$ACCESS_LOG: $!";
25} 48}
26 49
27sub slog { 50sub slog {
28 my $level = shift; 51 my $level = shift;
29 my $format = shift; 52 my $format = shift;
53 my $NOW = (POSIX::strftime "%Y-%m-%d %H:%M:%S", gmtime $::NOW);
30 printf "---: $format\n", @_; 54 printf "$NOW: $format\n", @_;
55 printf $errorlog "$NOW: $format\n", @_ if $errorlog;
31} 56}
32 57
33our $connections = new Coro::Semaphore $MAX_CONNECTS || 250; 58our $connections = new Coro::Semaphore $MAX_CONNECTS || 250;
34our $httpevent = new Coro::Signal; 59our $httpevent = new Coro::Signal;
35 60
36our $wait_factor = 0.95; 61our $queue_file = new transferqueue $MAX_TRANSFERS;
62our $queue_index = new transferqueue 10;
37 63
38our @transfers = ( 64our $tbf_top = new tbf rate => $TBF_RATE || 100000;
39 [(new Coro::Semaphore $MAX_TRANSFERS_SMALL || 50), 1], 65
40 [(new Coro::Semaphore $MAX_TRANSFERS_LARGE || 50), 1], 66my $unused_bytes = 0;
41); 67my $unused_last = time;
68
69sub unused_bandwidth {
70 $unused_bytes += $_[0];
71 if ($unused_last < $NOW - 30 && $unused_bytes / ($NOW - $unused_last) > 50000) {
72 $unused_last = $NOW;
73 $unused_bytes = 0;
74 $queue_file->force_wake_next;
75 slog 1, "forced filetransfer due to unused bandwidth";
76 }
77}
42 78
43my @newcons; 79my @newcons;
44my @pool; 80my @pool;
45 81
46# one "execution thread" 82# one "execution thread"
49 if (@newcons) { 85 if (@newcons) {
50 eval { 86 eval {
51 conn->new(@{pop @newcons})->handle; 87 conn->new(@{pop @newcons})->handle;
52 }; 88 };
53 slog 1, "$@" if $@ && !ref $@; 89 slog 1, "$@" if $@ && !ref $@;
90
91 $httpevent->broadcast; # only for testing, but doesn't matter much
92
54 $connections->up; 93 $connections->up;
55 } else { 94 } else {
56 last if @pool >= $MAX_POOL; 95 last if @pool >= $MAX_POOL;
57 push @pool, $Coro::current; 96 push @pool, $Coro::current;
58 schedule; 97 schedule;
75 if (@pool) { 114 if (@pool) {
76 (pop @pool)->ready; 115 (pop @pool)->ready;
77 } else { 116 } else {
78 async \&handler; 117 async \&handler;
79 } 118 }
80
81 } 119 }
82 }; 120 };
83} 121}
84 122
85my $http_port = new Coro::Socket 123my $http_port = new Coro::Socket
100 or die "unable to start server"; 138 or die "unable to start server";
101 139
102 listen_on $http_port; 140 listen_on $http_port;
103} 141}
104 142
105our $NOW;
106our $HTTP_NOW;
107
108Event->timer(interval => 1, hard => 1, cb => sub {
109 $NOW = time;
110 $HTTP_NOW = time2str $NOW;
111})->now;
112
113package conn; 143package conn;
144
145use strict;
146use bytes;
114 147
115use Socket; 148use Socket;
116use HTTP::Date; 149use HTTP::Date;
117use Convert::Scalar 'weaken'; 150use Convert::Scalar 'weaken';
118use Linux::AIO; 151use IO::AIO;
119 152
120Linux::AIO::min_parallel $::AIO_PARALLEL; 153IO::AIO::min_parallel $::AIO_PARALLEL;
121 154
122Event->io(fd => Linux::AIO::poll_fileno, 155Event->io (fd => IO::AIO::poll_fileno,
123 poll => 'r', async => 1, 156 poll => 'r', async => 1,
124 cb => \&Linux::AIO::poll_cb); 157 cb => \&IO::AIO::poll_cb);
125 158
126our %conn; # $conn{ip}{self} => connobj 159our %conn; # $conn{ip}{self} => connobj
127our %uri; # $uri{ip}{uri}{self} 160our %uri; # $uri{ip}{uri}{self}
128our %blocked; 161our %blocked;
129our %mimetype; 162our %mimetype;
149 my $peername = shift; 182 my $peername = shift;
150 my $self = bless { fh => $fh }, $class; 183 my $self = bless { fh => $fh }, $class;
151 my (undef, $iaddr) = unpack_sockaddr_in $peername 184 my (undef, $iaddr) = unpack_sockaddr_in $peername
152 or $self->err(500, "unable to decode peername"); 185 or $self->err(500, "unable to decode peername");
153 186
187 $self->{remote_addr} =
154 $self->{remote_addr} = inet_ntoa $iaddr; 188 $self->{remote_id} = inet_ntoa $iaddr;
189
155 $self->{time} = $::NOW; 190 $self->{time} = $::NOW;
156 191
192 weaken ($Coro::current->{conn} = $self);
193
157 $::conns++; 194 $::conns++;
195 $::maxconns = $::conns if $::conns > $::maxconns;
158 196
159 $self; 197 $self;
160} 198}
161 199
162sub DESTROY { 200sub DESTROY {
163 my $self = shift; 201 #my $self = shift;
164 $::conns--; 202 $::conns--;
165 $self->eoconn;
166} 203}
167 204
168# end of connection 205sub prune_cache {
169sub eoconn { 206 my $hash = $_[0];
170 my $self = shift;
171 207
172 # clean up hints 208 for (keys %$hash) {
173 delete $conn{$self->{remote_id}}{$self*1}; 209 if (ref $hash->{$_} eq HASH::) {
174 delete $uri{$self->{remote_id}}{$self->{uri}}{$self*1}; 210 prune_cache($hash->{$_});
175 211 unless (scalar keys %{$hash->{$_}}) {
176 $httpevent->broadcast; 212 delete $hash->{$_};
213 }
214 }
215 }
177} 216}
217
218sub prune_caches {
219 prune_cache \%conn;
220 prune_cache \%uri;
221
222 for (keys %blocked) {
223 delete $blocked{$_} unless $blocked{$_}[0] > $::NOW;
224 }
225}
226
227Event->timer(interval => 60, cb => \&prune_caches);
178 228
179sub slog { 229sub slog {
180 my $self = shift; 230 my $self = shift;
181 main::slog($_[0], ($self->{remote_id} || $self->{remote_addr}) ."> $_[1]"); 231 main::slog($_[0], "$self->{remote_id}> $_[1]");
182} 232}
183 233
184sub response { 234sub response {
185 my ($self, $code, $msg, $hdr, $content) = @_; 235 my ($self, $code, $msg, $hdr, $content) = @_;
186 my $res = "HTTP/1.1 $code $msg\015\012"; 236 my $res = "HTTP/1.1 $code $msg\015\012";
237 my $GZ = "";
187 238
188 $self->{h}{connection} = "close" if $hdr->{Connection} =~ /close/; 239 if (exists $hdr->{Connection}) {
240 if ($hdr->{Connection} =~ /close/) {
241 $self->{h}{connection} = "close"
242 }
243 } else {
244 if ($self->{version} < 1.1) {
245 if ($self->{h}{connection} =~ /keep-alive/i) {
246 $hdr->{Connection} = "Keep-Alive";
247 } else {
248 $self->{h}{connection} = "close"
249 }
250 }
251 }
252
253 if ($self->{method} ne "HEAD"
254 && $self->{h}{"accept-encoding"} =~ /\bgzip\b/
255 && 400 < length $content
256 && $hdr->{"Content-Length"} == length $content
257 && !exists $hdr->{"Content-Encoding"}
258 ) {
259 my $orig = length $content;
260 $hdr->{"Content-Encoding"} = "gzip";
261 $content = Compress::Zlib::memGzip(\$content);
262 $hdr->{"Content-Length"} = length $content;
263 $GZ = sprintf "GZ%02d", 100 - 100*((length $content) / $orig);
264 }
189 265
190 $res .= "Date: $HTTP_NOW\015\012"; 266 $res .= "Date: $HTTP_NOW\015\012";
267 $res .= "Server: $::NAME\015\012";
191 268
192 while (my ($h, $v) = each %$hdr) { 269 while (my ($h, $v) = each %$hdr) {
193 $res .= "$h: $v\015\012" 270 $res .= "$h: $v\015\012"
194 } 271 }
195 $res .= "\015\012"; 272 $res .= "\015\012";
196 273
197 $res .= $content if defined $content and $self->{method} ne "HEAD"; 274 $res .= $content if defined $content and $self->{method} ne "HEAD";
198 275
199 my $log = "$self->{remote_addr} \"$self->{uri}\" $code ".$hdr->{"Content-Length"}." \"$self->{h}{referer}\"\n"; 276 my $log = (POSIX::strftime "%Y-%m-%d %H:%M:%S", gmtime $::NOW).
277 " $self->{remote_id} \"$self->{uri}\" $code ".$hdr->{"Content-Length"}.$GZ.
278 " \"$self->{h}{referer}\"\n";
200 279
201 print $accesslog $log if $accesslog; 280 print $::accesslog $log if $::accesslog;
202 print STDERR $log; 281 print STDERR $log;
203 282
204 $self->{written} += 283 $tbf_top->request(length $res, 1e6);
205 print {$self->{fh}} $res; 284 $self->{written} += print {$self->{fh}} $res;
206} 285}
207 286
208sub err { 287sub err {
209 my $self = shift; 288 my $self = shift;
210 my ($code, $msg, $hdr, $content) = @_; 289 my ($code, $msg, $hdr, $content) = @_;
265 my (%hdr, $h, $v); 344 my (%hdr, $h, $v);
266 345
267 $hdr{lc $1} .= ",$2" 346 $hdr{lc $1} .= ",$2"
268 while $req =~ /\G 347 while $req =~ /\G
269 ([^:\000-\040]+): 348 ([^:\000-\040]+):
270 [\008\040]* 349 [\011\040]*
271 ((?: [^\015\012]+ | \015\012[\008\040] )*) 350 ((?: [^\015\012]+ | \015\012[\011\040] )*)
272 \015\012 351 \015\012
273 /gxc; 352 /gxc;
274 353
275 $req =~ /\G\015\012$/ 354 $req =~ /\G\015\012$/
276 or $self->err(400, "bad request"); 355 or $self->err(400, "bad request");
288 $id .= "[".$self->{h}{"x-forwarded-for"}."]"; 367 $id .= "[".$self->{h}{"x-forwarded-for"}."]";
289 } 368 }
290 369
291 $self->{remote_id} = $id; 370 $self->{remote_id} = $id;
292 371
372 weaken (local $conn{$id}{$self*1} = $self);
373
293 if ($blocked{$id}) { 374 if ($blocked{$id}) {
294 $self->err_blocked($blocked{$id}) 375 $self->err_blocked
295 if $blocked{$id} > $::NOW; 376 if $blocked{$id}[0] > $::NOW;
296 377
297 delete $blocked{$id}; 378 delete $blocked{$id};
298 }
299
300 if (%{$conn{$id}} >= $::MAX_CONN_IP) {
301 my $delay = $::PER_TIMEOUT + $::NOW + 15;
302 while (%{$conn{$id}} >= $::MAX_CONN_IP) {
303 if ($delay < $::NOW) {
304 $self->slog(2, "blocked ip $id");
305 $self->err_blocked;
306 } else {
307 $httpevent->wait;
308 }
309 }
310 } 379 }
311 380
312 # find out server name and port 381 # find out server name and port
313 if ($self->{uri} =~ s/^http:\/\/([^\/?#]*)//i) { 382 if ($self->{uri} =~ s/^http:\/\/([^\/?#]*)//i) {
314 $host = $1; 383 $host = $1;
325 $host = inet_ntoa $host; 394 $host = inet_ntoa $host;
326 } 395 }
327 396
328 $self->{server_name} = $host; 397 $self->{server_name} = $host;
329 398
330 # enter ourselves into various lists
331 weaken ($conn{$id}{$self*1} = $self);
332 weaken ($uri{$id}{$self->{uri}}{$self*1} = $self); 399 weaken (local $uri{$id}{$self->{uri}}{$self*1} = $self);
333 400
334 eval { 401 eval {
335 $self->map_uri; 402 $self->map_uri;
336 $self->respond; 403 $self->respond;
337 }; 404 };
338 405
339 $self->eoconn;
340
341 die if $@ && !ref $@; 406 die if $@ && !ref $@;
342 407
343 last if $self->{h}{connection} =~ /close/ || $self->{version} < 1.1; 408 last if $self->{h}{connection} =~ /close/i;
344 409
345 $httpevent->broadcast; 410 $httpevent->broadcast;
346 411
347 $fh->timeout($::PER_TIMEOUT); 412 $fh->timeout($::PER_TIMEOUT);
348 } 413 }
414}
415
416sub block {
417 my $self = shift;
418
419 $blocked{$self->{remote_id}} = [$::NOW + $_[0], $_[1]];
420 $self->slog(2, "blocked ip $self->{remote_id}");
421 $self->err_blocked;
349} 422}
350 423
351# uri => path mapping 424# uri => path mapping
352sub map_uri { 425sub map_uri {
353 my $self = shift; 426 my $self = shift;
400 473
401sub respond { 474sub respond {
402 my $self = shift; 475 my $self = shift;
403 my $path = $self->{path}; 476 my $path = $self->{path};
404 477
405 stat $path 478 if ($self->{name} =~ s%^/internal/([^/]+)%%) {
406 or $self->err(404, "not found"); 479 if ($::internal{$1}) {
407 480 $::internal{$1}->($self);
408 $self->{stat} = [stat _];
409
410 # idiotic netscape sends idiotic headers AGAIN
411 my $ims = $self->{h}{"if-modified-since"} =~ /^([^;]+)/
412 ? str2time $1 : 0;
413
414 if (-d _ && -r _) {
415 # directory
416 if ($path !~ /\/$/) {
417 # create a redirect to get the trailing "/"
418 # we don't try to avoid the :80
419 $self->err(301, "moved permanently", { Location => "http://".$self->server_hostport."$self->{uri}/" });
420 } else { 481 } else {
421 $ims < $self->{stat}[9] 482 $self->err(404, "not found");
483 }
484 } else {
485
486 stat $path
422 or $self->err(304, "not modified"); 487 or $self->err(404, "not found");
423 488
424 if (-r "$path/index.html") { 489 $self->{stat} = [stat _];
425 $self->{path} .= "/index.html"; 490
426 $self->handle_file; 491 # idiotic netscape sends idiotic headers AGAIN
492 my $ims = $self->{h}{"if-modified-since"} =~ /^([^;]+)/
493 ? str2time $1 : 0;
494
495 if (-d _ && -r _) {
496 # directory
497 if ($path !~ /\/$/) {
498 # create a redirect to get the trailing "/"
499 # we don't try to avoid the :80
500 $self->err(301, "moved permanently", { Location => "http://".$self->server_hostport."$self->{uri}/" });
427 } else { 501 } else {
502 $ims < $self->{stat}[9]
503 or $self->err(304, "not modified");
504
505 if (-r "$path/index.html") {
506 # replace directory "size" by index.html filesize
507 $self->{stat} = [stat ($self->{path} .= "/index.html")];
508 $self->handle_file($queue_index, $tbf_top);
509 } else {
428 $self->handle_dir; 510 $self->handle_dir;
429 } 511 }
430 } 512 }
431 } elsif (-f _ && -r _) { 513 } elsif (-f _ && -r _) {
432 -x _ and $self->err(403, "forbidden"); 514 -x _ and $self->err(403, "forbidden");
433 $self->handle_file; 515
516 if (keys %{$conn{$self->{remote_id}}} > $::MAX_TRANSFERS_IP) {
517 my $timeout = $::NOW + 10;
518 while (keys %{$conn{$self->{remote_id}}} > $::MAX_TRANSFERS_IP) {
519 if ($timeout < $::NOW) {
520 $self->block($::BLOCKTIME, "too many connections");
521 } else {
522 $httpevent->wait;
523 }
524 }
525 }
526
527 $self->handle_file($queue_file, $tbf_top);
434 } else { 528 } else {
435 $self->err(404, "not found"); 529 $self->err(404, "not found");
530 }
436 } 531 }
437} 532}
438 533
439sub handle_dir { 534sub handle_dir {
440 my $self = shift; 535 my $self = shift;
441 my $idx = $self->diridx; 536 my $idx = $self->diridx;
442 537
443 $self->response(200, "ok", 538 $self->response(200, "ok",
444 { 539 {
445 "Content-Type" => "text/html", 540 "Content-Type" => "text/html; charset=utf-8",
446 "Content-Length" => length $idx, 541 "Content-Length" => length $idx,
542 "Last-Modified" => time2str ($self->{stat}[9]),
447 }, 543 },
448 $idx); 544 $idx);
449} 545}
450 546
451sub handle_file { 547sub handle_file {
452 my $self = shift; 548 my ($self, $queue, $tbf) = @_;
453 my $length = $self->{stat}[7]; 549 my $length = $self->{stat}[7];
454 my $queue = $::transfers[$length >= $::TRANSFER_SMALL];
455 my $hdr = { 550 my $hdr = {
456 "Last-Modified" => time2str ((stat _)[9]), 551 "Last-Modified" => time2str ((stat _)[9]),
552 "Accept-Ranges" => "bytes",
457 }; 553 };
458 554
459 my @code = (200, "ok"); 555 my @code = (200, "ok");
460 my ($l, $h); 556 my ($l, $h);
461 557
476 $self->err(416, "not satisfiable", $hdr, ""); 572 $self->err(416, "not satisfiable", $hdr, "");
477 573
478satisfiable: 574satisfiable:
479 # check for segmented downloads 575 # check for segmented downloads
480 if ($l && $::NO_SEGMENTED) { 576 if ($l && $::NO_SEGMENTED) {
481 my $delay = $::NOW + $::PER_TIMEOUT + 15; 577 my $timeout = $::NOW + 15;
482 while (%{$uri{$self->{remote_id}}{$self->{uri}}} > 1) { 578 while (keys %{$uri{$self->{remote_id}}{$self->{uri}}} > 1) {
483 if ($delay <= $::NOW) { 579 if ($timeout <= $::NOW) {
580 $self->block($::BLOCKTIME, "segmented downloads are forbidden");
484 $self->err_segmented_download; 581 #$self->err_segmented_download;
485 } else { 582 } else {
486 $httpevent->broadcast; 583 $httpevent->wait;
487 } 584 }
488 } 585 }
489 } 586 }
490 587
491 $hdr->{"Content-Range"} = "bytes $l-$h/$length"; 588 $hdr->{"Content-Range"} = "bytes $l-$h/$length";
503 600
504 $self->response(@code, $hdr, ""); 601 $self->response(@code, $hdr, "");
505 602
506 if ($self->{method} eq "GET") { 603 if ($self->{method} eq "GET") {
507 $self->{time} = $::NOW; 604 $self->{time} = $::NOW;
508
509 my $fudge = $queue->[0]->waiters;
510 $fudge = $fudge ? ($fudge+1)/$fudge : 1;
511
512 $queue->[1] *= $fudge;
513 my $transfer = $queue->[0]->guard;
514
515 if ($fudge != 1) {
516 $queue->[1] /= $fudge;
517 $queue->[1] = $queue->[1] * $::wait_factor
518 + ($::NOW - $self->{time}) * (1 - $::wait_factor);
519 }
520 $self->{time} = $::NOW; 605 $self->{written} = 0;
521 606
522 $self->{fh}->writable or return; 607 my $fh;
523 608
524 my ($fh, $buf, $r);
525 my $current = $Coro::current;
526 open $fh, "<", $self->{path} 609 open $fh, "<", $self->{path}
527 or die "$self->{path}: late open failure ($!)"; 610 or die "$self->{path}: late open failure ($!)";
528 611
529 $h -= $l - 1; 612 $h -= $l - 1;
530 613
531 if (0) { 614 if (0) { # !AIO
532 if ($l) { 615 if ($l) {
533 sysseek $fh, $l, 0; 616 sysseek $fh, $l, 0;
534 } 617 }
535 } 618 }
619
620 my $transfer = $queue->start_transfer($h);
621 my $locked;
622 my $bufsize = $::WAIT_BUFSIZE; # initial buffer size
536 623
537 while ($h > 0) { 624 while ($h > 0) {
538 if (0) { 625 unless ($locked) {
539 sysread $fh, $buf, $h > $::BUFSIZE ? $::BUFSIZE : $h 626 if ($locked ||= $transfer->try($::WAIT_INTERVAL)) {
627 $bufsize = $::BUFSIZE;
628 $self->{time} = $::NOW;
629 $self->{written} = 0;
630 }
631 }
632
633 if ($blocked{$self->{remote_id}}) {
634 $self->{h}{connection} = "close";
635 die bless {}, err::;
636 }
637
638 Coro::AIO::aio_read $fh, $l, ($h > $bufsize ? $bufsize : $h), my $buf, 0
540 or last; 639 or last;
541 } else { 640
542 aio_read($fh, $l, ($h > $::BUFSIZE ? $::BUFSIZE : $h), 641 $tbf->request (length $buf);
543 $buf, 0, sub {
544 $r = $_[0];
545 Coro::ready($current);
546 });
547 &Coro::schedule;
548 last unless $r;
549 }
550 my $w = syswrite $self->{fh}, $buf 642 my $w = syswrite $self->{fh}, $buf
551 or last; 643 or last;
552 $::written += $w; 644 $::written += $w;
553 $self->{written} += $w; 645 $self->{written} += $w;
554 $l += $r; 646 $l += $w;
555 } 647 }
556 648
557 close $fh; 649 close $fh;
558 } 650 }
559} 651}
560 652
5611; 6531
654

Diff Legend

- Removed lines
+ Added lines
< Changed lines
> Changed lines