ViewVC Help
View File | Revision Log | Show Annotations | Download File
/cvs/Coro/myhttpd/httpd.pl
(Generate patch)

Comparing Coro/myhttpd/httpd.pl (file contents):
Revision 1.47 by root, Tue Nov 20 01:56:21 2001 UTC vs.
Revision 1.67 by root, Sun May 19 21:00:47 2002 UTC

5use Coro::Signal; 5use Coro::Signal;
6 6
7use HTTP::Date; 7use HTTP::Date;
8use POSIX (); 8use POSIX ();
9 9
10use Compress::Zlib ();
11
10no utf8; 12no utf8;
11use bytes; 13use bytes;
12 14
13# at least on my machine, this thingy serves files 15# at least on my machine, this thingy serves files
14# quite a bit faster than apache, ;) 16# quite a bit faster than apache, ;)
15# and quite a bit slower than thttpd :( 17# and quite a bit slower than thttpd :(
16 18
17$SIG{PIPE} = 'IGNORE'; 19$SIG{PIPE} = 'IGNORE';
18 20
19our $accesslog; 21our $accesslog;
22our $errorlog;
23
24our $NOW;
25our $HTTP_NOW;
26
27Event->timer(interval => 1, hard => 1, cb => sub {
28 $NOW = time;
29 $HTTP_NOW = time2str $NOW;
30})->now;
31
32if ($ERROR_LOG) {
33 use IO::Handle;
34 open $errorlog, ">>$ERROR_LOG"
35 or die "$ERROR_LOG: $!";
36 $errorlog->autoflush(1);
37}
20 38
21if ($ACCESS_LOG) { 39if ($ACCESS_LOG) {
22 use IO::Handle; 40 use IO::Handle;
23 open $accesslog, ">>$ACCESS_LOG" 41 open $accesslog, ">>$ACCESS_LOG"
24 or die "$ACCESS_LOG: $!"; 42 or die "$ACCESS_LOG: $!";
26} 44}
27 45
28sub slog { 46sub slog {
29 my $level = shift; 47 my $level = shift;
30 my $format = shift; 48 my $format = shift;
49 my $NOW = (POSIX::strftime "%Y-%m-%d %H:%M:%S", gmtime $::NOW);
31 printf "---: $format\n", @_; 50 printf "$NOW: $format\n", @_;
51 printf $errorlog "$NOW: $format\n", @_ if $errorlog;
32} 52}
33 53
34our $connections = new Coro::Semaphore $MAX_CONNECTS || 250; 54our $connections = new Coro::Semaphore $MAX_CONNECTS || 250;
35our $httpevent = new Coro::Signal; 55our $httpevent = new Coro::Signal;
36 56
37our $wait_factor = 0.95; 57our $queue_file = new transferqueue $MAX_TRANSFERS;
58our $queue_index = new transferqueue 10;
38 59
39our @transfers = ( 60our $tbf_top = new tbf rate => 200000;
40 [(new Coro::Semaphore $MAX_TRANSFERS_SMALL || 50), 1],
41 [(new Coro::Semaphore $MAX_TRANSFERS_LARGE || 50), 1],
42);
43 61
44my @newcons; 62my @newcons;
45my @pool; 63my @pool;
46 64
47# one "execution thread" 65# one "execution thread"
50 if (@newcons) { 68 if (@newcons) {
51 eval { 69 eval {
52 conn->new(@{pop @newcons})->handle; 70 conn->new(@{pop @newcons})->handle;
53 }; 71 };
54 slog 1, "$@" if $@ && !ref $@; 72 slog 1, "$@" if $@ && !ref $@;
73
74 $httpevent->broadcast; # only for testing, but doesn't matter much
75
55 $connections->up; 76 $connections->up;
56 } else { 77 } else {
57 last if @pool >= $MAX_POOL; 78 last if @pool >= $MAX_POOL;
58 push @pool, $Coro::current; 79 push @pool, $Coro::current;
59 schedule; 80 schedule;
101 or die "unable to start server"; 122 or die "unable to start server";
102 123
103 listen_on $http_port; 124 listen_on $http_port;
104} 125}
105 126
106our $NOW;
107our $HTTP_NOW;
108
109Event->timer(interval => 1, hard => 1, cb => sub {
110 $NOW = time;
111 $HTTP_NOW = time2str $NOW;
112})->now;
113
114package conn; 127package conn;
115 128
116use Socket; 129use Socket;
117use HTTP::Date; 130use HTTP::Date;
118use Convert::Scalar 'weaken'; 131use Convert::Scalar 'weaken';
150 my $peername = shift; 163 my $peername = shift;
151 my $self = bless { fh => $fh }, $class; 164 my $self = bless { fh => $fh }, $class;
152 my (undef, $iaddr) = unpack_sockaddr_in $peername 165 my (undef, $iaddr) = unpack_sockaddr_in $peername
153 or $self->err(500, "unable to decode peername"); 166 or $self->err(500, "unable to decode peername");
154 167
168 $self->{remote_addr} =
155 $self->{remote_addr} = inet_ntoa $iaddr; 169 $self->{remote_id} = inet_ntoa $iaddr;
170
156 $self->{time} = $::NOW; 171 $self->{time} = $::NOW;
157 172
173 weaken ($Coro::current->{conn} = $self);
174
158 $::conns++; 175 $::conns++;
176 $::maxconns = $::conns if $::conns > $::maxconns;
159 177
160 $self; 178 $self;
161} 179}
162 180
163sub DESTROY { 181sub DESTROY {
164 my $self = shift; 182 #my $self = shift;
165 $::conns--; 183 $::conns--;
166 $self->eoconn;
167}
168
169# end of connection
170sub eoconn {
171 my $self = shift;
172
173 # clean up hints
174 delete $conn{$self->{remote_id}}{$self*1};
175 delete $uri{$self->{remote_id}}{$self->{uri}}{$self*1};
176
177 $httpevent->broadcast;
178} 184}
179 185
180sub slog { 186sub slog {
181 my $self = shift; 187 my $self = shift;
182 main::slog($_[0], ($self->{remote_id} || $self->{remote_addr}) ."> $_[1]"); 188 main::slog($_[0], "$self->{remote_id}> $_[1]");
183} 189}
184 190
185sub response { 191sub response {
186 my ($self, $code, $msg, $hdr, $content) = @_; 192 my ($self, $code, $msg, $hdr, $content) = @_;
187 my $res = "HTTP/1.1 $code $msg\015\012"; 193 my $res = "HTTP/1.1 $code $msg\015\012";
194 my $GZ = "";
188 195
189 if (exists $hdr->{Connection}) { 196 if (exists $hdr->{Connection}) {
190 if ($hdr->{Connection} =~ /close/) { 197 if ($hdr->{Connection} =~ /close/) {
191 $self->{h}{connection} = "close" 198 $self->{h}{connection} = "close"
192 } 199 }
198 $self->{h}{connection} = "close" 205 $self->{h}{connection} = "close"
199 } 206 }
200 } 207 }
201 } 208 }
202 209
210 if ($self->{method} ne "HEAD"
211 && $self->{h}{"accept-encoding"} =~ /\bgzip\b/
212 && 400 < length $content
213 && $hdr->{"Content-Length"} == length $content
214 && !exists $hdr->{"Content-Encoding"}
215 ) {
216 my $orig = length $content;
217 $hdr->{"Content-Encoding"} = "gzip";
218 $content = Compress::Zlib::memGzip(\$content);
219 $hdr->{"Content-Length"} = length $content;
220 $GZ = sprintf "GZ%02d", 100 - 100*((length $content) / $orig);
221 }
222
203 $res .= "Date: $HTTP_NOW\015\012"; 223 $res .= "Date: $HTTP_NOW\015\012";
204 224
205 while (my ($h, $v) = each %$hdr) { 225 while (my ($h, $v) = each %$hdr) {
206 $res .= "$h: $v\015\012" 226 $res .= "$h: $v\015\012"
207 } 227 }
208 $res .= "\015\012"; 228 $res .= "\015\012";
209 229
210 $res .= $content if defined $content and $self->{method} ne "HEAD"; 230 $res .= $content if defined $content and $self->{method} ne "HEAD";
211 231
212 my $log = (POSIX::strftime "%Y-%m-%d %H:%M:%S", gmtime $NOW). 232 my $log = (POSIX::strftime "%Y-%m-%d %H:%M:%S", gmtime $::NOW).
213 " $self->{remote_addr} \"$self->{uri}\" $code ".$hdr->{"Content-Length"}." \"$self->{h}{referer}\"\n"; 233 " $self->{remote_id} \"$self->{uri}\" $code ".$hdr->{"Content-Length"}.$GZ.
234 " \"$self->{h}{referer}\"\n";
214 235
215 print $accesslog $log if $accesslog; 236 print $::accesslog $log if $::accesslog;
216 print STDERR $log; 237 print STDERR $log;
217 238
218 $self->{written} += 239 $tbf_top->request(length $res, 1e6);
219 print {$self->{fh}} $res; 240 $self->{written} += print {$self->{fh}} $res;
220} 241}
221 242
222sub err { 243sub err {
223 my $self = shift; 244 my $self = shift;
224 my ($code, $msg, $hdr, $content) = @_; 245 my ($code, $msg, $hdr, $content) = @_;
279 my (%hdr, $h, $v); 300 my (%hdr, $h, $v);
280 301
281 $hdr{lc $1} .= ",$2" 302 $hdr{lc $1} .= ",$2"
282 while $req =~ /\G 303 while $req =~ /\G
283 ([^:\000-\040]+): 304 ([^:\000-\040]+):
284 [\008\040]* 305 [\011\040]*
285 ((?: [^\015\012]+ | \015\012[\008\040] )*) 306 ((?: [^\015\012]+ | \015\012[\011\040] )*)
286 \015\012 307 \015\012
287 /gxc; 308 /gxc;
288 309
289 $req =~ /\G\015\012$/ 310 $req =~ /\G\015\012$/
290 or $self->err(400, "bad request"); 311 or $self->err(400, "bad request");
302 $id .= "[".$self->{h}{"x-forwarded-for"}."]"; 323 $id .= "[".$self->{h}{"x-forwarded-for"}."]";
303 } 324 }
304 325
305 $self->{remote_id} = $id; 326 $self->{remote_id} = $id;
306 327
328 weaken (local $conn{$id}{$self*1} = $self);
329
307 if ($blocked{$id}) { 330 if ($blocked{$id}) {
308 $self->err_blocked($blocked{$id}) 331 $self->err_blocked
309 if $blocked{$id} > $::NOW; 332 if $blocked{$id}[0] > $::NOW;
310 333
311 delete $blocked{$id}; 334 delete $blocked{$id};
312 }
313
314 if (%{$conn{$id}} >= $::MAX_CONN_IP) {
315 my $delay = $::PER_TIMEOUT + $::NOW + 15;
316 while (%{$conn{$id}} >= $::MAX_CONN_IP) {
317 if ($delay < $::NOW) {
318 $self->slog(2, "blocked ip $id");
319 $self->err_blocked;
320 } else {
321 $httpevent->wait;
322 }
323 }
324 } 335 }
325 336
326 # find out server name and port 337 # find out server name and port
327 if ($self->{uri} =~ s/^http:\/\/([^\/?#]*)//i) { 338 if ($self->{uri} =~ s/^http:\/\/([^\/?#]*)//i) {
328 $host = $1; 339 $host = $1;
339 $host = inet_ntoa $host; 350 $host = inet_ntoa $host;
340 } 351 }
341 352
342 $self->{server_name} = $host; 353 $self->{server_name} = $host;
343 354
344 # enter ourselves into various lists
345 weaken ($conn{$id}{$self*1} = $self);
346 weaken ($uri{$id}{$self->{uri}}{$self*1} = $self); 355 weaken (local $uri{$id}{$self->{uri}}{$self*1} = $self);
347 356
348 eval { 357 eval {
349 $self->map_uri; 358 $self->map_uri;
350 $self->respond; 359 $self->respond;
351 }; 360 };
352 361
353 $self->eoconn;
354
355 die if $@ && !ref $@; 362 die if $@ && !ref $@;
356 363
357 last if $self->{h}{connection} =~ /close/; 364 last if $self->{h}{connection} =~ /close/i;
358 365
359 $httpevent->broadcast; 366 $httpevent->broadcast;
360 367
361 $fh->timeout($::PER_TIMEOUT); 368 $fh->timeout($::PER_TIMEOUT);
362 } 369 }
370}
371
372sub block {
373 my $self = shift;
374
375 $blocked{$self->{remote_id}} = [$::NOW + $_[0], $_[1]];
376 $self->slog(2, "blocked ip $self->{remote_id}");
377 $self->err_blocked;
363} 378}
364 379
365# uri => path mapping 380# uri => path mapping
366sub map_uri { 381sub map_uri {
367 my $self = shift; 382 my $self = shift;
414 429
415sub respond { 430sub respond {
416 my $self = shift; 431 my $self = shift;
417 my $path = $self->{path}; 432 my $path = $self->{path};
418 433
419 stat $path 434 if ($self->{name} =~ s%^/internal/([^/]+)%%) {
420 or $self->err(404, "not found"); 435 if ($::internal{$1}) {
421 436 $::internal{$1}->($self);
422 $self->{stat} = [stat _];
423
424 # idiotic netscape sends idiotic headers AGAIN
425 my $ims = $self->{h}{"if-modified-since"} =~ /^([^;]+)/
426 ? str2time $1 : 0;
427
428 if (-d _ && -r _) {
429 # directory
430 if ($path !~ /\/$/) {
431 # create a redirect to get the trailing "/"
432 # we don't try to avoid the :80
433 $self->err(301, "moved permanently", { Location => "http://".$self->server_hostport."$self->{uri}/" });
434 } else { 437 } else {
435 $ims < $self->{stat}[9] 438 $self->err(404, "not found");
439 }
440 } else {
441
442 stat $path
436 or $self->err(304, "not modified"); 443 or $self->err(404, "not found");
437 444
438 if (-r "$path/index.html") { 445 $self->{stat} = [stat _];
439 # replace directory "size" by index.html filesize 446
440 $self->{stat}[7] = (stat ($self->{path} .= "/index.html"))[7]; 447 # idiotic netscape sends idiotic headers AGAIN
441 $self->handle_file; 448 my $ims = $self->{h}{"if-modified-since"} =~ /^([^;]+)/
449 ? str2time $1 : 0;
450
451 if (-d _ && -r _) {
452 # directory
453 if ($path !~ /\/$/) {
454 # create a redirect to get the trailing "/"
455 # we don't try to avoid the :80
456 $self->err(301, "moved permanently", { Location => "http://".$self->server_hostport."$self->{uri}/" });
442 } else { 457 } else {
458 $ims < $self->{stat}[9]
459 or $self->err(304, "not modified");
460
461 if (-r "$path/index.html") {
462 # replace directory "size" by index.html filesize
463 $self->{stat} = [stat ($self->{path} .= "/index.html")];
464 $self->handle_file($queue_index, $tbf_top);
465 } else {
443 $self->handle_dir; 466 $self->handle_dir;
444 } 467 }
445 } 468 }
446 } elsif (-f _ && -r _) { 469 } elsif (-f _ && -r _) {
447 -x _ and $self->err(403, "forbidden"); 470 -x _ and $self->err(403, "forbidden");
448 $self->handle_file; 471
472 if (keys %{$conn{$self->{remote_id}}} > $::MAX_TRANSFERS_IP) {
473 my $timeout = $::NOW + 10;
474 while (keys %{$conn{$self->{remote_id}}} > $::MAX_TRANSFERS_IP) {
475 if ($timeout < $::NOW) {
476 $self->block($::BLOCKTIME, "too many connections");
477 } else {
478 $httpevent->wait;
479 }
480 }
481 }
482
483 $self->handle_file($queue_file, $tbf_top);
449 } else { 484 } else {
450 $self->err(404, "not found"); 485 $self->err(404, "not found");
486 }
451 } 487 }
452} 488}
453 489
454sub handle_dir { 490sub handle_dir {
455 my $self = shift; 491 my $self = shift;
457 493
458 $self->response(200, "ok", 494 $self->response(200, "ok",
459 { 495 {
460 "Content-Type" => "text/html", 496 "Content-Type" => "text/html",
461 "Content-Length" => length $idx, 497 "Content-Length" => length $idx,
462 "Last-Modified" => time2str ((stat _)[9]), 498 "Last-Modified" => time2str ($self->{stat}[9]),
463 }, 499 },
464 $idx); 500 $idx);
465} 501}
466 502
467sub handle_file { 503sub handle_file {
468 my $self = shift; 504 my ($self, $queue, $tbf) = @_;
469 my $length = $self->{stat}[7]; 505 my $length = $self->{stat}[7];
470 my $queue = $::transfers[$length >= $::TRANSFER_SMALL];
471 my $hdr = { 506 my $hdr = {
472 "Last-Modified" => time2str ((stat _)[9]), 507 "Last-Modified" => time2str ((stat _)[9]),
473 }; 508 };
474 509
475 my @code = (200, "ok"); 510 my @code = (200, "ok");
492 $self->err(416, "not satisfiable", $hdr, ""); 527 $self->err(416, "not satisfiable", $hdr, "");
493 528
494satisfiable: 529satisfiable:
495 # check for segmented downloads 530 # check for segmented downloads
496 if ($l && $::NO_SEGMENTED) { 531 if ($l && $::NO_SEGMENTED) {
497 my $delay = $::NOW + $::PER_TIMEOUT + 15; 532 my $timeout = $::NOW + 15;
498 while (%{$uri{$self->{remote_id}}{$self->{uri}}} > 1) { 533 while (keys %{$uri{$self->{remote_id}}{$self->{uri}}} > 1) {
499 if ($delay <= $::NOW) { 534 if ($timeout <= $::NOW) {
535 $self->block($::BLOCKTIME, "segmented downloads are forbidden");
500 $self->err_segmented_download; 536 #$self->err_segmented_download;
501 } else { 537 } else {
502 $httpevent->wait; 538 $httpevent->wait;
503 } 539 }
504 } 540 }
505 } 541 }
520 $self->response(@code, $hdr, ""); 556 $self->response(@code, $hdr, "");
521 557
522 if ($self->{method} eq "GET") { 558 if ($self->{method} eq "GET") {
523 $self->{time} = $::NOW; 559 $self->{time} = $::NOW;
524 560
525 my $fudge = $queue->[0]->waiters; 561 my $current = $Coro::current;
526 $fudge = $fudge ? ($fudge+1)/$fudge : 1;
527
528 $queue->[1] *= $fudge;
529 my $transfer = $queue->[0]->guard;
530
531 if ($fudge != 1) {
532 $queue->[1] /= $fudge;
533 $queue->[1] = $queue->[1] * $::wait_factor
534 + ($::NOW - $self->{time}) * (1 - $::wait_factor);
535 }
536 $self->{time} = $::NOW;
537
538 $self->{fh}->writable or return;
539 562
540 my ($fh, $buf, $r); 563 my ($fh, $buf, $r);
541 my $current = $Coro::current; 564
542 open $fh, "<", $self->{path} 565 open $fh, "<", $self->{path}
543 or die "$self->{path}: late open failure ($!)"; 566 or die "$self->{path}: late open failure ($!)";
544 567
545 $h -= $l - 1; 568 $h -= $l - 1;
546 569
547 if (0) { 570 if (0) { # !AIO
548 if ($l) { 571 if ($l) {
549 sysseek $fh, $l, 0; 572 sysseek $fh, $l, 0;
550 } 573 }
551 } 574 }
575
576 my $transfer = $queue->start_transfer($h);
577 my $locked;
578 my $bufsize = $::WAIT_BUFSIZE; # initial buffer size
552 579
553 while ($h > 0) { 580 while ($h > 0) {
581 unless ($locked) {
582 if ($locked ||= $transfer->try($::WAIT_INTERVAL)) {
583 $bufsize = $::BUFSIZE;
584 $self->{time} = $::NOW;
585 }
586 }
587
588 if ($blocked{$self->{remote_id}}) {
589 $self->{h}{connection} = "close";
590 die bless {}, err::;
591 }
592
554 if (0) { 593 if (0) { # !AIO
555 sysread $fh, $buf, $h > $::BUFSIZE ? $::BUFSIZE : $h 594 sysread $fh, $buf, $h > $bufsize ? $bufsize : $h
556 or last; 595 or last;
557 } else { 596 } else {
558 aio_read($fh, $l, ($h > $::BUFSIZE ? $::BUFSIZE : $h), 597 aio_read($fh, $l, ($h > $bufsize ? $bufsize : $h),
559 $buf, 0, sub { 598 $buf, 0, sub {
560 $r = $_[0]; 599 $r = $_[0];
561 Coro::ready($current); 600 Coro::ready($current);
562 }); 601 });
563 &Coro::schedule; 602 &Coro::schedule;
564 last unless $r; 603 last unless $r;
565 } 604 }
605
606 $tbf->request(length $buf);
566 my $w = syswrite $self->{fh}, $buf 607 my $w = syswrite $self->{fh}, $buf
567 or last; 608 or last;
568 $::written += $w; 609 $::written += $w;
569 $self->{written} += $w; 610 $self->{written} += $w;
570 $l += $r; 611 $l += $r;

Diff Legend

Removed lines
+ Added lines
< Changed lines
> Changed lines