ViewVC Help
View File | Revision Log | Show Annotations | Download File
/cvs/cvsroot/Coro/myhttpd/httpd.pl
(Generate patch)

Comparing cvsroot/Coro/myhttpd/httpd.pl (file contents):
Revision 1.45 by root, Sun Nov 11 03:32:19 2001 UTC vs.
Revision 1.66 by root, Mon Feb 25 03:21:09 2002 UTC

3use Coro::Event; 3use Coro::Event;
4use Coro::Socket; 4use Coro::Socket;
5use Coro::Signal; 5use Coro::Signal;
6 6
7use HTTP::Date; 7use HTTP::Date;
8use POSIX ();
9
10use Compress::Zlib ();
8 11
9no utf8; 12no utf8;
10use bytes; 13use bytes;
11 14
12# at least on my machine, this thingy serves files 15# at least on my machine, this thingy serves files
14# and quite a bit slower than thttpd :( 17# and quite a bit slower than thttpd :(
15 18
16$SIG{PIPE} = 'IGNORE'; 19$SIG{PIPE} = 'IGNORE';
17 20
18our $accesslog; 21our $accesslog;
22our $errorlog;
23
24our $NOW;
25our $HTTP_NOW;
26
27Event->timer(interval => 1, hard => 1, cb => sub {
28 $NOW = time;
29 $HTTP_NOW = time2str $NOW;
30})->now;
31
32if ($ERROR_LOG) {
33 use IO::Handle;
34 open $errorlog, ">>$ERROR_LOG"
35 or die "$ERROR_LOG: $!";
36 $errorlog->autoflush(1);
37}
19 38
20if ($ACCESS_LOG) { 39if ($ACCESS_LOG) {
21 use IO::Handle; 40 use IO::Handle;
22 open $accesslog, ">>$ACCESS_LOG" 41 open $accesslog, ">>$ACCESS_LOG"
23 or die "$ACCESS_LOG: $!"; 42 or die "$ACCESS_LOG: $!";
25} 44}
26 45
27sub slog { 46sub slog {
28 my $level = shift; 47 my $level = shift;
29 my $format = shift; 48 my $format = shift;
49 my $NOW = (POSIX::strftime "%Y-%m-%d %H:%M:%S", gmtime $::NOW);
30 printf "---: $format\n", @_; 50 printf "$NOW: $format\n", @_;
51 printf $errorlog "$NOW: $format\n", @_ if $errorlog;
31} 52}
32 53
33our $connections = new Coro::Semaphore $MAX_CONNECTS || 250; 54our $connections = new Coro::Semaphore $MAX_CONNECTS || 250;
34our $httpevent = new Coro::Signal; 55our $httpevent = new Coro::Signal;
35 56
36our $wait_factor = 0.95; 57our $queue_file = new transferqueue $MAX_TRANSFERS;
37 58our $queue_index = new transferqueue 10;
38our @transfers = (
39 [(new Coro::Semaphore $MAX_TRANSFERS_SMALL || 50), 1],
40 [(new Coro::Semaphore $MAX_TRANSFERS_LARGE || 50), 1],
41);
42 59
43my @newcons; 60my @newcons;
44my @pool; 61my @pool;
45 62
46# one "execution thread" 63# one "execution thread"
49 if (@newcons) { 66 if (@newcons) {
50 eval { 67 eval {
51 conn->new(@{pop @newcons})->handle; 68 conn->new(@{pop @newcons})->handle;
52 }; 69 };
53 slog 1, "$@" if $@ && !ref $@; 70 slog 1, "$@" if $@ && !ref $@;
71
72 $httpevent->broadcast; # only for testing, but doesn't matter much
73
54 $connections->up; 74 $connections->up;
55 } else { 75 } else {
56 last if @pool >= $MAX_POOL; 76 last if @pool >= $MAX_POOL;
57 push @pool, $Coro::current; 77 push @pool, $Coro::current;
58 schedule; 78 schedule;
100 or die "unable to start server"; 120 or die "unable to start server";
101 121
102 listen_on $http_port; 122 listen_on $http_port;
103} 123}
104 124
105our $NOW;
106our $HTTP_NOW;
107
108Event->timer(interval => 1, hard => 1, cb => sub {
109 $NOW = time;
110 $HTTP_NOW = time2str $NOW;
111})->now;
112
113package conn; 125package conn;
114 126
115use Socket; 127use Socket;
116use HTTP::Date; 128use HTTP::Date;
117use Convert::Scalar 'weaken'; 129use Convert::Scalar 'weaken';
149 my $peername = shift; 161 my $peername = shift;
150 my $self = bless { fh => $fh }, $class; 162 my $self = bless { fh => $fh }, $class;
151 my (undef, $iaddr) = unpack_sockaddr_in $peername 163 my (undef, $iaddr) = unpack_sockaddr_in $peername
152 or $self->err(500, "unable to decode peername"); 164 or $self->err(500, "unable to decode peername");
153 165
166 $self->{remote_addr} =
154 $self->{remote_addr} = inet_ntoa $iaddr; 167 $self->{remote_id} = inet_ntoa $iaddr;
168
155 $self->{time} = $::NOW; 169 $self->{time} = $::NOW;
156 170
171 weaken ($Coro::current->{conn} = $self);
172
157 $::conns++; 173 $::conns++;
174 $::maxconns = $::conns if $::conns > $::maxconns;
158 175
159 $self; 176 $self;
160} 177}
161 178
162sub DESTROY { 179sub DESTROY {
163 my $self = shift; 180 #my $self = shift;
164 $::conns--; 181 $::conns--;
165 $self->eoconn;
166}
167
168# end of connection
169sub eoconn {
170 my $self = shift;
171
172 # clean up hints
173 delete $conn{$self->{remote_id}}{$self*1};
174 delete $uri{$self->{remote_id}}{$self->{uri}}{$self*1};
175
176 $httpevent->broadcast;
177} 182}
178 183
179sub slog { 184sub slog {
180 my $self = shift; 185 my $self = shift;
181 main::slog($_[0], ($self->{remote_id} || $self->{remote_addr}) ."> $_[1]"); 186 main::slog($_[0], "$self->{remote_id}> $_[1]");
182} 187}
183 188
184sub response { 189sub response {
185 my ($self, $code, $msg, $hdr, $content) = @_; 190 my ($self, $code, $msg, $hdr, $content) = @_;
186 my $res = "HTTP/1.1 $code $msg\015\012"; 191 my $res = "HTTP/1.1 $code $msg\015\012";
192 my $GZ = "";
187 193
194 if (exists $hdr->{Connection}) {
195 if ($hdr->{Connection} =~ /close/) {
188 $self->{h}{connection} = "close" 196 $self->{h}{connection} = "close"
189 if exists $hdr->{Connection} # to avoid "empty" header lines due to vivification 197 }
190 and $hdr->{Connection} =~ /close/; 198 } else {
199 if ($self->{version} < 1.1) {
200 if ($self->{h}{connection} =~ /keep-alive/i) {
201 $hdr->{Connection} = "Keep-Alive";
202 } else {
203 $self->{h}{connection} = "close"
204 }
205 }
206 }
207
208 if ($self->{method} ne "HEAD"
209 && $self->{h}{"accept-encoding"} =~ /\bgzip\b/
210 && 400 < length $content
211 && $hdr->{"Content-Length"} == length $content
212 && !exists $hdr->{"Content-Encoding"}
213 ) {
214 my $orig = length $content;
215 $hdr->{"Content-Encoding"} = "gzip";
216 $content = Compress::Zlib::memGzip(\$content);
217 $hdr->{"Content-Length"} = length $content;
218 $GZ = sprintf "GZ%02d", 100 - 100*((length $content) / $orig);
219 }
191 220
192 $res .= "Date: $HTTP_NOW\015\012"; 221 $res .= "Date: $HTTP_NOW\015\012";
193 222
194 while (my ($h, $v) = each %$hdr) { 223 while (my ($h, $v) = each %$hdr) {
195 $res .= "$h: $v\015\012" 224 $res .= "$h: $v\015\012"
196 } 225 }
197 $res .= "\015\012"; 226 $res .= "\015\012";
198 227
199 $res .= $content if defined $content and $self->{method} ne "HEAD"; 228 $res .= $content if defined $content and $self->{method} ne "HEAD";
200 229
201 my $log = "$self->{remote_addr} \"$self->{uri}\" $code ".$hdr->{"Content-Length"}." \"$self->{h}{referer}\"\n"; 230 my $log = (POSIX::strftime "%Y-%m-%d %H:%M:%S", gmtime $::NOW).
231 " $self->{remote_id} \"$self->{uri}\" $code ".$hdr->{"Content-Length"}.$GZ.
232 " \"$self->{h}{referer}\"\n";
202 233
203 print $accesslog $log if $accesslog; 234 print $::accesslog $log if $::accesslog;
204 print STDERR $log; 235 print STDERR $log;
205 236
206 $self->{written} += 237 $self->{written} +=
207 print {$self->{fh}} $res; 238 print {$self->{fh}} $res;
208} 239}
267 my (%hdr, $h, $v); 298 my (%hdr, $h, $v);
268 299
269 $hdr{lc $1} .= ",$2" 300 $hdr{lc $1} .= ",$2"
270 while $req =~ /\G 301 while $req =~ /\G
271 ([^:\000-\040]+): 302 ([^:\000-\040]+):
272 [\008\040]* 303 [\011\040]*
273 ((?: [^\015\012]+ | \015\012[\008\040] )*) 304 ((?: [^\015\012]+ | \015\012[\011\040] )*)
274 \015\012 305 \015\012
275 /gxc; 306 /gxc;
276 307
277 $req =~ /\G\015\012$/ 308 $req =~ /\G\015\012$/
278 or $self->err(400, "bad request"); 309 or $self->err(400, "bad request");
290 $id .= "[".$self->{h}{"x-forwarded-for"}."]"; 321 $id .= "[".$self->{h}{"x-forwarded-for"}."]";
291 } 322 }
292 323
293 $self->{remote_id} = $id; 324 $self->{remote_id} = $id;
294 325
326 weaken (local $conn{$id}{$self*1} = $self);
327
295 if ($blocked{$id}) { 328 if ($blocked{$id}) {
296 $self->err_blocked($blocked{$id}) 329 $self->err_blocked
297 if $blocked{$id} > $::NOW; 330 if $blocked{$id}[0] > $::NOW;
298 331
299 delete $blocked{$id}; 332 delete $blocked{$id};
300 }
301
302 if (%{$conn{$id}} >= $::MAX_CONN_IP) {
303 my $delay = $::PER_TIMEOUT + $::NOW + 15;
304 while (%{$conn{$id}} >= $::MAX_CONN_IP) {
305 if ($delay < $::NOW) {
306 $self->slog(2, "blocked ip $id");
307 $self->err_blocked;
308 } else {
309 $httpevent->wait;
310 }
311 }
312 } 333 }
313 334
314 # find out server name and port 335 # find out server name and port
315 if ($self->{uri} =~ s/^http:\/\/([^\/?#]*)//i) { 336 if ($self->{uri} =~ s/^http:\/\/([^\/?#]*)//i) {
316 $host = $1; 337 $host = $1;
327 $host = inet_ntoa $host; 348 $host = inet_ntoa $host;
328 } 349 }
329 350
330 $self->{server_name} = $host; 351 $self->{server_name} = $host;
331 352
332 # enter ourselves into various lists
333 weaken ($conn{$id}{$self*1} = $self);
334 weaken ($uri{$id}{$self->{uri}}{$self*1} = $self); 353 weaken (local $uri{$id}{$self->{uri}}{$self*1} = $self);
335 354
336 eval { 355 eval {
337 $self->map_uri; 356 $self->map_uri;
338 $self->respond; 357 $self->respond;
339 }; 358 };
340 359
341 $self->eoconn;
342
343 die if $@ && !ref $@; 360 die if $@ && !ref $@;
344 361
345 last if $self->{h}{connection} =~ /close/ || $self->{version} < 1.1; 362 last if $self->{h}{connection} =~ /close/i;
346 363
347 $httpevent->broadcast; 364 $httpevent->broadcast;
348 365
349 $fh->timeout($::PER_TIMEOUT); 366 $fh->timeout($::PER_TIMEOUT);
350 } 367 }
368}
369
370sub block {
371 my $self = shift;
372
373 $blocked{$self->{remote_id}} = [$::NOW + $_[0], $_[1]];
374 $self->slog(2, "blocked ip $self->{remote_id}");
375 $self->err_blocked;
351} 376}
352 377
353# uri => path mapping 378# uri => path mapping
354sub map_uri { 379sub map_uri {
355 my $self = shift; 380 my $self = shift;
402 427
403sub respond { 428sub respond {
404 my $self = shift; 429 my $self = shift;
405 my $path = $self->{path}; 430 my $path = $self->{path};
406 431
407 stat $path 432 if ($self->{name} =~ s%^/internal/([^/]+)%%) {
408 or $self->err(404, "not found"); 433 if ($::internal{$1}) {
409 434 $::internal{$1}->($self);
410 $self->{stat} = [stat _];
411
412 # idiotic netscape sends idiotic headers AGAIN
413 my $ims = $self->{h}{"if-modified-since"} =~ /^([^;]+)/
414 ? str2time $1 : 0;
415
416 if (-d _ && -r _) {
417 # directory
418 if ($path !~ /\/$/) {
419 # create a redirect to get the trailing "/"
420 # we don't try to avoid the :80
421 $self->err(301, "moved permanently", { Location => "http://".$self->server_hostport."$self->{uri}/" });
422 } else { 435 } else {
423 $ims < $self->{stat}[9] 436 $self->err(404, "not found");
437 }
438 } else {
439
440 stat $path
424 or $self->err(304, "not modified"); 441 or $self->err(404, "not found");
425 442
426 if (-r "$path/index.html") { 443 $self->{stat} = [stat _];
427 # replace directory "size" by index.html filesize 444
428 $self->{stat}[7] = (stat ($self->{path} .= "/index.html"))[7]; 445 # idiotic netscape sends idiotic headers AGAIN
429 $self->handle_file; 446 my $ims = $self->{h}{"if-modified-since"} =~ /^([^;]+)/
447 ? str2time $1 : 0;
448
449 if (-d _ && -r _) {
450 # directory
451 if ($path !~ /\/$/) {
452 # create a redirect to get the trailing "/"
453 # we don't try to avoid the :80
454 $self->err(301, "moved permanently", { Location => "http://".$self->server_hostport."$self->{uri}/" });
430 } else { 455 } else {
456 $ims < $self->{stat}[9]
457 or $self->err(304, "not modified");
458
459 if (-r "$path/index.html") {
460 # replace directory "size" by index.html filesize
461 $self->{stat} = [stat ($self->{path} .= "/index.html")];
462 $self->handle_file($queue_index);
463 } else {
431 $self->handle_dir; 464 $self->handle_dir;
432 } 465 }
433 } 466 }
434 } elsif (-f _ && -r _) { 467 } elsif (-f _ && -r _) {
435 -x _ and $self->err(403, "forbidden"); 468 -x _ and $self->err(403, "forbidden");
469
470 if (keys %{$conn{$self->{remote_id}}} > $::MAX_TRANSFERS_IP) {
471 my $timeout = $::NOW + 10;
472 while (keys %{$conn{$self->{remote_id}}} > $::MAX_TRANSFERS_IP) {
473 if ($timeout < $::NOW) {
474 $self->block($::BLOCKTIME, "too many connections");
475 } else {
476 $httpevent->wait;
477 }
478 }
479 }
480
436 $self->handle_file; 481 $self->handle_file($queue_file);
437 } else { 482 } else {
438 $self->err(404, "not found"); 483 $self->err(404, "not found");
484 }
439 } 485 }
440} 486}
441 487
442sub handle_dir { 488sub handle_dir {
443 my $self = shift; 489 my $self = shift;
445 491
446 $self->response(200, "ok", 492 $self->response(200, "ok",
447 { 493 {
448 "Content-Type" => "text/html", 494 "Content-Type" => "text/html",
449 "Content-Length" => length $idx, 495 "Content-Length" => length $idx,
496 "Last-Modified" => time2str ($self->{stat}[9]),
450 }, 497 },
451 $idx); 498 $idx);
452} 499}
453 500
454sub handle_file { 501sub handle_file {
455 my $self = shift; 502 my ($self, $queue) = @_;
456 my $length = $self->{stat}[7]; 503 my $length = $self->{stat}[7];
457 my $queue = $::transfers[$length >= $::TRANSFER_SMALL];
458 my $hdr = { 504 my $hdr = {
459 "Last-Modified" => time2str ((stat _)[9]), 505 "Last-Modified" => time2str ((stat _)[9]),
460 }; 506 };
461 507
462 my @code = (200, "ok"); 508 my @code = (200, "ok");
479 $self->err(416, "not satisfiable", $hdr, ""); 525 $self->err(416, "not satisfiable", $hdr, "");
480 526
481satisfiable: 527satisfiable:
482 # check for segmented downloads 528 # check for segmented downloads
483 if ($l && $::NO_SEGMENTED) { 529 if ($l && $::NO_SEGMENTED) {
484 my $delay = $::NOW + $::PER_TIMEOUT + 15; 530 my $timeout = $::NOW + 15;
485 while (%{$uri{$self->{remote_id}}{$self->{uri}}} > 1) { 531 while (keys %{$uri{$self->{remote_id}}{$self->{uri}}} > 1) {
486 if ($delay <= $::NOW) { 532 if ($timeout <= $::NOW) {
533 $self->block($::BLOCKTIME, "segmented downloads are forbidden");
487 $self->err_segmented_download; 534 #$self->err_segmented_download;
488 } else { 535 } else {
489 $httpevent->broadcast; 536 $httpevent->wait;
490 } 537 }
491 } 538 }
492 } 539 }
493 540
494 $hdr->{"Content-Range"} = "bytes $l-$h/$length"; 541 $hdr->{"Content-Range"} = "bytes $l-$h/$length";
507 $self->response(@code, $hdr, ""); 554 $self->response(@code, $hdr, "");
508 555
509 if ($self->{method} eq "GET") { 556 if ($self->{method} eq "GET") {
510 $self->{time} = $::NOW; 557 $self->{time} = $::NOW;
511 558
512 my $fudge = $queue->[0]->waiters; 559 my $current = $Coro::current;
513 $fudge = $fudge ? ($fudge+1)/$fudge : 1;
514
515 $queue->[1] *= $fudge;
516 my $transfer = $queue->[0]->guard;
517
518 if ($fudge != 1) {
519 $queue->[1] /= $fudge;
520 $queue->[1] = $queue->[1] * $::wait_factor
521 + ($::NOW - $self->{time}) * (1 - $::wait_factor);
522 }
523 $self->{time} = $::NOW;
524
525 $self->{fh}->writable or return;
526 560
527 my ($fh, $buf, $r); 561 my ($fh, $buf, $r);
528 my $current = $Coro::current; 562
529 open $fh, "<", $self->{path} 563 open $fh, "<", $self->{path}
530 or die "$self->{path}: late open failure ($!)"; 564 or die "$self->{path}: late open failure ($!)";
531 565
532 $h -= $l - 1; 566 $h -= $l - 1;
533 567
534 if (0) { 568 if (0) { # !AIO
535 if ($l) { 569 if ($l) {
536 sysseek $fh, $l, 0; 570 sysseek $fh, $l, 0;
537 } 571 }
538 } 572 }
573
574 my $transfer = $queue->start_transfer($h);
575 my $locked;
576 my $bufsize = $::WAIT_BUFSIZE; # initial buffer size
539 577
540 while ($h > 0) { 578 while ($h > 0) {
579 unless ($locked) {
580 if ($locked ||= $transfer->try($::WAIT_INTERVAL)) {
581 $bufsize = $::BUFSIZE;
582 $self->{time} = $::NOW;
583 }
584 }
585
586 if ($blocked{$self->{remote_id}}) {
587 $self->{h}{connection} = "close";
588 die bless {}, err::;
589 }
590
541 if (0) { 591 if (0) { # !AIO
542 sysread $fh, $buf, $h > $::BUFSIZE ? $::BUFSIZE : $h 592 sysread $fh, $buf, $h > $bufsize ? $bufsize : $h
543 or last; 593 or last;
544 } else { 594 } else {
545 aio_read($fh, $l, ($h > $::BUFSIZE ? $::BUFSIZE : $h), 595 aio_read($fh, $l, ($h > $bufsize ? $bufsize : $h),
546 $buf, 0, sub { 596 $buf, 0, sub {
547 $r = $_[0]; 597 $r = $_[0];
548 Coro::ready($current); 598 Coro::ready($current);
549 }); 599 });
550 &Coro::schedule; 600 &Coro::schedule;

Diff Legend

Removed lines
+ Added lines
< Changed lines
> Changed lines