ViewVC Help
View File | Revision Log | Show Annotations | Download File
/cvs/Coro/myhttpd/httpd.pl
(Generate patch)

Comparing Coro/myhttpd/httpd.pl (file contents):
Revision 1.41 by root, Mon Sep 10 22:16:20 2001 UTC vs.
Revision 1.76 by root, Wed Jul 13 13:58:51 2005 UTC

1use Coro; 1use Coro;
2use Coro::Semaphore; 2use Coro::Semaphore;
3use Coro::Event; 3use Coro::Event;
4use Coro::Socket; 4use Coro::Socket;
5use Coro::Signal;
5 6
6use HTTP::Date; 7use HTTP::Date;
8use POSIX ();
9
10use Compress::Zlib ();
7 11
8no utf8; 12no utf8;
9use bytes; 13use bytes;
10 14
11# at least on my machine, this thingy serves files 15# at least on my machine, this thingy serves files
13# and quite a bit slower than thttpd :( 17# and quite a bit slower than thttpd :(
14 18
15$SIG{PIPE} = 'IGNORE'; 19$SIG{PIPE} = 'IGNORE';
16 20
17our $accesslog; 21our $accesslog;
22our $errorlog;
23
24our $NOW;
25our $HTTP_NOW;
26
27Event->timer(interval => 1, hard => 1, cb => sub {
28 $NOW = time;
29 $HTTP_NOW = time2str $NOW;
30})->now;
31
32if ($ERROR_LOG) {
33 use IO::Handle;
34 open $errorlog, ">>$ERROR_LOG"
35 or die "$ERROR_LOG: $!";
36 $errorlog->autoflush(1);
37}
18 38
19if ($ACCESS_LOG) { 39if ($ACCESS_LOG) {
20 use IO::Handle; 40 use IO::Handle;
21 open $accesslog, ">>$ACCESS_LOG" 41 open $accesslog, ">>$ACCESS_LOG"
22 or die "$ACCESS_LOG: $!"; 42 or die "$ACCESS_LOG: $!";
24} 44}
25 45
26sub slog { 46sub slog {
27 my $level = shift; 47 my $level = shift;
28 my $format = shift; 48 my $format = shift;
49 my $NOW = (POSIX::strftime "%Y-%m-%d %H:%M:%S", gmtime $::NOW);
29 printf "---: $format\n", @_; 50 printf "$NOW: $format\n", @_;
51 printf $errorlog "$NOW: $format\n", @_ if $errorlog;
30} 52}
31 53
32our $connections = new Coro::Semaphore $MAX_CONNECTS || 250; 54our $connections = new Coro::Semaphore $MAX_CONNECTS || 250;
55our $httpevent = new Coro::Signal;
33 56
34our $wait_factor = 0.95; 57our $queue_file = new transferqueue $MAX_TRANSFERS;
58our $queue_index = new transferqueue 10;
35 59
36our @transfers = ( 60our $tbf_top = new tbf rate => $TBF_RATE || 100000;
37 [(new Coro::Semaphore $MAX_TRANSFERS_SMALL || 50), 1], 61
38 [(new Coro::Semaphore $MAX_TRANSFERS_LARGE || 50), 1], 62my $unused_bytes = 0;
39); 63my $unused_last = time;
64
65sub unused_bandwidth {
66 $unused_bytes += $_[0];
67 if ($unused_last < $NOW - 30 && $unused_bytes / ($NOW - $unused_last) > 50000) {
68 $unused_last = $NOW;
69 $unused_bytes = 0;
70 $queue_file->force_wake_next;
71 slog 1, "forced filetransfer due to unused bandwidth";
72 }
73}
40 74
41my @newcons; 75my @newcons;
42my @pool; 76my @pool;
43 77
44# one "execution thread" 78# one "execution thread"
47 if (@newcons) { 81 if (@newcons) {
48 eval { 82 eval {
49 conn->new(@{pop @newcons})->handle; 83 conn->new(@{pop @newcons})->handle;
50 }; 84 };
51 slog 1, "$@" if $@ && !ref $@; 85 slog 1, "$@" if $@ && !ref $@;
86
87 $httpevent->broadcast; # only for testing, but doesn't matter much
88
52 $connections->up; 89 $connections->up;
53 } else { 90 } else {
54 last if @pool >= $MAX_POOL; 91 last if @pool >= $MAX_POOL;
55 push @pool, $Coro::current; 92 push @pool, $Coro::current;
56 schedule; 93 schedule;
73 if (@pool) { 110 if (@pool) {
74 (pop @pool)->ready; 111 (pop @pool)->ready;
75 } else { 112 } else {
76 async \&handler; 113 async \&handler;
77 } 114 }
78
79 } 115 }
80 }; 116 };
81} 117}
82 118
83my $http_port = new Coro::Socket 119my $http_port = new Coro::Socket
98 or die "unable to start server"; 134 or die "unable to start server";
99 135
100 listen_on $http_port; 136 listen_on $http_port;
101} 137}
102 138
103our $NOW;
104our $HTTP_NOW;
105
106Event->timer(interval => 1, hard => 1, cb => sub {
107 $NOW = time;
108 $HTTP_NOW = time2str $NOW;
109})->now;
110
111package conn; 139package conn;
112 140
113use Socket; 141use Socket;
114use HTTP::Date; 142use HTTP::Date;
115use Convert::Scalar 'weaken'; 143use Convert::Scalar 'weaken';
141 169
142read_mimetypes; 170read_mimetypes;
143 171
144sub new { 172sub new {
145 my $class = shift; 173 my $class = shift;
174 my $fh = shift;
146 my $peername = shift; 175 my $peername = shift;
147 my $fh = shift;
148 my $self = bless { fh => $fh }, $class; 176 my $self = bless { fh => $fh }, $class;
149 my (undef, $iaddr) = unpack_sockaddr_in $peername 177 my (undef, $iaddr) = unpack_sockaddr_in $peername
150 or $self->err(500, "unable to decode peername"); 178 or $self->err(500, "unable to decode peername");
151 179
180 $self->{remote_addr} =
152 $self->{remote_addr} = inet_ntoa $iaddr; 181 $self->{remote_id} = inet_ntoa $iaddr;
182
153 $self->{time} = $::NOW; 183 $self->{time} = $::NOW;
154 184
185 weaken ($Coro::current->{conn} = $self);
186
155 $::conns++; 187 $::conns++;
188 $::maxconns = $::conns if $::conns > $::maxconns;
156 189
157 $self; 190 $self;
158} 191}
159 192
160sub DESTROY { 193sub DESTROY {
161 my $self = shift; 194 #my $self = shift;
162 $::conns--; 195 $::conns--;
163 $self->eoconn;
164} 196}
165 197
166# end of connection 198sub prune_cache {
167sub eoconn { 199 my $hash = $_[0];
168 my $self = shift;
169 200
170 # clean up hints 201 for (keys %$hash) {
171 delete $conn{$self->{remote_id}}{$self*1}; 202 if (ref $hash->{$_} eq HASH::) {
172 delete $uri{$self->{remote_id}}{$self->{uri}}{$self*1}; 203 prune_cache($hash->{$_});
204 unless (scalar keys %{$hash->{$_}}) {
205 delete $hash->{$_};
206 $d2++;
207 }
208 }
209 }
173} 210}
211
212sub prune_caches {
213 prune_cache \%conn;
214 prune_cache \%uri;
215
216 for (keys %blocked) {
217 delete $blocked{$_} unless $blocked{$_}[0] > $::NOW;
218 }
219}
220
221Event->timer(interval => 60, cb => \&prune_caches);
174 222
175sub slog { 223sub slog {
176 my $self = shift; 224 my $self = shift;
177 main::slog($_[0], ($self->{remote_id} || $self->{remote_addr}) ."> $_[1]"); 225 main::slog($_[0], "$self->{remote_id}> $_[1]");
178} 226}
179 227
180sub response { 228sub response {
181 my ($self, $code, $msg, $hdr, $content) = @_; 229 my ($self, $code, $msg, $hdr, $content) = @_;
182 my $res = "HTTP/1.1 $code $msg\015\012"; 230 my $res = "HTTP/1.1 $code $msg\015\012";
231 my $GZ = "";
183 232
184 $self->{h}{connection} ||= $hdr->{Connection}; 233 if (exists $hdr->{Connection}) {
234 if ($hdr->{Connection} =~ /close/) {
235 $self->{h}{connection} = "close"
236 }
237 } else {
238 if ($self->{version} < 1.1) {
239 if ($self->{h}{connection} =~ /keep-alive/i) {
240 $hdr->{Connection} = "Keep-Alive";
241 } else {
242 $self->{h}{connection} = "close"
243 }
244 }
245 }
246
247 if ($self->{method} ne "HEAD"
248 && $self->{h}{"accept-encoding"} =~ /\bgzip\b/
249 && 400 < length $content
250 && $hdr->{"Content-Length"} == length $content
251 && !exists $hdr->{"Content-Encoding"}
252 ) {
253 my $orig = length $content;
254 $hdr->{"Content-Encoding"} = "gzip";
255 $content = Compress::Zlib::memGzip(\$content);
256 $hdr->{"Content-Length"} = length $content;
257 $GZ = sprintf "GZ%02d", 100 - 100*((length $content) / $orig);
258 }
185 259
186 $res .= "Date: $HTTP_NOW\015\012"; 260 $res .= "Date: $HTTP_NOW\015\012";
261 $res .= "Server: $::NAME\015\012";
187 262
188 while (my ($h, $v) = each %$hdr) { 263 while (my ($h, $v) = each %$hdr) {
189 $res .= "$h: $v\015\012" 264 $res .= "$h: $v\015\012"
190 } 265 }
191 $res .= "\015\012"; 266 $res .= "\015\012";
192 267
193 $res .= $content if defined $content and $self->{method} ne "HEAD"; 268 $res .= $content if defined $content and $self->{method} ne "HEAD";
194 269
195 my $log = "$self->{remote_addr} \"$self->{uri}\" $code ".$hdr->{"Content-Length"}." \"$self->{h}{referer}\"\n"; 270 my $log = (POSIX::strftime "%Y-%m-%d %H:%M:%S", gmtime $::NOW).
271 " $self->{remote_id} \"$self->{uri}\" $code ".$hdr->{"Content-Length"}.$GZ.
272 " \"$self->{h}{referer}\"\n";
196 273
197 print $accesslog $log if $accesslog; 274 print $::accesslog $log if $::accesslog;
198 print STDERR $log; 275 print STDERR $log;
199 276
200 $self->{written} += 277 $tbf_top->request(length $res, 1e6);
201 print {$self->{fh}} $res; 278 $self->{written} += print {$self->{fh}} $res;
202} 279}
203 280
204sub err { 281sub err {
205 my $self = shift; 282 my $self = shift;
206 my ($code, $msg, $hdr, $content) = @_; 283 my ($code, $msg, $hdr, $content) = @_;
261 my (%hdr, $h, $v); 338 my (%hdr, $h, $v);
262 339
263 $hdr{lc $1} .= ",$2" 340 $hdr{lc $1} .= ",$2"
264 while $req =~ /\G 341 while $req =~ /\G
265 ([^:\000-\040]+): 342 ([^:\000-\040]+):
266 [\008\040]* 343 [\011\040]*
267 ((?: [^\015\012]+ | \015\012[\008\040] )*) 344 ((?: [^\015\012]+ | \015\012[\011\040] )*)
268 \015\012 345 \015\012
269 /gxc; 346 /gxc;
270 347
271 $req =~ /\G\015\012$/ 348 $req =~ /\G\015\012$/
272 or $self->err(400, "bad request"); 349 or $self->err(400, "bad request");
284 $id .= "[".$self->{h}{"x-forwarded-for"}."]"; 361 $id .= "[".$self->{h}{"x-forwarded-for"}."]";
285 } 362 }
286 363
287 $self->{remote_id} = $id; 364 $self->{remote_id} = $id;
288 365
366 weaken (local $conn{$id}{$self*1} = $self);
367
289 if ($blocked{$id}) { 368 if ($blocked{$id}) {
290 $self->err_blocked($blocked{$id}) 369 $self->err_blocked
291 if $blocked{$id} > $::NOW; 370 if $blocked{$id}[0] > $::NOW;
292 371
293 delete $blocked{$id}; 372 delete $blocked{$id};
294 }
295
296 if (%{$conn{$id}} >= $::MAX_CONN_IP) {
297 my $delay = $::PER_TIMEOUT + 15;
298 while (%{$conn{$id}} >= $::MAX_CONN_IP) {
299 if ($delay <= 0) {
300 $self->slog(2, "blocked ip $id");
301 $self->err_blocked;
302 } else {
303 Coro::Event::do_timer(after => 4); $delay -= 4;
304 }
305 }
306 } 373 }
307 374
308 # find out server name and port 375 # find out server name and port
309 if ($self->{uri} =~ s/^http:\/\/([^\/?#]*)//i) { 376 if ($self->{uri} =~ s/^http:\/\/([^\/?#]*)//i) {
310 $host = $1; 377 $host = $1;
314 381
315 if (defined $host) { 382 if (defined $host) {
316 $self->{server_port} = $host =~ s/:([0-9]+)$// ? $1 : 80; 383 $self->{server_port} = $host =~ s/:([0-9]+)$// ? $1 : 80;
317 } else { 384 } else {
318 ($self->{server_port}, $host) 385 ($self->{server_port}, $host)
319 = unpack_sockaddr_in $self->{fh}->getsockname 386 = unpack_sockaddr_in $self->{fh}->sockname
320 or $self->err(500, "unable to get socket name"); 387 or $self->err(500, "unable to get socket name");
321 $host = inet_ntoa $host; 388 $host = inet_ntoa $host;
322 } 389 }
323 390
324 $self->{server_name} = $host; 391 $self->{server_name} = $host;
325 392
326 # enter ourselves into various lists
327 weaken ($conn{$id}{$self*1} = $self);
328 weaken ($uri{$id}{$self->{uri}}{$self*1} = $self); 393 weaken (local $uri{$id}{$self->{uri}}{$self*1} = $self);
329 394
330 eval { 395 eval {
331 $self->map_uri; 396 $self->map_uri;
332 $self->respond; 397 $self->respond;
333 }; 398 };
334 399
335 $self->eoconn;
336
337 die if $@ && !ref $@; 400 die if $@ && !ref $@;
338 401
339 last if $self->{h}{connection} =~ /close/ || $self->{version} < 1.1; 402 last if $self->{h}{connection} =~ /close/i;
403
404 $httpevent->broadcast;
340 405
341 $fh->timeout($::PER_TIMEOUT); 406 $fh->timeout($::PER_TIMEOUT);
342 } 407 }
408}
409
410sub block {
411 my $self = shift;
412
413 $blocked{$self->{remote_id}} = [$::NOW + $_[0], $_[1]];
414 $self->slog(2, "blocked ip $self->{remote_id}");
415 $self->err_blocked;
343} 416}
344 417
345# uri => path mapping 418# uri => path mapping
346sub map_uri { 419sub map_uri {
347 my $self = shift; 420 my $self = shift;
394 467
395sub respond { 468sub respond {
396 my $self = shift; 469 my $self = shift;
397 my $path = $self->{path}; 470 my $path = $self->{path};
398 471
399 stat $path 472 if ($self->{name} =~ s%^/internal/([^/]+)%%) {
400 or $self->err(404, "not found"); 473 if ($::internal{$1}) {
401 474 $::internal{$1}->($self);
402 $self->{stat} = [stat _];
403
404 # idiotic netscape sends idiotic headers AGAIN
405 my $ims = $self->{h}{"if-modified-since"} =~ /^([^;]+)/
406 ? str2time $1 : 0;
407
408 if (-d _ && -r _) {
409 # directory
410 if ($path !~ /\/$/) {
411 # create a redirect to get the trailing "/"
412 # we don't try to avoid the :80
413 $self->err(301, "moved permanently", { Location => "http://".$self->server_hostport."$self->{uri}/" });
414 } else { 475 } else {
415 $ims < $self->{stat}[9] 476 $self->err(404, "not found");
477 }
478 } else {
479
480 stat $path
416 or $self->err(304, "not modified"); 481 or $self->err(404, "not found");
417 482
418 if (-r "$path/index.html") { 483 $self->{stat} = [stat _];
419 $self->{path} .= "/index.html"; 484
420 $self->handle_file; 485 # idiotic netscape sends idiotic headers AGAIN
486 my $ims = $self->{h}{"if-modified-since"} =~ /^([^;]+)/
487 ? str2time $1 : 0;
488
489 if (-d _ && -r _) {
490 # directory
491 if ($path !~ /\/$/) {
492 # create a redirect to get the trailing "/"
493 # we don't try to avoid the :80
494 $self->err(301, "moved permanently", { Location => "http://".$self->server_hostport."$self->{uri}/" });
421 } else { 495 } else {
496 $ims < $self->{stat}[9]
497 or $self->err(304, "not modified");
498
499 if (-r "$path/index.html") {
500 # replace directory "size" by index.html filesize
501 $self->{stat} = [stat ($self->{path} .= "/index.html")];
502 $self->handle_file($queue_index, $tbf_top);
503 } else {
422 $self->handle_dir; 504 $self->handle_dir;
423 } 505 }
424 } 506 }
425 } elsif (-f _ && -r _) { 507 } elsif (-f _ && -r _) {
426 -x _ and $self->err(403, "forbidden"); 508 -x _ and $self->err(403, "forbidden");
427 $self->handle_file; 509
510 if (keys %{$conn{$self->{remote_id}}} > $::MAX_TRANSFERS_IP) {
511 my $timeout = $::NOW + 10;
512 while (keys %{$conn{$self->{remote_id}}} > $::MAX_TRANSFERS_IP) {
513 if ($timeout < $::NOW) {
514 $self->block($::BLOCKTIME, "too many connections");
515 } else {
516 $httpevent->wait;
517 }
518 }
519 }
520
521 $self->handle_file($queue_file, $tbf_top);
428 } else { 522 } else {
429 $self->err(404, "not found"); 523 $self->err(404, "not found");
524 }
430 } 525 }
431} 526}
432 527
433sub handle_dir { 528sub handle_dir {
434 my $self = shift; 529 my $self = shift;
435 my $idx = $self->diridx; 530 my $idx = $self->diridx;
436 531
437 $self->response(200, "ok", 532 $self->response(200, "ok",
438 { 533 {
439 "Content-Type" => "text/html", 534 "Content-Type" => "text/html; charset=utf-8",
440 "Content-Length" => length $idx, 535 "Content-Length" => length $idx,
536 "Last-Modified" => time2str ($self->{stat}[9]),
441 }, 537 },
442 $idx); 538 $idx);
443} 539}
444 540
445sub handle_file { 541sub handle_file {
446 my $self = shift; 542 my ($self, $queue, $tbf) = @_;
447 my $length = $self->{stat}[7]; 543 my $length = $self->{stat}[7];
448 my $queue = $::transfers[$length >= $::TRANSFER_SMALL];
449 my $hdr = { 544 my $hdr = {
450 "Last-Modified" => time2str ((stat _)[9]), 545 "Last-Modified" => time2str ((stat _)[9]),
546 "Accept-Ranges" => "bytes",
451 }; 547 };
452 548
453 my @code = (200, "ok"); 549 my @code = (200, "ok");
454 my ($l, $h); 550 my ($l, $h);
455 551
470 $self->err(416, "not satisfiable", $hdr, ""); 566 $self->err(416, "not satisfiable", $hdr, "");
471 567
472satisfiable: 568satisfiable:
473 # check for segmented downloads 569 # check for segmented downloads
474 if ($l && $::NO_SEGMENTED) { 570 if ($l && $::NO_SEGMENTED) {
475 my $delay = $::PER_TIMEOUT + 15; 571 my $timeout = $::NOW + 15;
476 while (%{$uri{$self->{remote_id}}{$self->{uri}}} > 1) { 572 while (keys %{$uri{$self->{remote_id}}{$self->{uri}}} > 1) {
477 if ($delay <= 0) { 573 if ($timeout <= $::NOW) {
574 $self->block($::BLOCKTIME, "segmented downloads are forbidden");
478 $self->err_segmented_download; 575 #$self->err_segmented_download;
479 } else { 576 } else {
480 Coro::Event::do_timer(after => 4); $delay -= 4; 577 $httpevent->wait;
481 } 578 }
482 } 579 }
483 } 580 }
484 581
485 $hdr->{"Content-Range"} = "bytes $l-$h/$length"; 582 $hdr->{"Content-Range"} = "bytes $l-$h/$length";
497 594
498 $self->response(@code, $hdr, ""); 595 $self->response(@code, $hdr, "");
499 596
500 if ($self->{method} eq "GET") { 597 if ($self->{method} eq "GET") {
501 $self->{time} = $::NOW; 598 $self->{time} = $::NOW;
502
503 my $fudge = $queue->[0]->waiters;
504 $fudge = $fudge ? ($fudge+1)/$fudge : 1;
505
506 $queue->[1] *= $fudge;
507 my $transfer = $queue->[0]->guard;
508
509 if ($fudge != 1) {
510 $queue->[1] /= $fudge;
511 $queue->[1] = $queue->[1] * $::wait_factor
512 + ($::NOW - $self->{time}) * (1 - $::wait_factor);
513 }
514 $self->{time} = $::NOW; 599 $self->{written} = 0;
515 600
516 $self->{fh}->writable or return; 601 my $current = $Coro::current;
517 602
518 my ($fh, $buf, $r); 603 my ($fh, $buf, $r);
519 my $current = $Coro::current; 604
520 open $fh, "<", $self->{path} 605 open $fh, "<", $self->{path}
521 or die "$self->{path}: late open failure ($!)"; 606 or die "$self->{path}: late open failure ($!)";
522 607
523 $h -= $l - 1; 608 $h -= $l - 1;
524 609
525 if (0) { 610 if (0) { # !AIO
526 if ($l) { 611 if ($l) {
527 sysseek $fh, $l, 0; 612 sysseek $fh, $l, 0;
528 } 613 }
529 } 614 }
615
616 my $transfer = $queue->start_transfer($h);
617 my $locked;
618 my $bufsize = $::WAIT_BUFSIZE; # initial buffer size
530 619
531 while ($h > 0) { 620 while ($h > 0) {
621 unless ($locked) {
622 if ($locked ||= $transfer->try($::WAIT_INTERVAL)) {
623 $bufsize = $::BUFSIZE;
624 $self->{time} = $::NOW;
625 $self->{written} = 0;
626 }
627 }
628
629 if ($blocked{$self->{remote_id}}) {
630 $self->{h}{connection} = "close";
631 die bless {}, err::;
632 }
633
532 if (0) { 634 if (0) { # !AIO
533 sysread $fh, $buf, $h > $::BUFSIZE ? $::BUFSIZE : $h 635 sysread $fh, $buf, $h > $bufsize ? $bufsize : $h
534 or last; 636 or last;
535 } else { 637 } else {
536 aio_read($fh, $l, ($h > $::BUFSIZE ? $::BUFSIZE : $h), 638 aio_read($fh, $l, ($h > $bufsize ? $bufsize : $h),
537 $buf, 0, sub { 639 $buf, 0, sub {
538 $r = $_[0]; 640 $r = $_[0];
539 Coro::ready($current); 641 Coro::ready($current);
540 }); 642 });
541 &Coro::schedule; 643 &Coro::schedule;
542 last unless $r; 644 last unless $r;
543 } 645 }
646
647 $tbf->request(length $buf);
544 my $w = syswrite $self->{fh}, $buf 648 my $w = syswrite $self->{fh}, $buf
545 or last; 649 or last;
546 $::written += $w; 650 $::written += $w;
547 $self->{written} += $w; 651 $self->{written} += $w;
548 $l += $r; 652 $l += $r;

Diff Legend

Removed lines
+ Added lines
< Changed lines
> Changed lines