ViewVC Help
View File | Revision Log | Show Annotations | Download File
/cvs/cvsroot/Coro/myhttpd/httpd.pl
(Generate patch)

Comparing cvsroot/Coro/myhttpd/httpd.pl (file contents):
Revision 1.29 by root, Sat Aug 25 15:14:03 2001 UTC vs.
Revision 1.52 by root, Fri Nov 30 05:11:23 2001 UTC

1use Coro; 1use Coro;
2use Coro::Semaphore; 2use Coro::Semaphore;
3use Coro::Event; 3use Coro::Event;
4use Coro::Socket; 4use Coro::Socket;
5use Coro::Signal;
6
7use HTTP::Date;
8use POSIX ();
5 9
6no utf8; 10no utf8;
7use bytes; 11use bytes;
8 12
9# at least on my machine, this thingy serves files 13# at least on my machine, this thingy serves files
25 my $level = shift; 29 my $level = shift;
26 my $format = shift; 30 my $format = shift;
27 printf "---: $format\n", @_; 31 printf "---: $format\n", @_;
28} 32}
29 33
30my $connections = new Coro::Semaphore $MAX_CONNECTS; 34our $connections = new Coro::Semaphore $MAX_CONNECTS || 250;
35our $httpevent = new Coro::Signal;
36
37our $wait_factor = 0.95;
38
39our $queue_small = new transferqueue $MAX_TRANSFERS_SMALL;
40our $queue_large = new transferqueue $MAX_TRANSFERS_LARGE;
41our $queue_index = new transferqueue 5;
31 42
32my @newcons; 43my @newcons;
33my @pool; 44my @pool;
34 45
35# one "execution thread" 46# one "execution thread"
36sub handler { 47sub handler {
37 while () { 48 while () {
38 my $new = pop @newcons;
39 if ($new) { 49 if (@newcons) {
40 eval { 50 eval {
41 conn->new(@$new)->handle; 51 conn->new(@{pop @newcons})->handle;
42 }; 52 };
43 slog 1, "$@" if $@ && !ref $@; 53 slog 1, "$@" if $@ && !ref $@;
44 $connections->up; 54 $connections->up;
45 } else { 55 } else {
46 last if @pool >= $MAX_POOL; 56 last if @pool >= $MAX_POOL;
48 schedule; 58 schedule;
49 } 59 }
50 } 60 }
51} 61}
52 62
63sub listen_on {
64 my $listen = $_[0];
65
66 push @listen_sockets, $listen;
67
68 # the "main thread"
69 async {
70 slog 1, "accepting connections";
71 while () {
72 $connections->down;
73 push @newcons, [$listen->accept];
74 #slog 3, "accepted @$connections ".scalar(@pool);
75 if (@pool) {
76 (pop @pool)->ready;
77 } else {
78 async \&handler;
79 }
80
81 }
82 };
83}
84
53my $http_port = new Coro::Socket 85my $http_port = new Coro::Socket
54 LocalAddr => $SERVER_HOST, 86 LocalAddr => $SERVER_HOST,
55 LocalPort => $SERVER_PORT, 87 LocalPort => $SERVER_PORT,
56 ReuseAddr => 1, 88 ReuseAddr => 1,
57 Listen => 50, 89 Listen => 50,
58 or die "unable to start server"; 90 or die "unable to start server";
59 91
60push @listen_sockets, $http_port; 92listen_on $http_port;
61 93
62# the "main thread" 94if ($SERVER_PORT2) {
63async { 95 my $http_port = new Coro::Socket
64 slog 1, "accepting connections"; 96 LocalAddr => $SERVER_HOST,
65 while () { 97 LocalPort => $SERVER_PORT2,
66 $connections->down; 98 ReuseAddr => 1,
67 push @newcons, [$http_port->accept]; 99 Listen => 50,
68 #slog 3, "accepted @$connections ".scalar(@pool); 100 or die "unable to start server";
101
102 listen_on $http_port;
103}
104
105our $NOW;
106our $HTTP_NOW;
107
108Event->timer(interval => 1, hard => 1, cb => sub {
69 $::NOW = time; 109 $NOW = time;
70 if (@pool) { 110 $HTTP_NOW = time2str $NOW;
71 (pop @pool)->ready; 111})->now;
72 } else {
73 async \&handler;
74 }
75
76 }
77};
78 112
79package conn; 113package conn;
80 114
81use Socket; 115use Socket;
82use HTTP::Date; 116use HTTP::Date;
83use Convert::Scalar 'weaken'; 117use Convert::Scalar 'weaken';
84use Linux::AIO; 118use Linux::AIO;
85 119
86Linux::AIO::min_parallel $::AIO_PARALLEL; 120Linux::AIO::min_parallel $::AIO_PARALLEL;
87
88my $aio_requests = new Coro::Semaphore $::AIO_PARALLEL * 4;
89 121
90Event->io(fd => Linux::AIO::poll_fileno, 122Event->io(fd => Linux::AIO::poll_fileno,
91 poll => 'r', async => 1, 123 poll => 'r', async => 1,
92 cb => \&Linux::AIO::poll_cb); 124 cb => \&Linux::AIO::poll_cb);
93 125
111 143
112read_mimetypes; 144read_mimetypes;
113 145
114sub new { 146sub new {
115 my $class = shift; 147 my $class = shift;
148 my $fh = shift;
116 my $peername = shift; 149 my $peername = shift;
117 my $fh = shift;
118 my $self = bless { fh => $fh }, $class; 150 my $self = bless { fh => $fh }, $class;
119 my (undef, $iaddr) = unpack_sockaddr_in $peername 151 my (undef, $iaddr) = unpack_sockaddr_in $peername
120 or $self->err(500, "unable to decode peername"); 152 or $self->err(500, "unable to decode peername");
121 153
154 $self->{remote_addr} =
122 $self->{remote_addr} = inet_ntoa $iaddr; 155 $self->{remote_id} = inet_ntoa $iaddr;
123 $self->{time} = $::NOW; 156 $self->{time} = $::NOW;
124 157
125 # enter ourselves into various lists 158 weaken ($Coro::current->{conn} = $self);
126 weaken ($conn{$self->{remote_addr}}{$self*1} = $self);
127 159
128 $::conns++; 160 $::conns++;
129 161
130 $self; 162 $self;
131} 163}
132 164
133sub DESTROY { 165sub DESTROY {
134 my $self = shift; 166 my $self = shift;
135
136 $::conns--; 167 $::conns--;
137
138 $self->eoconn; 168 $self->eoconn;
139 delete $conn{$self->{remote_addr}}{$self*1};
140} 169}
141 170
142# end of connection 171# end of connection
143sub eoconn { 172sub eoconn {
144 my $self = shift; 173 my $self = shift;
174
175 # clean up hints
176 delete $conn{$self->{remote_id}}{$self*1};
145 delete $uri{$self->{remote_addr}}{$self->{uri}}{$self*1}; 177 delete $uri{$self->{remote_id}}{$self->{uri}}{$self*1};
178
179 $httpevent->broadcast;
146} 180}
147 181
148sub slog { 182sub slog {
149 my $self = shift; 183 my $self = shift;
150 main::slog($_[0], ($self->{remote_id} || $self->{remote_addr}) ."> $_[1]"); 184 main::slog($_[0], "$self->{remote_id}> $_[1]");
151} 185}
152 186
153sub response { 187sub response {
154 my ($self, $code, $msg, $hdr, $content) = @_; 188 my ($self, $code, $msg, $hdr, $content) = @_;
155 my $res = "HTTP/1.1 $code $msg\015\012"; 189 my $res = "HTTP/1.1 $code $msg\015\012";
156 190
157 $self->{h}{connection} ||= $hdr->{Connection}; 191 if (exists $hdr->{Connection}) {
192 if ($hdr->{Connection} =~ /close/) {
193 $self->{h}{connection} = "close"
194 }
195 } else {
196 if ($self->{version} < 1.1) {
197 if ($self->{h}{connection} =~ /keep-alive/i) {
198 $hdr->{Connection} = "Keep-Alive";
199 } else {
200 $self->{h}{connection} = "close"
201 }
202 }
203 }
158 204
159 $res .= "Date: ".(time2str $::NOW)."\015\012"; # slow? nah. :( 205 $res .= "Date: $HTTP_NOW\015\012";
160 206
161 while (my ($h, $v) = each %$hdr) { 207 while (my ($h, $v) = each %$hdr) {
162 $res .= "$h: $v\015\012" 208 $res .= "$h: $v\015\012"
163 } 209 }
164 $res .= "\015\012"; 210 $res .= "\015\012";
165 211
166 $res .= $content if defined $content and $self->{method} ne "HEAD"; 212 $res .= $content if defined $content and $self->{method} ne "HEAD";
167 213
168 my $log = "$self->{remote_addr} \"$self->{uri}\" $code ".$hdr->{"Content-Length"}." \"$self->{h}{referer}\"\n"; 214 my $log = (POSIX::strftime "%Y-%m-%d %H:%M:%S", gmtime $NOW).
215 " $self->{remote_id} \"$self->{uri}\" $code ".$hdr->{"Content-Length"}.
216 " \"$self->{h}{referer}\"\n";
169 217
170 print $accesslog $log if $accesslog; 218 print $accesslog $log if $accesslog;
171 print STDERR $log; 219 print STDERR $log;
172 220
173 $self->{written} += 221 $self->{written} +=
177sub err { 225sub err {
178 my $self = shift; 226 my $self = shift;
179 my ($code, $msg, $hdr, $content) = @_; 227 my ($code, $msg, $hdr, $content) = @_;
180 228
181 unless (defined $content) { 229 unless (defined $content) {
182 $content = "$code $msg"; 230 $content = "$code $msg\n";
183 $hdr->{"Content-Type"} = "text/plain"; 231 $hdr->{"Content-Type"} = "text/plain";
184 $hdr->{"Content-Length"} = length $content; 232 $hdr->{"Content-Length"} = length $content;
185 } 233 }
186 $hdr->{"Connection"} = "close"; 234 $hdr->{"Connection"} = "close";
187 235
188 $self->response($code, $msg, $hdr, $content); 236 $self->response($code, $msg, $hdr, $content);
189 237
190 die bless {}, err::; 238 die bless {}, err::;
191}
192
193sub err_blocked {
194 my $self = shift;
195 my $ip = $self->{remote_addr};
196 my $time = time2str $blocked{$ip} = $::NOW + $::BLOCKTIME;
197
198 Coro::Event::do_timer(after => 20*rand);
199
200 $self->err(401, "too many connections",
201 {
202 "Content-Type" => "text/html",
203 "Retry-After" => $::BLOCKTIME,
204 "Warning" => "Please do NOT retry, you have been blocked",
205 "WWW-Authenticate" => "Basic realm=\"Please do NOT retry, you have been blocked\"",
206 "Connection" => "close",
207 },
208 <<EOF);
209<html>
210<head>
211<title>Too many connections</title>
212</head>
213<body bgcolor="#ffffff" text="#000000" link="#0000ff" vlink="#000080" alink="#ff0000">
214
215<p>You have been blocked because you opened too many connections. You
216may retry at</p>
217
218 <p><blockquote>$time.</blockquote></p>
219
220<p>Until then, each new access will renew the block. You might want to have a
221look at the <a href="http://www.goof.com/pcg/marc/animefaq.html#connectionlimit">FAQ</a>.</p>
222
223</body></html>
224EOF
225} 239}
226 240
227sub handle { 241sub handle {
228 my $self = shift; 242 my $self = shift;
229 my $fh = $self->{fh}; 243 my $fh = $self->{fh};
246 } 260 }
247 261
248 $self->{h} = {}; 262 $self->{h} = {};
249 263
250 $fh->timeout($::RES_TIMEOUT); 264 $fh->timeout($::RES_TIMEOUT);
251 my $ip = $self->{remote_addr};
252
253 if ($blocked{$ip}) {
254 $self->err_blocked($blocked{$ip})
255 if $blocked{$ip} > $::NOW;
256
257 delete $blocked{$ip};
258 }
259
260 if (%{$conn{$ip}} > $::MAX_CONN_IP) {
261 $self->slog(2, "blocked ip $ip");
262 $self->err_blocked;
263 }
264 265
265 $req =~ /^(?:\015\012)? 266 $req =~ /^(?:\015\012)?
266 (GET|HEAD) \040+ 267 (GET|HEAD) \040+
267 ([^\040]+) \040+ 268 ([^\040]+) \040+
268 HTTP\/([0-9]+\.[0-9]+) 269 HTTP\/([0-9]+\.[0-9]+)
293 294
294 $self->{h}{$h} = substr $v, 1 295 $self->{h}{$h} = substr $v, 1
295 while ($h, $v) = each %hdr; 296 while ($h, $v) = each %hdr;
296 } 297 }
297 298
299 # remote id should be unique per user
300 my $id = $self->{remote_addr};
301
302 if (exists $self->{h}{"client-ip"}) {
303 $id .= "[".$self->{h}{"client-ip"}."]";
304 } elsif (exists $self->{h}{"x-forwarded-for"}) {
305 $id .= "[".$self->{h}{"x-forwarded-for"}."]";
306 }
307
308 $self->{remote_id} = $id;
309
310 if ($blocked{$id}) {
311 $self->err_blocked($blocked{$id})
312 if $blocked{$id} > $::NOW;
313
314 delete $blocked{$id};
315 }
316
317 if (%{$conn{$id}} >= $::MAX_CONN_IP) {
318 my $delay = $::PER_TIMEOUT + $::NOW + 15;
319 while (%{$conn{$id}} >= $::MAX_CONN_IP) {
320 if ($delay < $::NOW) {
321 $self->slog(2, "blocked ip $id");
322 $self->err_blocked;
323 } else {
324 $httpevent->wait;
325 }
326 }
327 }
328
298 # find out server name and port 329 # find out server name and port
299 if ($self->{uri} =~ s/^http:\/\/([^\/?#]*)//i) { 330 if ($self->{uri} =~ s/^http:\/\/([^\/?#]*)//i) {
300 $host = $1; 331 $host = $1;
301 } else { 332 } else {
302 $host = $self->{h}{host}; 333 $host = $self->{h}{host};
304 335
305 if (defined $host) { 336 if (defined $host) {
306 $self->{server_port} = $host =~ s/:([0-9]+)$// ? $1 : 80; 337 $self->{server_port} = $host =~ s/:([0-9]+)$// ? $1 : 80;
307 } else { 338 } else {
308 ($self->{server_port}, $host) 339 ($self->{server_port}, $host)
309 = unpack_sockaddr_in $self->{fh}->getsockname 340 = unpack_sockaddr_in $self->{fh}->sockname
310 or $self->err(500, "unable to get socket name"); 341 or $self->err(500, "unable to get socket name");
311 $host = inet_ntoa $host; 342 $host = inet_ntoa $host;
312 } 343 }
313 344
314 $self->{server_name} = $host; 345 $self->{server_name} = $host;
315 346
316 # remote id should be unique per user 347 # enter ourselves into various lists
317 $self->{remote_id} = $self->{remote_addr}; 348 weaken ($conn{$id}{$self*1} = $self);
318
319 if (exists $self->{h}{"client-ip"}) {
320 $self->{remote_id} .= "[".$self->{h}{"client-ip"}."]";
321 } elsif (exists $self->{h}{"x-forwarded-for"}) {
322 $self->{remote_id} .= "[".$self->{h}{"x-forwarded-for"}."]";
323 }
324
325 weaken ($uri{$self->{remote_addr}}{$self->{uri}}{$self*1} = $self); 349 weaken ($uri{$id}{$self->{uri}}{$self*1} = $self);
326 350
327 eval { 351 eval {
328 $self->map_uri; 352 $self->map_uri;
329 $self->respond; 353 $self->respond;
330 }; 354 };
331 355
332 $self->eoconn; 356 $self->eoconn;
333 357
334 die if $@ && !ref $@; 358 die if $@ && !ref $@;
335 359
336 last if $self->{h}{connection} =~ /close/ || $self->{version} < 1.1; 360 last if $self->{h}{connection} =~ /close/;
361
362 $httpevent->broadcast;
337 363
338 $fh->timeout($::PER_TIMEOUT); 364 $fh->timeout($::PER_TIMEOUT);
339 } 365 }
340} 366}
341 367
391 417
392sub respond { 418sub respond {
393 my $self = shift; 419 my $self = shift;
394 my $path = $self->{path}; 420 my $path = $self->{path};
395 421
396 stat $path 422 if ($self->{name} =~ s%^/internal/([^/]+)%%) {
397 or $self->err(404, "not found"); 423 if ($::internal{$1}) {
398 424 $::internal{$1}->($self);
399 $self->{stat} = [stat _];
400
401 # idiotic netscape sends idiotic headers AGAIN
402 my $ims = $self->{h}{"if-modified-since"} =~ /^([^;]+)/
403 ? str2time $1 : 0;
404
405 if (-d _ && -r _) {
406 # directory
407 if ($path !~ /\/$/) {
408 # create a redirect to get the trailing "/"
409 # we don't try to avoid the :80
410 $self->err(301, "moved permanently", { Location => "http://".$self->server_hostport."$self->{uri}/" });
411 } else { 425 } else {
412 $ims < $self->{stat}[9] 426 $self->err(404, "not found");
427 }
428 } else {
429
430 stat $path
413 or $self->err(304, "not modified"); 431 or $self->err(404, "not found");
414 432
415 if (-r "$path/index.html") { 433 $self->{stat} = [stat _];
416 $self->{path} .= "/index.html"; 434
417 $self->handle_file; 435 # idiotic netscape sends idiotic headers AGAIN
436 my $ims = $self->{h}{"if-modified-since"} =~ /^([^;]+)/
437 ? str2time $1 : 0;
438
439 if (-d _ && -r _) {
440 # directory
441 if ($path !~ /\/$/) {
442 # create a redirect to get the trailing "/"
443 # we don't try to avoid the :80
444 $self->err(301, "moved permanently", { Location => "http://".$self->server_hostport."$self->{uri}/" });
418 } else { 445 } else {
446 $ims < $self->{stat}[9]
447 or $self->err(304, "not modified");
448
449 if (-r "$path/index.html") {
450 # replace directory "size" by index.html filesize
451 $self->{stat}[7] = (stat ($self->{path} .= "/index.html"))[7];
452 $self->handle_file($queue_index);
453 } else {
419 $self->handle_dir; 454 $self->handle_dir;
420 } 455 }
421 } 456 }
422 } elsif (-f _ && -r _) { 457 } elsif (-f _ && -r _) {
423 -x _ and $self->err(403, "forbidden"); 458 -x _ and $self->err(403, "forbidden");
424 $self->handle_file; 459 $self->handle_file(-s _ >= $::TRANSFER_SMALL ? $queue_large : $queue_small);
425 } else { 460 } else {
426 $self->err(404, "not found"); 461 $self->err(404, "not found");
462 }
427 } 463 }
428} 464}
429 465
430sub handle_dir { 466sub handle_dir {
431 my $self = shift; 467 my $self = shift;
433 469
434 $self->response(200, "ok", 470 $self->response(200, "ok",
435 { 471 {
436 "Content-Type" => "text/html", 472 "Content-Type" => "text/html",
437 "Content-Length" => length $idx, 473 "Content-Length" => length $idx,
474 #d# directories change all the time, so X-
475 "X-Last-Modified" => time2str ((stat _)[9]),
438 }, 476 },
439 $idx); 477 $idx);
440} 478}
441 479
442sub handle_file { 480sub handle_file {
443 my $self = shift; 481 my ($self, $queue) = @_;
444 my $length = -s _; 482 my $length = $self->{stat}[7];
445 my $hdr = { 483 my $hdr = {
446 "Last-Modified" => time2str ((stat _)[9]), 484 "Last-Modified" => time2str ((stat _)[9]),
447 }; 485 };
448 486
449 my @code = (200, "ok"); 487 my @code = (200, "ok");
461 } 499 }
462 goto satisfiable if $l >= 0 && $l < $length && $h >= 0 && $h >= $l; 500 goto satisfiable if $l >= 0 && $l < $length && $h >= 0 && $h >= $l;
463 } 501 }
464 $hdr->{"Content-Range"} = "bytes */$length"; 502 $hdr->{"Content-Range"} = "bytes */$length";
465 $hdr->{"Content-Length"} = $length; 503 $hdr->{"Content-Length"} = $length;
466 $self->slog(9, "not satisfiable($self->{h}{range}|".$self->{h}{"user-agent"}.")");
467 $self->err(416, "not satisfiable", $hdr, ""); 504 $self->err(416, "not satisfiable", $hdr, "");
468 505
469satisfiable: 506satisfiable:
470 # check for segmented downloads 507 # check for segmented downloads
471 if ($l && $::NO_SEGMENTED) { 508 if ($l && $::NO_SEGMENTED) {
472 my $delay = 60; 509 my $delay = $::NOW + $::PER_TIMEOUT + 15;
473 while (%{$uri{$self->{remote_addr}}{$self->{uri}}} > 1) { 510 while (%{$uri{$self->{remote_id}}{$self->{uri}}} > 1) {
474 if ($delay <= 0) { 511 if ($delay <= $::NOW) {
475 $self->err(400, "segmented downloads are not allowed", 512 $self->err_segmented_download;
476 { "Content-Type" => "text/html", Connection => "close" }, <<EOF);
477<html>
478<head>
479<title>Segmented downloads are not allowed</title>
480</head>
481<body bgcolor="#ffffff" text="#000000" link="#0000ff" vlink="#000080" alink="#ff0000">
482
483<p>Segmented downloads are not allowed on this server. Please refer to the
484<a href="http://www.goof.com/pcg/marc/animefaq.html#segmented_downloads">FAQ</a>.</p>
485
486</body></html>
487EOF
488 } else { 513 } else {
489 Coro::Event::do_timer(after => 3); $delay -= 3; 514 $httpevent->wait;
490 } 515 }
491 } 516 }
492 } 517 }
493 518
494 $hdr->{"Content-Range"} = "bytes $l-$h/$length"; 519 $hdr->{"Content-Range"} = "bytes $l-$h/$length";
505 $hdr->{"Content-Length"} = $length; 530 $hdr->{"Content-Length"} = $length;
506 531
507 $self->response(@code, $hdr, ""); 532 $self->response(@code, $hdr, "");
508 533
509 if ($self->{method} eq "GET") { 534 if ($self->{method} eq "GET") {
535 $self->{time} = $::NOW;
536
537 my $current = $Coro::current;
538
510 my ($fh, $buf, $r); 539 my ($fh, $buf, $r);
511 my $current = $Coro::current; 540
512 open $fh, "<", $self->{path} 541 open $fh, "<", $self->{path}
513 or die "$self->{path}: late open failure ($!)"; 542 or die "$self->{path}: late open failure ($!)";
514 543
515 $h -= $l - 1; 544 $h -= $l - 1;
516 545
517 if (0) { 546 if (0) { # !AIO
518 if ($l) { 547 if ($l) {
519 sysseek $fh, $l, 0; 548 sysseek $fh, $l, 0;
520 } 549 }
521 } 550 }
551
552 my $transfer = $queue->start_transfer;
553 my $locked;
554 my $bufsize = $::WAIT_BUFSIZE; # initial buffer size
522 555
523 while ($h > 0) { 556 while ($h > 0) {
557 unless ($locked) {
558 if ($locked ||= $transfer->try($::WAIT_INTERVAL)) {
559 $bufsize = $::BUFSIZE;
560 $self->{time} = $::NOW;
561 }
562 }
563
524 if (0) { 564 if (0) { # !AIO
525 sysread $fh, $buf, $h > $::BUFSIZE ? $::BUFSIZE : $h 565 sysread $fh, $buf, $h > $bufsize ? $bufsize : $h
526 or last; 566 or last;
527 } else { 567 } else {
528 undef $buf; 568 aio_read($fh, $l, ($h > $bufsize ? $bufsize : $h),
529 $aio_requests->down;
530 aio_read($fh, $l, ($h > $::BUFSIZE ? $::BUFSIZE : $h),
531 $buf, 0, sub { 569 $buf, 0, sub {
532 $r = $_[0]; 570 $r = $_[0];
533 $current->ready; 571 Coro::ready($current);
534 }); 572 });
535 &Coro::schedule; 573 &Coro::schedule;
536 $aio_requests->up;
537 last unless $r; 574 last unless $r;
538 } 575 }
539 my $w = $self->{fh}->syswrite($buf) 576 my $w = syswrite $self->{fh}, $buf
540 or last; 577 or last;
541 $::written += $w; 578 $::written += $w;
542 $self->{written} += $w; 579 $self->{written} += $w;
543 $l += $r; 580 $l += $r;
544 } 581 }
545 }
546 582
547 close $fh; 583 close $fh;
584 }
548} 585}
549 586
5501; 5871;

Diff Legend

Removed lines
+ Added lines
< Changed lines
> Changed lines