ViewVC Help
View File | Revision Log | Show Annotations | Download File
/cvs/cvsroot/Coro/myhttpd/httpd.pl
(Generate patch)

Comparing cvsroot/Coro/myhttpd/httpd.pl (file contents):
Revision 1.13 by root, Sun Aug 12 01:16:48 2001 UTC vs.
Revision 1.37 by root, Sun Sep 2 01:03:53 2001 UTC

1use Coro; 1use Coro;
2use Coro::Semaphore; 2use Coro::Semaphore;
3use Coro::Event; 3use Coro::Event;
4use Coro::Socket; 4use Coro::Socket;
5 5
6use HTTP::Date;
7
6no utf8; 8no utf8;
7use bytes; 9use bytes;
8 10
9# at least on my machine, this thingy serves files 11# at least on my machine, this thingy serves files
10# quite a bit faster than apache, ;) 12# quite a bit faster than apache, ;)
11# and quite a bit slower than thttpd :( 13# and quite a bit slower than thttpd :(
12 14
13$SIG{PIPE} = 'IGNORE'; 15$SIG{PIPE} = 'IGNORE';
14 16
17our $accesslog;
18
19if ($ACCESS_LOG) {
20 use IO::Handle;
21 open $accesslog, ">>$ACCESS_LOG"
22 or die "$ACCESS_LOG: $!";
23 $accesslog->autoflush(1);
24}
25
15sub slog { 26sub slog {
16 my $level = shift; 27 my $level = shift;
17 my $format = shift; 28 my $format = shift;
18 printf "---: $format\n", @_; 29 printf "---: $format\n", @_;
19} 30}
20 31
21my $connections = new Coro::Semaphore $MAX_CONNECTS; 32our $connections = new Coro::Semaphore $MAX_CONNECTS || 250;
33
34our $wait_factor = 0.95;
35
36our @transfers = (
37 [(new Coro::Semaphore $MAX_TRANSFERS_SMALL || 50), 1],
38 [(new Coro::Semaphore $MAX_TRANSFERS_LARGE || 50), 1],
39);
22 40
23my @newcons; 41my @newcons;
24my @pool; 42my @pool;
25 43
26# one "execution thread" 44# one "execution thread"
48 Listen => 50, 66 Listen => 50,
49 or die "unable to start server"; 67 or die "unable to start server";
50 68
51push @listen_sockets, $http_port; 69push @listen_sockets, $http_port;
52 70
71our $NOW;
72our $HTTP_NOW;
73
74Event->timer(interval => 1, hard => 1, cb => sub {
75 $NOW = time;
76 $HTTP_NOW = time2str $NOW;
77})->now;
78
53# the "main thread" 79# the "main thread"
54async { 80async {
55 slog 1, "accepting connections"; 81 slog 1, "accepting connections";
56 while () { 82 while () {
57 $connections->down; 83 $connections->down;
58 push @newcons, [$http_port->accept]; 84 push @newcons, [$http_port->accept];
59 #slog 3, "accepted @$connections ".scalar(@pool); 85 #slog 3, "accepted @$connections ".scalar(@pool);
60 $::NOW = time;
61 if (@pool) { 86 if (@pool) {
62 (pop @pool)->ready; 87 (pop @pool)->ready;
63 } else { 88 } else {
64 async \&handler; 89 async \&handler;
65 } 90 }
70package conn; 95package conn;
71 96
72use Socket; 97use Socket;
73use HTTP::Date; 98use HTTP::Date;
74use Convert::Scalar 'weaken'; 99use Convert::Scalar 'weaken';
100use Linux::AIO;
75 101
102Linux::AIO::min_parallel $::AIO_PARALLEL;
103
104Event->io(fd => Linux::AIO::poll_fileno,
105 poll => 'r', async => 1,
106 cb => \&Linux::AIO::poll_cb);
107
76our %conn; # $conn{ip}{fh} => connobj 108our %conn; # $conn{ip}{self} => connobj
109our %uri; # $uri{ip}{uri}{self}
77our %blocked; 110our %blocked;
78our %mimetype; 111our %mimetype;
79 112
80sub read_mimetypes { 113sub read_mimetypes {
81 local *M; 114 local *M;
101 or $self->err(500, "unable to decode peername"); 134 or $self->err(500, "unable to decode peername");
102 135
103 $self->{remote_addr} = inet_ntoa $iaddr; 136 $self->{remote_addr} = inet_ntoa $iaddr;
104 $self->{time} = $::NOW; 137 $self->{time} = $::NOW;
105 138
106 # enter ourselves into various lists
107 weaken ($conn{$self->{remote_addr}}{$self*1} = $self);
108
109 $::conns++; 139 $::conns++;
110 140
111 $self; 141 $self;
112} 142}
113 143
114sub DESTROY { 144sub DESTROY {
115 my $self = shift; 145 my $self = shift;
116 146
117 $::conns--; 147 $::conns--;
118 148
149 $self->eoconn;
150}
151
152# end of connection
153sub eoconn {
154 my $self = shift;
155
156 # clean up hints
119 delete $conn{$self->{remote_addr}}{$self*1}; 157 delete $conn{$self->{remote_id}}{$self*1};
120 delete $uri{$self->{remote_addr}}{$self->{uri}}{$self*1}; 158 delete $uri{$self->{remote_id}}{$self->{uri}}{$self*1};
121} 159}
122 160
123sub slog { 161sub slog {
124 my $self = shift; 162 my $self = shift;
125 main::slog($_[0], "$self->{remote_addr}> $_[1]"); 163 main::slog($_[0], ($self->{remote_id} || $self->{remote_addr}) ."> $_[1]");
126} 164}
127 165
128sub response { 166sub response {
129 my ($self, $code, $msg, $hdr, $content) = @_; 167 my ($self, $code, $msg, $hdr, $content) = @_;
130 my $res = "HTTP/1.0 $code $msg\015\012"; 168 my $res = "HTTP/1.1 $code $msg\015\012";
131 169
132 $res .= "Connection: close\015\012"; 170 $self->{h}{connection} ||= $hdr->{Connection};
133 $res .= "Date: ".(time2str $::NOW)."\015\012"; # slow? nah. :( 171
172 $res .= "Date: $HTTP_NOW\015\012";
134 173
135 while (my ($h, $v) = each %$hdr) { 174 while (my ($h, $v) = each %$hdr) {
136 $res .= "$h: $v\015\012" 175 $res .= "$h: $v\015\012"
137 } 176 }
138 $res .= "\015\012"; 177 $res .= "\015\012";
139 178
140 $res .= $content if defined $content and $self->{method} ne "HEAD"; 179 $res .= $content if defined $content and $self->{method} ne "HEAD";
141 180
142 print STDERR "$self->{remote_addr} \"$self->{uri}\" $code ".$hdr->{"Content-Length"}." \"$self->{h}{referer}\"\n";#d# 181 my $log = "$self->{remote_addr} \"$self->{uri}\" $code ".$hdr->{"Content-Length"}." \"$self->{h}{referer}\"\n";
182
183 print $accesslog $log if $accesslog;
184 print STDERR $log;
143 185
144 $self->{written} += 186 $self->{written} +=
145 print {$self->{fh}} $res; 187 print {$self->{fh}} $res;
146} 188}
147 189
148sub err { 190sub err {
149 my $self = shift; 191 my $self = shift;
150 my ($code, $msg, $hdr, $content) = @_; 192 my ($code, $msg, $hdr, $content) = @_;
151 193
152 unless (defined $content) { 194 unless (defined $content) {
153 $content = "$code $msg"; 195 $content = "$code $msg\n";
154 $hdr->{"Content-Type"} = "text/plain"; 196 $hdr->{"Content-Type"} = "text/plain";
155 $hdr->{"Content-Length"} = length $content; 197 $hdr->{"Content-Length"} = length $content;
156 } 198 }
199 $hdr->{"Connection"} = "close";
157 200
158 $self->response($code, $msg, $hdr, $content); 201 $self->response($code, $msg, $hdr, $content);
159 202
160 die bless {}, err::; 203 die bless {}, err::;
161} 204}
162 205
163sub err_blocked {
164 my $self = shift;
165 my $ip = $self->{remote_addr};
166 my $time = time2str $blocked{$ip} = $::NOW + $::BLOCKTIME;
167
168 $self->err(403, "too many connections",
169 {
170 "Content-Type" => "text/html",
171 "Retry-After" => $::BLOCKTIME
172 },
173 <<EOF);
174<html><p>
175You have been blocked because you opened too many connections. You
176may retry at</p>
177
178 <p><blockquote>$time.</blockquote></p>
179
180<p>Until then, each new access will renew the block. You might want to have a
181look at the <a href="http://www.goof.com/pcg/marc/animefaq.html">FAQ</a>.</p>
182</html>
183EOF
184}
185
186sub handle { 206sub handle {
187 my $self = shift; 207 my $self = shift;
188 my $fh = $self->{fh}; 208 my $fh = $self->{fh};
189 209
210 my $host;
211
212 $fh->timeout($::REQ_TIMEOUT);
190 #while() { 213 while() {
214 $self->{reqs}++;
215
216 # read request and parse first line
217 my $req = $fh->readline("\015\012\015\012");
218
219 unless (defined $req) {
220 if (exists $self->{version}) {
221 last;
222 } else {
223 $self->err(408, "request timeout");
224 }
225 }
226
191 $self->{h} = {}; 227 $self->{h} = {};
192 228
193 # read request and parse first line
194 $fh->timeout($::REQ_TIMEOUT);
195 my $req = $fh->readline("\015\012\015\012");
196 $fh->timeout($::RES_TIMEOUT); 229 $fh->timeout($::RES_TIMEOUT);
197
198 defined $req or
199 $self->err(408, "request timeout");
200
201 my $ip = $self->{remote_addr};
202
203 if ($blocked{$ip}) {
204 $self->err_blocked($blocked{$ip})
205 if $blocked{$ip} > $::NOW;
206
207 delete $blocked{$ip};
208 }
209
210 if (%{$conn{$ip}} > $::MAX_CONN_IP) {
211 $self->slog(2, "blocked ip $ip");
212 $self->err_blocked;
213 }
214 230
215 $req =~ /^(?:\015\012)? 231 $req =~ /^(?:\015\012)?
216 (GET|HEAD) \040+ 232 (GET|HEAD) \040+
217 ([^\040]+) \040+ 233 ([^\040]+) \040+
218 HTTP\/([0-9]+\.[0-9]+) 234 HTTP\/([0-9]+\.[0-9]+)
219 \015\012/gx 235 \015\012/gx
220 or $self->err(403, "method not allowed", { Allow => "GET,HEAD" }); 236 or $self->err(405, "method not allowed", { Allow => "GET,HEAD" });
221
222 $2 ne "1.0"
223 or $self->err(506, "http protocol version not supported");
224 237
225 $self->{method} = $1; 238 $self->{method} = $1;
226 $self->{uri} = $2; 239 $self->{uri} = $2;
240 $self->{version} = $3;
241
242 $3 =~ /^1\./
243 or $self->err(506, "http protocol version $3 not supported");
227 244
228 # parse headers 245 # parse headers
229 { 246 {
230 my (%hdr, $h, $v); 247 my (%hdr, $h, $v);
231 248
242 259
243 $self->{h}{$h} = substr $v, 1 260 $self->{h}{$h} = substr $v, 1
244 while ($h, $v) = each %hdr; 261 while ($h, $v) = each %hdr;
245 } 262 }
246 263
264 # remote id should be unique per user
265 my $id = $self->{remote_addr};
266
267 if (exists $self->{h}{"client-ip"}) {
268 $id .= "[".$self->{h}{"client-ip"}."]";
269 } elsif (exists $self->{h}{"x-forwarded-for"}) {
270 $id .= "[".$self->{h}{"x-forwarded-for"}."]";
271 }
272
273 $self->{remote_id} = $id;
274
275 if ($blocked{$id}) {
276 $self->err_blocked($blocked{$id})
277 if $blocked{$id} > $::NOW;
278
279 delete $blocked{$id};
280 }
281
282 if (%{$conn{$id}} >= $::MAX_CONN_IP) {
283 my $delay = $::PER_TIMEOUT + 15;
284 while (%{$conn{$id}} >= $::MAX_CONN_IP) {
285 if ($delay <= 0) {
286 $self->slog(2, "blocked ip $id");
287 $self->err_blocked;
288 } else {
289 Coro::Event::do_timer(after => 4); $delay -= 4;
290 }
291 }
292 }
293
294 # find out server name and port
295 if ($self->{uri} =~ s/^http:\/\/([^\/?#]*)//i) {
296 $host = $1;
297 } else {
298 $host = $self->{h}{host};
299 }
300
301 if (defined $host) {
247 $self->{server_port} = $self->{h}{host} =~ s/:([0-9]+)$// ? $1 : 80; 302 $self->{server_port} = $host =~ s/:([0-9]+)$// ? $1 : 80;
303 } else {
304 ($self->{server_port}, $host)
305 = unpack_sockaddr_in $self->{fh}->getsockname
306 or $self->err(500, "unable to get socket name");
307 $host = inet_ntoa $host;
308 }
248 309
310 $self->{server_name} = $host;
311
312 # enter ourselves into various lists
313 weaken ($conn{$id}{$self*1} = $self);
249 weaken ($uri{$self->{remote_addr}}{$self->{uri}}{$self*1} = $self); 314 weaken ($uri{$id}{$self->{uri}}{$self*1} = $self);
250 315
316 eval {
251 $self->map_uri; 317 $self->map_uri;
252 $self->respond; 318 $self->respond;
319 };
320
321 $self->eoconn;
322
323 die if $@ && !ref $@;
324
325 last if $self->{h}{connection} =~ /close/ || $self->{version} < 1.1;
326
327 $fh->timeout($::PER_TIMEOUT);
253 #} 328 }
254} 329}
255 330
256# uri => path mapping 331# uri => path mapping
257sub map_uri { 332sub map_uri {
258 my $self = shift; 333 my $self = shift;
259 my $host = $self->{h}{host} || "default"; 334 my $host = $self->{server_name};
260 my $uri = $self->{uri}; 335 my $uri = $self->{uri};
261 336
262 # some massaging, also makes it more secure 337 # some massaging, also makes it more secure
263 $uri =~ s/%([0-9a-fA-F][0-9a-fA-F])/chr hex $1/ge; 338 $uri =~ s/%([0-9a-fA-F][0-9a-fA-F])/chr hex $1/ge;
264 $uri =~ s%//+%/%g; 339 $uri =~ s%//+%/%g;
274 $self->{path} = "$::DOCROOT/$host$uri"; 349 $self->{path} = "$::DOCROOT/$host$uri";
275 350
276 $self->access_check; 351 $self->access_check;
277} 352}
278 353
279sub server_address {
280 my $self = shift;
281 my ($port, $iaddr) = unpack_sockaddr_in $self->{fh}->getsockname
282 or $self->err(500, "unable to get socket name");
283 ((inet_ntoa $iaddr), $port);
284}
285
286sub server_host {
287 my $self = shift;
288 if (exists $self->{h}{host}) {
289 return $self->{h}{host};
290 } else {
291 return (($self->server_address)[0]);
292 }
293}
294
295sub server_hostport {
296 my $self = shift;
297 my ($host, $port);
298 if (exists $self->{h}{host}) {
299 ($host, $port) = ($self->{h}{host}, $self->{server_port});
300 } else {
301 ($host, $port) = $self->server_address;
302 }
303 $port = $port == 80 ? "" : ":$port";
304 $host.$port;
305}
306
307sub _cgi { 354sub _cgi {
308 my $self = shift; 355 my $self = shift;
309 my $path = shift; 356 my $path = shift;
310 my $fh; 357 my $fh;
311 358
312 # no two-way xxx supported 359 # no two-way xxx supported
313 if (0 == fork) { 360 if (0 == fork) {
314 open STDOUT, ">&".fileno($self->{fh}); 361 open STDOUT, ">&".fileno($self->{fh});
315 if (chdir $::DOCROOT) { 362 if (chdir $::DOCROOT) {
316 $ENV{SERVER_SOFTWARE} = "thttpd-myhttpd"; # we are thttpd-alike 363 $ENV{SERVER_SOFTWARE} = "thttpd-myhttpd"; # we are thttpd-alike
317 $ENV{HTTP_HOST} = $self->server_host; 364 $ENV{HTTP_HOST} = $self->{server_name};
318 $ENV{HTTP_PORT} = $self->{server_host}; 365 $ENV{HTTP_PORT} = $self->{server_port};
319 $ENV{SCRIPT_NAME} = $self->{name}; 366 $ENV{SCRIPT_NAME} = $self->{name};
320 exec $path; 367 exec $path;
321 } 368 }
322 Coro::State::_exit(0); 369 Coro::State::_exit(0);
323 } else { 370 } else {
371 die;
324 } 372 }
373}
374
375sub server_hostport {
376 $_[0]{server_port} == 80
377 ? $_[0]{server_name}
378 : "$_[0]{server_name}:$_[0]{server_port}";
325} 379}
326 380
327sub respond { 381sub respond {
328 my $self = shift; 382 my $self = shift;
329 my $path = $self->{path}; 383 my $path = $self->{path};
339 393
340 if (-d _ && -r _) { 394 if (-d _ && -r _) {
341 # directory 395 # directory
342 if ($path !~ /\/$/) { 396 if ($path !~ /\/$/) {
343 # create a redirect to get the trailing "/" 397 # create a redirect to get the trailing "/"
344 my $host = $self->server_hostport; 398 # we don't try to avoid the :80
345 $self->err(301, "moved permanently", { Location => "http://$host$self->{uri}/" }); 399 $self->err(301, "moved permanently", { Location => "http://".$self->server_hostport."$self->{uri}/" });
346 } else { 400 } else {
347 $ims < $self->{stat}[9] 401 $ims < $self->{stat}[9]
348 or $self->err(304, "not modified"); 402 or $self->err(304, "not modified");
349 403
350 if ($self->{method} eq "GET") {
351 if (-r "$path/index.html") { 404 if (-r "$path/index.html") {
352 $self->{path} .= "/index.html"; 405 $self->{path} .= "/index.html";
353 $self->handle_file; 406 $self->handle_file;
354 } else { 407 } else {
355 $self->handle_dir; 408 $self->handle_dir;
356 }
357 } 409 }
358 } 410 }
359 } elsif (-f _ && -r _) { 411 } elsif (-f _ && -r _) {
360 -x _ and $self->err(403, "forbidden"); 412 -x _ and $self->err(403, "forbidden");
361 $self->handle_file; 413 $self->handle_file;
376 $idx); 428 $idx);
377} 429}
378 430
379sub handle_file { 431sub handle_file {
380 my $self = shift; 432 my $self = shift;
381 my $length = -s _; 433 my $length = $self->{stat}[7];
434 my $queue = $::transfers[$length >= $::TRANSFER_SMALL];
382 my $hdr = { 435 my $hdr = {
383 "Last-Modified" => time2str ((stat _)[9]), 436 "Last-Modified" => time2str ((stat _)[9]),
384 }; 437 };
385 438
386 my @code = (200, "ok"); 439 my @code = (200, "ok");
394 ($l, $h) = ($1, ($2 ne "" || $2 >= $length) ? $2 : $length - 1); 447 ($l, $h) = ($1, ($2 ne "" || $2 >= $length) ? $2 : $length - 1);
395 } else { 448 } else {
396 ($l, $h) = (0, $length - 1); 449 ($l, $h) = (0, $length - 1);
397 goto ignore; 450 goto ignore;
398 } 451 }
399 goto satisfiable if $l >= 0 && $l < $length && $h >= 0 && $h > $l; 452 goto satisfiable if $l >= 0 && $l < $length && $h >= 0 && $h >= $l;
400 } 453 }
401 $hdr->{"Content-Range"} = "bytes */$length"; 454 $hdr->{"Content-Range"} = "bytes */$length";
455 $hdr->{"Content-Length"} = $length;
402 $self->err(416, "not satisfiable", $hdr); 456 $self->err(416, "not satisfiable", $hdr, "");
403 457
404satisfiable: 458satisfiable:
405 # check for segmented downloads 459 # check for segmented downloads
406 if ($l && $::NO_SEGMENTED) { 460 if ($l && $::NO_SEGMENTED) {
461 my $delay = $::PER_TIMEOUT + 15;
407 if (%{$uri{$self->{remote_addr}}{$self->{uri}}} > 1) { 462 while (%{$uri{$self->{remote_id}}{$self->{uri}}} > 1) {
408 $self->err(400, "segmented downloads are not allowed"); 463 if ($delay <= 0) {
464 $self->err_segmented_download;
465 } else {
466 Coro::Event::do_timer(after => 4); $delay -= 4;
467 }
409 } 468 }
410 } 469 }
411 470
412 $hdr->{"Content-Range"} = "bytes $l-$h/$length"; 471 $hdr->{"Content-Range"} = "bytes $l-$h/$length";
413 @code = (206, "partial content"); 472 @code = (206, "partial content");
423 $hdr->{"Content-Length"} = $length; 482 $hdr->{"Content-Length"} = $length;
424 483
425 $self->response(@code, $hdr, ""); 484 $self->response(@code, $hdr, "");
426 485
427 if ($self->{method} eq "GET") { 486 if ($self->{method} eq "GET") {
487 $self->{time} = $::NOW;
488
489 my $fudge = $queue->[0]->waiters;
490 $fudge = $fudge ? ($fudge+1)/$fudge : 1;
491
492 $queue->[1] *= $fudge;
493 my $transfer = $queue->[0]->guard;
494
495 if ($fudge != 1) {
496 $queue->[1] /= $fudge;
497 $queue->[1] = $queue->[1] * $::wait_factor
498 + ($::NOW - $self->{time}) * (1 - $::wait_factor);
499 }
500 $self->{time} = $::NOW;
501
502 $self->{fh}->writable or return;
503
428 my ($fh, $buf); 504 my ($fh, $buf, $r);
505 my $current = $Coro::current;
429 open $fh, "<", $self->{path} 506 open $fh, "<", $self->{path}
430 or die "$self->{path}: late open failure ($!)"; 507 or die "$self->{path}: late open failure ($!)";
431 508
432 if ($l) {
433 sysseek $fh, $l, 0
434 or die "$self->{path}: cannot seek to $l ($!)";
435 }
436
437 $h -= $l - 1; 509 $h -= $l - 1;
438 510
511 if (0) {
512 if ($l) {
513 sysseek $fh, $l, 0;
514 }
515 }
516
439 while ($h > 0) { 517 while ($h > 0) {
518 if (0) {
440 $h -= sysread $fh, $buf, $h > $::BUFSIZE ? $::BUFSIZE : $h; 519 sysread $fh, $buf, $h > $::BUFSIZE ? $::BUFSIZE : $h
441 my $w = $self->{fh}->syswrite($buf) 520 or last;
521 } else {
522 aio_read($fh, $l, ($h > $::BUFSIZE ? $::BUFSIZE : $h),
523 $buf, 0, sub {
524 $r = $_[0];
525 Coro::ready($current);
526 });
527 &Coro::schedule;
528 last unless $r;
529 }
530 my $w = syswrite $self->{fh}, $buf
442 or last; 531 or last;
443 $::written += $w; 532 $::written += $w;
444 $self->{written} += $w; 533 $self->{written} += $w;
534 $l += $r;
445 } 535 }
446 }
447 536
448 close $fh; 537 close $fh;
538 }
449} 539}
450 540
4511; 5411;

Diff Legend

Removed lines
+ Added lines
< Changed lines
> Changed lines