ViewVC Help
View File | Revision Log | Show Annotations | Download File
/cvs/cvsroot/Coro/myhttpd/httpd.pl
(Generate patch)

Comparing cvsroot/Coro/myhttpd/httpd.pl (file contents):
Revision 1.14 by root, Sun Aug 12 14:09:03 2001 UTC vs.
Revision 1.36 by root, Sun Sep 2 00:54:00 2001 UTC

1use Coro; 1use Coro;
2use Coro::Semaphore; 2use Coro::Semaphore;
3use Coro::Event; 3use Coro::Event;
4use Coro::Socket; 4use Coro::Socket;
5 5
6use HTTP::Date;
7
6no utf8; 8no utf8;
7use bytes; 9use bytes;
8 10
9# at least on my machine, this thingy serves files 11# at least on my machine, this thingy serves files
10# quite a bit faster than apache, ;) 12# quite a bit faster than apache, ;)
11# and quite a bit slower than thttpd :( 13# and quite a bit slower than thttpd :(
12 14
13$SIG{PIPE} = 'IGNORE'; 15$SIG{PIPE} = 'IGNORE';
14 16
17our $accesslog;
18
19if ($ACCESS_LOG) {
20 use IO::Handle;
21 open $accesslog, ">>$ACCESS_LOG"
22 or die "$ACCESS_LOG: $!";
23 $accesslog->autoflush(1);
24}
25
15sub slog { 26sub slog {
16 my $level = shift; 27 my $level = shift;
17 my $format = shift; 28 my $format = shift;
18 printf "---: $format\n", @_; 29 printf "---: $format\n", @_;
19} 30}
20 31
21my $connections = new Coro::Semaphore $MAX_CONNECTS; 32our $connections = new Coro::Semaphore $MAX_CONNECTS || 250;
33
34our $wait_factor = 0.95;
35
36our @transfers = (
37 [(new Coro::Semaphore $MAX_TRANSFERS_SMALL || 50), 1],
38 [(new Coro::Semaphore $MAX_TRANSFERS_LARGE || 50), 1],
39);
22 40
23my @newcons; 41my @newcons;
24my @pool; 42my @pool;
25 43
26# one "execution thread" 44# one "execution thread"
48 Listen => 50, 66 Listen => 50,
49 or die "unable to start server"; 67 or die "unable to start server";
50 68
51push @listen_sockets, $http_port; 69push @listen_sockets, $http_port;
52 70
71our $NOW;
72our $HTTP_NOW;
73
74Event->timer(interval => 1, hard => 1, cb => sub {
75 $NOW = time;
76 $HTTP_NOW = time2str $NOW;
77})->now;
78
53# the "main thread" 79# the "main thread"
54async { 80async {
55 slog 1, "accepting connections"; 81 slog 1, "accepting connections";
56 while () { 82 while () {
57 $connections->down; 83 $connections->down;
58 push @newcons, [$http_port->accept]; 84 push @newcons, [$http_port->accept];
59 #slog 3, "accepted @$connections ".scalar(@pool); 85 #slog 3, "accepted @$connections ".scalar(@pool);
60 $::NOW = time;
61 if (@pool) { 86 if (@pool) {
62 (pop @pool)->ready; 87 (pop @pool)->ready;
63 } else { 88 } else {
64 async \&handler; 89 async \&handler;
65 } 90 }
70package conn; 95package conn;
71 96
72use Socket; 97use Socket;
73use HTTP::Date; 98use HTTP::Date;
74use Convert::Scalar 'weaken'; 99use Convert::Scalar 'weaken';
100use Linux::AIO;
75 101
102Linux::AIO::min_parallel $::AIO_PARALLEL;
103
104my $aio_requests = new Coro::Semaphore $::AIO_PARALLEL * 4;
105
106Event->io(fd => Linux::AIO::poll_fileno,
107 poll => 'r', async => 1,
108 cb => \&Linux::AIO::poll_cb);
109
76our %conn; # $conn{ip}{fh} => connobj 110our %conn; # $conn{ip}{self} => connobj
111our %uri; # $uri{ip}{uri}{self}
77our %blocked; 112our %blocked;
78our %mimetype; 113our %mimetype;
79 114
80sub read_mimetypes { 115sub read_mimetypes {
81 local *M; 116 local *M;
101 or $self->err(500, "unable to decode peername"); 136 or $self->err(500, "unable to decode peername");
102 137
103 $self->{remote_addr} = inet_ntoa $iaddr; 138 $self->{remote_addr} = inet_ntoa $iaddr;
104 $self->{time} = $::NOW; 139 $self->{time} = $::NOW;
105 140
106 # enter ourselves into various lists
107 weaken ($conn{$self->{remote_addr}}{$self*1} = $self);
108
109 $::conns++; 141 $::conns++;
110 142
111 $self; 143 $self;
112} 144}
113 145
114sub DESTROY { 146sub DESTROY {
115 my $self = shift; 147 my $self = shift;
116 148
117 $::conns--; 149 $::conns--;
118 150
151 $self->eoconn;
152}
153
154# end of connection
155sub eoconn {
156 my $self = shift;
157
158 # clean up hints
119 delete $conn{$self->{remote_addr}}{$self*1}; 159 delete $conn{$self->{remote_id}}{$self*1};
120 delete $uri{$self->{remote_addr}}{$self->{uri}}{$self*1}; 160 delete $uri{$self->{remote_id}}{$self->{uri}}{$self*1};
121} 161}
122 162
123sub slog { 163sub slog {
124 my $self = shift; 164 my $self = shift;
125 main::slog($_[0], "$self->{remote_addr}> $_[1]"); 165 main::slog($_[0], ($self->{remote_id} || $self->{remote_addr}) ."> $_[1]");
126} 166}
127 167
128sub response { 168sub response {
129 my ($self, $code, $msg, $hdr, $content) = @_; 169 my ($self, $code, $msg, $hdr, $content) = @_;
130 my $res = "HTTP/1.0 $code $msg\015\012"; 170 my $res = "HTTP/1.1 $code $msg\015\012";
131 171
132 $res .= "Connection: close\015\012"; 172 $self->{h}{connection} ||= $hdr->{Connection};
133 $res .= "Date: ".(time2str $::NOW)."\015\012"; # slow? nah. :( 173
174 $res .= "Date: $HTTP_NOW\015\012";
134 175
135 while (my ($h, $v) = each %$hdr) { 176 while (my ($h, $v) = each %$hdr) {
136 $res .= "$h: $v\015\012" 177 $res .= "$h: $v\015\012"
137 } 178 }
138 $res .= "\015\012"; 179 $res .= "\015\012";
139 180
140 $res .= $content if defined $content and $self->{method} ne "HEAD"; 181 $res .= $content if defined $content and $self->{method} ne "HEAD";
141 182
142 print STDERR "$self->{remote_addr} \"$self->{uri}\" $code ".$hdr->{"Content-Length"}." \"$self->{h}{referer}\"\n";#d# 183 my $log = "$self->{remote_addr} \"$self->{uri}\" $code ".$hdr->{"Content-Length"}." \"$self->{h}{referer}\"\n";
184
185 print $accesslog $log if $accesslog;
186 print STDERR $log;
143 187
144 $self->{written} += 188 $self->{written} +=
145 print {$self->{fh}} $res; 189 print {$self->{fh}} $res;
146} 190}
147 191
148sub err { 192sub err {
149 my $self = shift; 193 my $self = shift;
150 my ($code, $msg, $hdr, $content) = @_; 194 my ($code, $msg, $hdr, $content) = @_;
151 195
152 unless (defined $content) { 196 unless (defined $content) {
153 $content = "$code $msg"; 197 $content = "$code $msg\n";
154 $hdr->{"Content-Type"} = "text/plain"; 198 $hdr->{"Content-Type"} = "text/plain";
155 $hdr->{"Content-Length"} = length $content; 199 $hdr->{"Content-Length"} = length $content;
156 } 200 }
201 $hdr->{"Connection"} = "close";
157 202
158 $self->response($code, $msg, $hdr, $content); 203 $self->response($code, $msg, $hdr, $content);
159 204
160 die bless {}, err::; 205 die bless {}, err::;
161} 206}
162 207
163sub err_blocked {
164 my $self = shift;
165 my $ip = $self->{remote_addr};
166 my $time = time2str $blocked{$ip} = $::NOW + $::BLOCKTIME;
167
168 Coro::Event::do_timer(after => 15);
169
170 $self->err(401, "too many connections",
171 {
172 "Content-Type" => "text/html",
173 "Retry-After" => $::BLOCKTIME
174 },
175 <<EOF);
176<html><p>
177You have been blocked because you opened too many connections. You
178may retry at</p>
179
180 <p><blockquote>$time.</blockquote></p>
181
182<p>Until then, each new access will renew the block. You might want to have a
183look at the <a href="http://www.goof.com/pcg/marc/animefaq.html">FAQ</a>.</p>
184</html>
185EOF
186}
187
188sub handle { 208sub handle {
189 my $self = shift; 209 my $self = shift;
190 my $fh = $self->{fh}; 210 my $fh = $self->{fh};
191 211
212 my $host;
213
214 $fh->timeout($::REQ_TIMEOUT);
192 #while() { 215 while() {
216 $self->{reqs}++;
217
218 # read request and parse first line
219 my $req = $fh->readline("\015\012\015\012");
220
221 unless (defined $req) {
222 if (exists $self->{version}) {
223 last;
224 } else {
225 $self->err(408, "request timeout");
226 }
227 }
228
193 $self->{h} = {}; 229 $self->{h} = {};
194 230
195 # read request and parse first line
196 $fh->timeout($::REQ_TIMEOUT);
197 my $req = $fh->readline("\015\012\015\012");
198 $fh->timeout($::RES_TIMEOUT); 231 $fh->timeout($::RES_TIMEOUT);
199
200 defined $req or
201 $self->err(408, "request timeout");
202
203 my $ip = $self->{remote_addr};
204
205 $self->err_blocked($blocked{$ip});
206 if ($blocked{$ip}) {
207 $self->err_blocked($blocked{$ip})
208 if $blocked{$ip} > $::NOW;
209
210 delete $blocked{$ip};
211 }
212
213 if (%{$conn{$ip}} > $::MAX_CONN_IP) {
214 $self->slog(2, "blocked ip $ip");
215 $self->err_blocked;
216 }
217 232
218 $req =~ /^(?:\015\012)? 233 $req =~ /^(?:\015\012)?
219 (GET|HEAD) \040+ 234 (GET|HEAD) \040+
220 ([^\040]+) \040+ 235 ([^\040]+) \040+
221 HTTP\/([0-9]+\.[0-9]+) 236 HTTP\/([0-9]+\.[0-9]+)
222 \015\012/gx 237 \015\012/gx
223 or $self->err(405, "method not allowed", { Allow => "GET,HEAD" }); 238 or $self->err(405, "method not allowed", { Allow => "GET,HEAD" });
224 239
225 $2 ne "1.0"
226 or $self->err(506, "http protocol version not supported");
227
228 $self->{method} = $1; 240 $self->{method} = $1;
229 $self->{uri} = $2; 241 $self->{uri} = $2;
242 $self->{version} = $3;
243
244 $3 =~ /^1\./
245 or $self->err(506, "http protocol version $3 not supported");
230 246
231 # parse headers 247 # parse headers
232 { 248 {
233 my (%hdr, $h, $v); 249 my (%hdr, $h, $v);
234 250
245 261
246 $self->{h}{$h} = substr $v, 1 262 $self->{h}{$h} = substr $v, 1
247 while ($h, $v) = each %hdr; 263 while ($h, $v) = each %hdr;
248 } 264 }
249 265
266 # remote id should be unique per user
267 my $id = $self->{remote_addr};
268
269 if (exists $self->{h}{"client-ip"}) {
270 $id .= "[".$self->{h}{"client-ip"}."]";
271 } elsif (exists $self->{h}{"x-forwarded-for"}) {
272 $id .= "[".$self->{h}{"x-forwarded-for"}."]";
273 }
274
275 $self->{remote_id} = $id;
276
277 if ($blocked{$id}) {
278 $self->err_blocked($blocked{$id})
279 if $blocked{$id} > $::NOW;
280
281 delete $blocked{$id};
282 }
283
284 if (%{$conn{$id}} >= $::MAX_CONN_IP) {
285 my $delay = $::PER_TIMEOUT + 15;
286 while (%{$conn{$id}} >= $::MAX_CONN_IP) {
287 if ($delay <= 0) {
288 $self->slog(2, "blocked ip $id");
289 $self->err_blocked;
290 } else {
291 Coro::Event::do_timer(after => 4); $delay -= 4;
292 }
293 }
294 }
295
296 # find out server name and port
297 if ($self->{uri} =~ s/^http:\/\/([^\/?#]*)//i) {
298 $host = $1;
299 } else {
300 $host = $self->{h}{host};
301 }
302
303 if (defined $host) {
250 $self->{server_port} = $self->{h}{host} =~ s/:([0-9]+)$// ? $1 : 80; 304 $self->{server_port} = $host =~ s/:([0-9]+)$// ? $1 : 80;
305 } else {
306 ($self->{server_port}, $host)
307 = unpack_sockaddr_in $self->{fh}->getsockname
308 or $self->err(500, "unable to get socket name");
309 $host = inet_ntoa $host;
310 }
251 311
312 $self->{server_name} = $host;
313
314 # enter ourselves into various lists
315 weaken ($conn{$id}{$self*1} = $self);
252 weaken ($uri{$self->{remote_addr}}{$self->{uri}}{$self*1} = $self); 316 weaken ($uri{$id}{$self->{uri}}{$self*1} = $self);
253 317
318 eval {
254 $self->map_uri; 319 $self->map_uri;
255 $self->respond; 320 $self->respond;
321 };
322
323 $self->eoconn;
324
325 die if $@ && !ref $@;
326
327 last if $self->{h}{connection} =~ /close/ || $self->{version} < 1.1;
328
329 $fh->timeout($::PER_TIMEOUT);
256 #} 330 }
257} 331}
258 332
259# uri => path mapping 333# uri => path mapping
260sub map_uri { 334sub map_uri {
261 my $self = shift; 335 my $self = shift;
262 my $host = $self->{h}{host} || "default"; 336 my $host = $self->{server_name};
263 my $uri = $self->{uri}; 337 my $uri = $self->{uri};
264 338
265 # some massaging, also makes it more secure 339 # some massaging, also makes it more secure
266 $uri =~ s/%([0-9a-fA-F][0-9a-fA-F])/chr hex $1/ge; 340 $uri =~ s/%([0-9a-fA-F][0-9a-fA-F])/chr hex $1/ge;
267 $uri =~ s%//+%/%g; 341 $uri =~ s%//+%/%g;
277 $self->{path} = "$::DOCROOT/$host$uri"; 351 $self->{path} = "$::DOCROOT/$host$uri";
278 352
279 $self->access_check; 353 $self->access_check;
280} 354}
281 355
282sub server_address {
283 my $self = shift;
284 my ($port, $iaddr) = unpack_sockaddr_in $self->{fh}->getsockname
285 or $self->err(500, "unable to get socket name");
286 ((inet_ntoa $iaddr), $port);
287}
288
289sub server_host {
290 my $self = shift;
291 if (exists $self->{h}{host}) {
292 return $self->{h}{host};
293 } else {
294 return (($self->server_address)[0]);
295 }
296}
297
298sub server_hostport {
299 my $self = shift;
300 my ($host, $port);
301 if (exists $self->{h}{host}) {
302 ($host, $port) = ($self->{h}{host}, $self->{server_port});
303 } else {
304 ($host, $port) = $self->server_address;
305 }
306 $port = $port == 80 ? "" : ":$port";
307 $host.$port;
308}
309
310sub _cgi { 356sub _cgi {
311 my $self = shift; 357 my $self = shift;
312 my $path = shift; 358 my $path = shift;
313 my $fh; 359 my $fh;
314 360
315 # no two-way xxx supported 361 # no two-way xxx supported
316 if (0 == fork) { 362 if (0 == fork) {
317 open STDOUT, ">&".fileno($self->{fh}); 363 open STDOUT, ">&".fileno($self->{fh});
318 if (chdir $::DOCROOT) { 364 if (chdir $::DOCROOT) {
319 $ENV{SERVER_SOFTWARE} = "thttpd-myhttpd"; # we are thttpd-alike 365 $ENV{SERVER_SOFTWARE} = "thttpd-myhttpd"; # we are thttpd-alike
320 $ENV{HTTP_HOST} = $self->server_host; 366 $ENV{HTTP_HOST} = $self->{server_name};
321 $ENV{HTTP_PORT} = $self->{server_host}; 367 $ENV{HTTP_PORT} = $self->{server_port};
322 $ENV{SCRIPT_NAME} = $self->{name}; 368 $ENV{SCRIPT_NAME} = $self->{name};
323 exec $path; 369 exec $path;
324 } 370 }
325 Coro::State::_exit(0); 371 Coro::State::_exit(0);
326 } else { 372 } else {
373 die;
327 } 374 }
375}
376
377sub server_hostport {
378 $_[0]{server_port} == 80
379 ? $_[0]{server_name}
380 : "$_[0]{server_name}:$_[0]{server_port}";
328} 381}
329 382
330sub respond { 383sub respond {
331 my $self = shift; 384 my $self = shift;
332 my $path = $self->{path}; 385 my $path = $self->{path};
342 395
343 if (-d _ && -r _) { 396 if (-d _ && -r _) {
344 # directory 397 # directory
345 if ($path !~ /\/$/) { 398 if ($path !~ /\/$/) {
346 # create a redirect to get the trailing "/" 399 # create a redirect to get the trailing "/"
347 my $host = $self->server_hostport; 400 # we don't try to avoid the :80
348 $self->err(301, "moved permanently", { Location => "http://$host$self->{uri}/" }); 401 $self->err(301, "moved permanently", { Location => "http://".$self->server_hostport."$self->{uri}/" });
349 } else { 402 } else {
350 $ims < $self->{stat}[9] 403 $ims < $self->{stat}[9]
351 or $self->err(304, "not modified"); 404 or $self->err(304, "not modified");
352 405
353 if ($self->{method} eq "GET") {
354 if (-r "$path/index.html") { 406 if (-r "$path/index.html") {
355 $self->{path} .= "/index.html"; 407 $self->{path} .= "/index.html";
356 $self->handle_file; 408 $self->handle_file;
357 } else { 409 } else {
358 $self->handle_dir; 410 $self->handle_dir;
359 }
360 } 411 }
361 } 412 }
362 } elsif (-f _ && -r _) { 413 } elsif (-f _ && -r _) {
363 -x _ and $self->err(403, "forbidden"); 414 -x _ and $self->err(403, "forbidden");
364 $self->handle_file; 415 $self->handle_file;
379 $idx); 430 $idx);
380} 431}
381 432
382sub handle_file { 433sub handle_file {
383 my $self = shift; 434 my $self = shift;
384 my $length = -s _; 435 my $length = $self->{stat}[7];
436 my $queue = $::transfers[$length >= $::TRANSFER_SMALL];
385 my $hdr = { 437 my $hdr = {
386 "Last-Modified" => time2str ((stat _)[9]), 438 "Last-Modified" => time2str ((stat _)[9]),
387 }; 439 };
388 440
389 my @code = (200, "ok"); 441 my @code = (200, "ok");
397 ($l, $h) = ($1, ($2 ne "" || $2 >= $length) ? $2 : $length - 1); 449 ($l, $h) = ($1, ($2 ne "" || $2 >= $length) ? $2 : $length - 1);
398 } else { 450 } else {
399 ($l, $h) = (0, $length - 1); 451 ($l, $h) = (0, $length - 1);
400 goto ignore; 452 goto ignore;
401 } 453 }
402 goto satisfiable if $l >= 0 && $l < $length && $h >= 0 && $h > $l; 454 goto satisfiable if $l >= 0 && $l < $length && $h >= 0 && $h >= $l;
403 } 455 }
404 $hdr->{"Content-Range"} = "bytes */$length"; 456 $hdr->{"Content-Range"} = "bytes */$length";
457 $hdr->{"Content-Length"} = $length;
405 $self->err(416, "not satisfiable", $hdr); 458 $self->err(416, "not satisfiable", $hdr, "");
406 459
407satisfiable: 460satisfiable:
408 # check for segmented downloads 461 # check for segmented downloads
409 if ($l && $::NO_SEGMENTED) { 462 if ($l && $::NO_SEGMENTED) {
463 my $delay = $::PER_TIMEOUT + 15;
410 if (%{$uri{$self->{remote_addr}}{$self->{uri}}} > 1) { 464 while (%{$uri{$self->{remote_id}}{$self->{uri}}} > 1) {
465 if ($delay <= 0) {
466 $self->err_segmented_download;
467 } else {
411 Coro::Event::do_timer(after => 15); 468 Coro::Event::do_timer(after => 4); $delay -= 4;
412 469 }
413 $self->err(400, "segmented downloads are not allowed");
414 } 470 }
415 } 471 }
416 472
417 $hdr->{"Content-Range"} = "bytes $l-$h/$length"; 473 $hdr->{"Content-Range"} = "bytes $l-$h/$length";
418 @code = (206, "partial content"); 474 @code = (206, "partial content");
428 $hdr->{"Content-Length"} = $length; 484 $hdr->{"Content-Length"} = $length;
429 485
430 $self->response(@code, $hdr, ""); 486 $self->response(@code, $hdr, "");
431 487
432 if ($self->{method} eq "GET") { 488 if ($self->{method} eq "GET") {
489 $self->{time} = $::NOW;
490
491 my $fudge = $queue->[0]->waiters;
492 $fudge = $fudge ? ($fudge+1)/$fudge : 1;
493
494 $queue->[1] *= $fudge;
495 my $transfer = $queue->[0]->guard;
496
497 if ($fudge != 1) {
498 $queue->[1] /= $fudge;
499 $queue->[1] = $queue->[1] * $::wait_factor
500 + ($::NOW - $self->{time}) * (1 - $::wait_factor);
501 }
502 $self->{time} = $::NOW;
503
504 $self->{fh}->writable or return;
505
433 my ($fh, $buf); 506 my ($fh, $buf, $r);
507 my $current = $Coro::current;
434 open $fh, "<", $self->{path} 508 open $fh, "<", $self->{path}
435 or die "$self->{path}: late open failure ($!)"; 509 or die "$self->{path}: late open failure ($!)";
436 510
437 if ($l) {
438 sysseek $fh, $l, 0
439 or die "$self->{path}: cannot seek to $l ($!)";
440 }
441
442 $h -= $l - 1; 511 $h -= $l - 1;
443 512
513 if (0) {
514 if ($l) {
515 sysseek $fh, $l, 0;
516 }
517 }
518
444 while ($h > 0) { 519 while ($h > 0) {
520 if (0) {
445 $h -= sysread $fh, $buf, $h > $::BUFSIZE ? $::BUFSIZE : $h; 521 sysread $fh, $buf, $h > $::BUFSIZE ? $::BUFSIZE : $h
522 or last;
523 } else {
524 undef $buf;
525 $aio_requests->down;
526 aio_read($fh, $l, ($h > $::BUFSIZE ? $::BUFSIZE : $h),
527 $buf, 0, sub {
528 $r = $_[0];
529 $current->ready;
530 });
531 &Coro::schedule;
532 $aio_requests->up;
533 last unless $r;
534 }
446 my $w = $self->{fh}->syswrite($buf) 535 my $w = $self->{fh}->syswrite($buf)
447 or last; 536 or last;
448 $::written += $w; 537 $::written += $w;
449 $self->{written} += $w; 538 $self->{written} += $w;
539 $l += $r;
450 } 540 }
451 }
452 541
453 close $fh; 542 close $fh;
543 }
454} 544}
455 545
4561; 5461;

Diff Legend

Removed lines
+ Added lines
< Changed lines
> Changed lines