ViewVC Help
View File | Revision Log | Show Annotations | Download File
/cvs/Coro/myhttpd/httpd.pl
(Generate patch)

Comparing Coro/myhttpd/httpd.pl (file contents):
Revision 1.12 by root, Sat Aug 11 23:10:56 2001 UTC vs.
Revision 1.34 by root, Thu Aug 30 02:58:17 2001 UTC

1use Coro; 1use Coro;
2use Coro::Semaphore; 2use Coro::Semaphore;
3use Coro::Event; 3use Coro::Event;
4use Coro::Socket; 4use Coro::Socket;
5 5
6use HTTP::Date;
7
6no utf8; 8no utf8;
7use bytes; 9use bytes;
8 10
9# at least on my machine, this thingy serves files 11# at least on my machine, this thingy serves files
10# quite a bit faster than apache, ;) 12# quite a bit faster than apache, ;)
11# and quite a bit slower than thttpd :( 13# and quite a bit slower than thttpd :(
12 14
13$SIG{PIPE} = 'IGNORE'; 15$SIG{PIPE} = 'IGNORE';
14 16
17our $accesslog;
18
19if ($ACCESS_LOG) {
20 use IO::Handle;
21 open $accesslog, ">>$ACCESS_LOG"
22 or die "$ACCESS_LOG: $!";
23 $accesslog->autoflush(1);
24}
25
15sub slog { 26sub slog {
16 my $level = shift; 27 my $level = shift;
17 my $format = shift; 28 my $format = shift;
18 printf "---: $format\n", @_; 29 printf "---: $format\n", @_;
19} 30}
20 31
21my $connections = new Coro::Semaphore $MAX_CONNECTS; 32our $connections = new Coro::Semaphore $MAX_CONNECTS || 250;
33
34our $wait_factor = 0.95;
35
36our @transfers = (
37 [(new Coro::Semaphore $MAX_TRANSFERS_SMALL || 50), 600],
38 [(new Coro::Semaphore $MAX_TRANSFERS_LARGE || 50), 600],
39);
22 40
23my @newcons; 41my @newcons;
24my @pool; 42my @pool;
25 43
26# one "execution thread" 44# one "execution thread"
43 61
44my $http_port = new Coro::Socket 62my $http_port = new Coro::Socket
45 LocalAddr => $SERVER_HOST, 63 LocalAddr => $SERVER_HOST,
46 LocalPort => $SERVER_PORT, 64 LocalPort => $SERVER_PORT,
47 ReuseAddr => 1, 65 ReuseAddr => 1,
48 Listen => 1, 66 Listen => 50,
49 or die "unable to start server"; 67 or die "unable to start server";
50 68
51push @listen_sockets, $http_port; 69push @listen_sockets, $http_port;
70
71our $NOW;
72our $HTTP_NOW;
73
74Event->timer(interval => 1, hard => 1, cb => sub {
75 $NOW = time;
76 $HTTP_NOW = time2str $NOW;
77})->now;
52 78
53# the "main thread" 79# the "main thread"
54async { 80async {
55 slog 1, "accepting connections"; 81 slog 1, "accepting connections";
56 while () { 82 while () {
57 $connections->down; 83 $connections->down;
58 push @newcons, [$http_port->accept]; 84 push @newcons, [$http_port->accept];
59 #slog 3, "accepted @$connections ".scalar(@pool); 85 #slog 3, "accepted @$connections ".scalar(@pool);
60 $::NOW = time;
61 if (@pool) { 86 if (@pool) {
62 (pop @pool)->ready; 87 (pop @pool)->ready;
63 } else { 88 } else {
64 async \&handler; 89 async \&handler;
65 } 90 }
70package conn; 95package conn;
71 96
72use Socket; 97use Socket;
73use HTTP::Date; 98use HTTP::Date;
74use Convert::Scalar 'weaken'; 99use Convert::Scalar 'weaken';
100use Linux::AIO;
75 101
102Linux::AIO::min_parallel $::AIO_PARALLEL;
103
104my $aio_requests = new Coro::Semaphore $::AIO_PARALLEL * 4;
105
106Event->io(fd => Linux::AIO::poll_fileno,
107 poll => 'r', async => 1,
108 cb => \&Linux::AIO::poll_cb);
109
76our %conn; # $conn{ip}{fh} => connobj 110our %conn; # $conn{ip}{self} => connobj
111our %uri; # $uri{ip}{uri}{self}
77our %blocked; 112our %blocked;
78our %mimetype; 113our %mimetype;
79 114
80sub read_mimetypes { 115sub read_mimetypes {
81 local *M; 116 local *M;
104 $self->{time} = $::NOW; 139 $self->{time} = $::NOW;
105 140
106 # enter ourselves into various lists 141 # enter ourselves into various lists
107 weaken ($conn{$self->{remote_addr}}{$self*1} = $self); 142 weaken ($conn{$self->{remote_addr}}{$self*1} = $self);
108 143
144 $::conns++;
145
109 $self; 146 $self;
110} 147}
111 148
112sub DESTROY { 149sub DESTROY {
113 my $self = shift; 150 my $self = shift;
151
152 $::conns--;
153
154 $self->eoconn;
114 delete $conn{$self->{remote_addr}}{$self*1}; 155 delete $conn{$self->{remote_addr}}{$self*1};
156}
157
158# end of connection
159sub eoconn {
160 my $self = shift;
115 delete $uri{$self->{uri}}{$self*1}; 161 delete $uri{$self->{remote_addr}}{$self->{uri}}{$self*1};
116} 162}
117 163
118sub slog { 164sub slog {
119 my $self = shift; 165 my $self = shift;
120 main::slog($_[0], "$self->{remote_addr}> $_[1]"); 166 main::slog($_[0], ($self->{remote_id} || $self->{remote_addr}) ."> $_[1]");
121} 167}
122 168
123sub response { 169sub response {
124 my ($self, $code, $msg, $hdr, $content) = @_; 170 my ($self, $code, $msg, $hdr, $content) = @_;
125 my $res = "HTTP/1.0 $code $msg\015\012"; 171 my $res = "HTTP/1.1 $code $msg\015\012";
126 172
127 $res .= "Connection: close\015\012"; 173 $self->{h}{connection} ||= $hdr->{Connection};
128 $res .= "Date: ".(time2str $::NOW)."\015\012"; # slow? nah. :( 174
175 $res .= "Date: $HTTP_NOW\015\012";
129 176
130 while (my ($h, $v) = each %$hdr) { 177 while (my ($h, $v) = each %$hdr) {
131 $res .= "$h: $v\015\012" 178 $res .= "$h: $v\015\012"
132 } 179 }
133 $res .= "\015\012"; 180 $res .= "\015\012";
134 181
135 $res .= $content if defined $content and $self->{method} eq "GET"; 182 $res .= $content if defined $content and $self->{method} ne "HEAD";
136 183
137 print STDERR "$self->{remote_addr} \"$self->{uri}\" $code ".$hdr->{"Content-Length"}." \"$self->{h}{referer}\"\n";#d# 184 my $log = "$self->{remote_addr} \"$self->{uri}\" $code ".$hdr->{"Content-Length"}." \"$self->{h}{referer}\"\n";
185
186 print $accesslog $log if $accesslog;
187 print STDERR $log;
138 188
139 $self->{written} += 189 $self->{written} +=
140 print {$self->{fh}} $res; 190 print {$self->{fh}} $res;
141} 191}
142 192
147 unless (defined $content) { 197 unless (defined $content) {
148 $content = "$code $msg"; 198 $content = "$code $msg";
149 $hdr->{"Content-Type"} = "text/plain"; 199 $hdr->{"Content-Type"} = "text/plain";
150 $hdr->{"Content-Length"} = length $content; 200 $hdr->{"Content-Length"} = length $content;
151 } 201 }
202 $hdr->{"Connection"} = "close";
152 203
153 $self->response($code, $msg, $hdr, $content); 204 $self->response($code, $msg, $hdr, $content);
154 205
155 die bless {}, err::; 206 die bless {}, err::;
156} 207}
157 208
158sub err_blocked {
159 my $self = shift;
160 my $ip = $self->{remote_addr};
161 my $time = time2str $blocked{$ip} = $::NOW + $::BLOCKTIME;
162
163 Coro::Event::do_timer(after => 5);
164
165 $self->err(403, "too many connections",
166 {
167 "Content-Type" => "text/html",
168 "Retry-After" => $::BLOCKTIME
169 },
170 <<EOF);
171<html><p>
172You have been blocked because you opened too many connections. You
173may retry at</p>
174
175 <p><blockquote>$time.</blockquote></p>
176
177<p>Until then, each new access will renew the block. You might want to have a
178look at the <a href="http://www.goof.com/pcg/marc/animefaq.html">FAQ</a>.</p>
179</html>
180EOF
181}
182
183sub handle { 209sub handle {
184 my $self = shift; 210 my $self = shift;
185 my $fh = $self->{fh}; 211 my $fh = $self->{fh};
186 212
213 my $host;
214
215 $fh->timeout($::REQ_TIMEOUT);
187 #while() { 216 while() {
217 $self->{reqs}++;
218
219 # read request and parse first line
220 my $req = $fh->readline("\015\012\015\012");
221
222 unless (defined $req) {
223 if (exists $self->{version}) {
224 last;
225 } else {
226 $self->err(408, "request timeout");
227 }
228 }
229
188 $self->{h} = {}; 230 $self->{h} = {};
189 231
190 # read request and parse first line
191 $fh->timeout($::REQ_TIMEOUT);
192 my $req = $fh->readline("\015\012\015\012");
193 $fh->timeout($::RES_TIMEOUT); 232 $fh->timeout($::RES_TIMEOUT);
194
195 defined $req or
196 $self->err(408, "request timeout");
197
198 my $ip = $self->{remote_addr}; 233 my $ip = $self->{remote_addr};
199 234
200 if ($blocked{$ip}) { 235 if ($blocked{$ip}) {
201 $self->err_blocked($blocked{$ip}) 236 $self->err_blocked($blocked{$ip})
202 if $blocked{$ip} > $::NOW; 237 if $blocked{$ip} > $::NOW;
203 238
204 delete $blocked{$ip}; 239 delete $blocked{$ip};
205 } 240 }
206 241
207 if (%{$conn{$ip}} > $::MAX_CONN_IP) { 242 if (%{$conn{$ip}} > $::MAX_CONN_IP) {
243 my $delay = 120;
244 while (%{$conn{$ip}} > $::MAX_CONN_IP) {
245 if ($delay <= 0) {
208 $self->slog(2, "blocked ip $ip"); 246 $self->slog(2, "blocked ip $ip");
209 $self->err_blocked; 247 $self->err_blocked;
248 } else {
249 Coro::Event::do_timer(after => 3);
250 $delay -= 3;
251 }
252 }
210 } 253 }
211 254
212 $req =~ /^(?:\015\012)? 255 $req =~ /^(?:\015\012)?
213 (GET|HEAD) \040+ 256 (GET|HEAD) \040+
214 ([^\040]+) \040+ 257 ([^\040]+) \040+
215 HTTP\/([0-9]+\.[0-9]+) 258 HTTP\/([0-9]+\.[0-9]+)
216 \015\012/gx 259 \015\012/gx
217 or $self->err(403, "method not allowed", { Allow => "GET,HEAD" }); 260 or $self->err(405, "method not allowed", { Allow => "GET,HEAD" });
218
219 $2 ne "1.0"
220 or $self->err(506, "http protocol version not supported");
221 261
222 $self->{method} = $1; 262 $self->{method} = $1;
223 $self->{uri} = $2; 263 $self->{uri} = $2;
264 $self->{version} = $3;
265
266 $3 =~ /^1\./
267 or $self->err(506, "http protocol version $3 not supported");
224 268
225 # parse headers 269 # parse headers
226 { 270 {
227 my (%hdr, $h, $v); 271 my (%hdr, $h, $v);
228 272
239 283
240 $self->{h}{$h} = substr $v, 1 284 $self->{h}{$h} = substr $v, 1
241 while ($h, $v) = each %hdr; 285 while ($h, $v) = each %hdr;
242 } 286 }
243 287
288 # find out server name and port
289 if ($self->{uri} =~ s/^http:\/\/([^\/?#]*)//i) {
290 $host = $1;
291 } else {
292 $host = $self->{h}{host};
293 }
294
295 if (defined $host) {
244 $self->{server_port} = $self->{h}{host} =~ s/:([0-9]+)$// ? $1 : 80; 296 $self->{server_port} = $host =~ s/:([0-9]+)$// ? $1 : 80;
297 } else {
298 ($self->{server_port}, $host)
299 = unpack_sockaddr_in $self->{fh}->getsockname
300 or $self->err(500, "unable to get socket name");
301 $host = inet_ntoa $host;
302 }
245 303
304 $self->{server_name} = $host;
305
306 # remote id should be unique per user
307 $self->{remote_id} = $self->{remote_addr};
308
309 if (exists $self->{h}{"client-ip"}) {
310 $self->{remote_id} .= "[".$self->{h}{"client-ip"}."]";
311 } elsif (exists $self->{h}{"x-forwarded-for"}) {
312 $self->{remote_id} .= "[".$self->{h}{"x-forwarded-for"}."]";
313 }
314
246 weaken ($uri{$self->{uri}}{$self*1} = $self); 315 weaken ($uri{$self->{remote_addr}}{$self->{uri}}{$self*1} = $self);
247 316
317 eval {
248 $self->map_uri; 318 $self->map_uri;
249 $self->respond; 319 $self->respond;
320 };
321
322 $self->eoconn;
323
324 die if $@ && !ref $@;
325
326 last if $self->{h}{connection} =~ /close/ || $self->{version} < 1.1;
327
328 $fh->timeout($::PER_TIMEOUT);
250 #} 329 }
251} 330}
252 331
253# uri => path mapping 332# uri => path mapping
254sub map_uri { 333sub map_uri {
255 my $self = shift; 334 my $self = shift;
256 my $host = $self->{h}{host} || "default"; 335 my $host = $self->{server_name};
257 my $uri = $self->{uri}; 336 my $uri = $self->{uri};
258 337
259 # some massaging, also makes it more secure 338 # some massaging, also makes it more secure
260 $uri =~ s/%([0-9a-fA-F][0-9a-fA-F])/chr hex $1/ge; 339 $uri =~ s/%([0-9a-fA-F][0-9a-fA-F])/chr hex $1/ge;
261 $uri =~ s%//+%/%g; 340 $uri =~ s%//+%/%g;
271 $self->{path} = "$::DOCROOT/$host$uri"; 350 $self->{path} = "$::DOCROOT/$host$uri";
272 351
273 $self->access_check; 352 $self->access_check;
274} 353}
275 354
276sub server_address {
277 my $self = shift;
278 my ($port, $iaddr) = unpack_sockaddr_in $self->{fh}->getsockname
279 or $self->err(500, "unable to get socket name");
280 ((inet_ntoa $iaddr), $port);
281}
282
283sub server_host {
284 my $self = shift;
285 if (exists $self->{h}{host}) {
286 return $self->{h}{host};
287 } else {
288 return (($self->server_address)[0]);
289 }
290}
291
292sub server_hostport {
293 my $self = shift;
294 my ($host, $port);
295 if (exists $self->{h}{host}) {
296 ($host, $port) = ($self->{h}{host}, $self->{server_port});
297 } else {
298 ($host, $port) = $self->server_address;
299 }
300 $port = $port == 80 ? "" : ":$port";
301 $host.$port;
302}
303
304sub _cgi { 355sub _cgi {
305 my $self = shift; 356 my $self = shift;
306 my $path = shift; 357 my $path = shift;
307 my $fh; 358 my $fh;
308 359
309 # no two-way xxx supported 360 # no two-way xxx supported
310 if (0 == fork) { 361 if (0 == fork) {
311 open STDOUT, ">&".fileno($self->{fh}); 362 open STDOUT, ">&".fileno($self->{fh});
312 if (chdir $::DOCROOT) { 363 if (chdir $::DOCROOT) {
313 $ENV{SERVER_SOFTWARE} = "thttpd-myhttpd"; # we are thttpd-alike 364 $ENV{SERVER_SOFTWARE} = "thttpd-myhttpd"; # we are thttpd-alike
314 $ENV{HTTP_HOST} = $self->server_host; 365 $ENV{HTTP_HOST} = $self->{server_name};
315 $ENV{HTTP_PORT} = $self->{server_host}; 366 $ENV{HTTP_PORT} = $self->{server_port};
316 $ENV{SCRIPT_NAME} = $self->{name}; 367 $ENV{SCRIPT_NAME} = $self->{name};
317 exec $path; 368 exec $path;
318 } 369 }
319 Coro::State::_exit(0); 370 Coro::State::_exit(0);
320 } else { 371 } else {
372 die;
321 } 373 }
374}
375
376sub server_hostport {
377 $_[0]{server_port} == 80
378 ? $_[0]{server_name}
379 : "$_[0]{server_name}:$_[0]{server_port}";
322} 380}
323 381
324sub respond { 382sub respond {
325 my $self = shift; 383 my $self = shift;
326 my $path = $self->{path}; 384 my $path = $self->{path};
336 394
337 if (-d _ && -r _) { 395 if (-d _ && -r _) {
338 # directory 396 # directory
339 if ($path !~ /\/$/) { 397 if ($path !~ /\/$/) {
340 # create a redirect to get the trailing "/" 398 # create a redirect to get the trailing "/"
341 my $host = $self->server_hostport; 399 # we don't try to avoid the :80
342 $self->err(301, "moved permanently", { Location => "http://$host$self->{uri}/" }); 400 $self->err(301, "moved permanently", { Location => "http://".$self->server_hostport."$self->{uri}/" });
343 } else { 401 } else {
344 $ims < $self->{stat}[9] 402 $ims < $self->{stat}[9]
345 or $self->err(304, "not modified"); 403 or $self->err(304, "not modified");
346 404
347 if ($self->{method} eq "GET") {
348 if (-r "$path/index.html") { 405 if (-r "$path/index.html") {
349 $self->{path} .= "/index.html"; 406 $self->{path} .= "/index.html";
350 $self->handle_file; 407 $self->handle_file;
351 } else { 408 } else {
352 $self->handle_dir; 409 $self->handle_dir;
353 }
354 } 410 }
355 } 411 }
356 } elsif (-f _ && -r _) { 412 } elsif (-f _ && -r _) {
357 -x _ and $self->err(403, "forbidden"); 413 -x _ and $self->err(403, "forbidden");
358 $self->handle_file; 414 $self->handle_file;
373 $idx); 429 $idx);
374} 430}
375 431
376sub handle_file { 432sub handle_file {
377 my $self = shift; 433 my $self = shift;
378 my $length = -s _; 434 my $length = $self->{stat}[7];
435 my $queue = $::transfers[$length >= $::TRANSFER_SMALL];
379 my $hdr = { 436 my $hdr = {
380 "Last-Modified" => time2str ((stat _)[9]), 437 "Last-Modified" => time2str ((stat _)[9]),
381 }; 438 };
382 439
383 my @code = (200, "ok"); 440 my @code = (200, "ok");
391 ($l, $h) = ($1, ($2 ne "" || $2 >= $length) ? $2 : $length - 1); 448 ($l, $h) = ($1, ($2 ne "" || $2 >= $length) ? $2 : $length - 1);
392 } else { 449 } else {
393 ($l, $h) = (0, $length - 1); 450 ($l, $h) = (0, $length - 1);
394 goto ignore; 451 goto ignore;
395 } 452 }
396 goto satisfiable if $l >= 0 && $l < $length && $h >= 0 && $h > $l; 453 goto satisfiable if $l >= 0 && $l < $length && $h >= 0 && $h >= $l;
397 } 454 }
398 $hdr->{"Content-Range"} = "bytes */$length"; 455 $hdr->{"Content-Range"} = "bytes */$length";
456 $hdr->{"Content-Length"} = $length;
457 $self->slog(9, "not satisfiable($self->{h}{range}|".$self->{h}{"user-agent"}.")");
399 $self->err(416, "not satisfiable", $hdr); 458 $self->err(416, "not satisfiable", $hdr, "");
400 459
401satisfiable: 460satisfiable:
402 # check for segmented downloads 461 # check for segmented downloads
403 if ($l && $::NO_SEGMENTED) { 462 if ($l && $::NO_SEGMENTED) {
404 if (%{$uri{$self->{uri}}} > 1) { 463 my $delay = 180;
405 $self->err(400, "segmented downloads are not allowed"); 464 while (%{$uri{$self->{remote_addr}}{$self->{uri}}} > 1) {
465 if ($delay <= 0) {
466 $self->err_segmented_download;
467 } else {
468 Coro::Event::do_timer(after => 3); $delay -= 3;
469 }
406 } 470 }
407 } 471 }
408 472
409 $hdr->{"Content-Range"} = "bytes $l-$h/$length"; 473 $hdr->{"Content-Range"} = "bytes $l-$h/$length";
410 @code = (206, "partial content"); 474 @code = (206, "partial content");
420 $hdr->{"Content-Length"} = $length; 484 $hdr->{"Content-Length"} = $length;
421 485
422 $self->response(@code, $hdr, ""); 486 $self->response(@code, $hdr, "");
423 487
424 if ($self->{method} eq "GET") { 488 if ($self->{method} eq "GET") {
489 $self->{time} = $::NOW;
490
491 my $transfer = $queue->[0]->guard;
492 $self->{fh}->writable or return;
493
494 $queue->[1] = $queue->[1] * $::wait_factor
495 + ($::NOW - $self->{time}) * (1 - $::wait_factor);
496 $self->{time} = $::NOW;
497
425 my ($fh, $buf); 498 my ($fh, $buf, $r);
499 my $current = $Coro::current;
426 open $fh, "<", $self->{path} 500 open $fh, "<", $self->{path}
427 or die "$self->{path}: late open failure ($!)"; 501 or die "$self->{path}: late open failure ($!)";
428 502
429 if ($l) {
430 sysseek $fh, $l, 0
431 or die "$self->{path}: cannot seek to $l ($!)";
432 }
433
434 $h -= $l - 1; 503 $h -= $l - 1;
435 504
505 if (0) {
506 if ($l) {
507 sysseek $fh, $l, 0;
508 }
509 }
510
436 while ($h > 0) { 511 while ($h > 0) {
512 if (0) {
437 $h -= sysread $fh, $buf, $h > $::BUFSIZE ? $::BUFSIZE : $h; 513 sysread $fh, $buf, $h > $::BUFSIZE ? $::BUFSIZE : $h
514 or last;
515 } else {
516 undef $buf;
517 $aio_requests->down;
518 aio_read($fh, $l, ($h > $::BUFSIZE ? $::BUFSIZE : $h),
519 $buf, 0, sub {
520 $r = $_[0];
521 $current->ready;
522 });
523 &Coro::schedule;
524 $aio_requests->up;
525 last unless $r;
526 }
438 my $w = $self->{fh}->syswrite($buf) 527 my $w = $self->{fh}->syswrite($buf)
439 or last; 528 or last;
440 $::written += $w; 529 $::written += $w;
441 $self->{written} += $w; 530 $self->{written} += $w;
531 $l += $r;
442 } 532 }
443 }
444 533
445 close $fh; 534 close $fh;
535 }
446} 536}
447 537
4481; 5381;

Diff Legend

- Removed lines
+ Added lines
< Changed lines
> Changed lines