ViewVC Help
View File | Revision Log | Show Annotations | Download File
/cvs/cvsroot/Coro/myhttpd/httpd.pl
(Generate patch)

Comparing cvsroot/Coro/myhttpd/httpd.pl (file contents):
Revision 1.9 by root, Sat Aug 11 12:49:21 2001 UTC vs.
Revision 1.29 by root, Sat Aug 25 15:14:03 2001 UTC

9# at least on my machine, this thingy serves files 9# at least on my machine, this thingy serves files
10# quite a bit faster than apache, ;) 10# quite a bit faster than apache, ;)
11# and quite a bit slower than thttpd :( 11# and quite a bit slower than thttpd :(
12 12
13$SIG{PIPE} = 'IGNORE'; 13$SIG{PIPE} = 'IGNORE';
14 14
15our $accesslog;
16
17if ($ACCESS_LOG) {
18 use IO::Handle;
19 open $accesslog, ">>$ACCESS_LOG"
20 or die "$ACCESS_LOG: $!";
21 $accesslog->autoflush(1);
22}
23
15sub slog { 24sub slog {
16 my $level = shift; 25 my $level = shift;
17 my $format = shift; 26 my $format = shift;
18 printf "---: $format\n", @_; 27 printf "---: $format\n", @_;
19} 28}
43 52
44my $http_port = new Coro::Socket 53my $http_port = new Coro::Socket
45 LocalAddr => $SERVER_HOST, 54 LocalAddr => $SERVER_HOST,
46 LocalPort => $SERVER_PORT, 55 LocalPort => $SERVER_PORT,
47 ReuseAddr => 1, 56 ReuseAddr => 1,
48 Listen => 1, 57 Listen => 50,
49 or die "unable to start server"; 58 or die "unable to start server";
50 59
51push @listen_sockets, $http_port; 60push @listen_sockets, $http_port;
52 61
53# the "main thread" 62# the "main thread"
70package conn; 79package conn;
71 80
72use Socket; 81use Socket;
73use HTTP::Date; 82use HTTP::Date;
74use Convert::Scalar 'weaken'; 83use Convert::Scalar 'weaken';
84use Linux::AIO;
75 85
86Linux::AIO::min_parallel $::AIO_PARALLEL;
87
88my $aio_requests = new Coro::Semaphore $::AIO_PARALLEL * 4;
89
90Event->io(fd => Linux::AIO::poll_fileno,
91 poll => 'r', async => 1,
92 cb => \&Linux::AIO::poll_cb);
93
76our %conn; # $conn{ip}{fh} => connobj 94our %conn; # $conn{ip}{self} => connobj
95our %uri; # $uri{ip}{uri}{self}
77our %blocked; 96our %blocked;
78our %mimetype; 97our %mimetype;
79 98
80sub read_mimetypes { 99sub read_mimetypes {
81 local *M; 100 local *M;
82 if (open M, "<mimetypes") { 101 if (open M, "<mime_types") {
83 while (<M>) { 102 while (<M>) {
84 if (/^([^#]\S+)\t+(\S+)$/) { 103 if (/^([^#]\S+)\t+(\S+)$/) {
85 $mimetype{lc $1} = $2; 104 $mimetype{lc $1} = $2;
86 } 105 }
87 } 106 }
88 } else { 107 } else {
89 $self->slog(1, "cannot open mimetypes\n"); 108 print "cannot open mime_types\n";
90 } 109 }
91} 110}
111
112read_mimetypes;
92 113
93sub new { 114sub new {
94 my $class = shift; 115 my $class = shift;
95 my $peername = shift; 116 my $peername = shift;
96 my $fh = shift; 117 my $fh = shift;
97 my $self = bless { fh => $fh }, $class; 118 my $self = bless { fh => $fh }, $class;
98 my (undef, $iaddr) = unpack_sockaddr_in $peername 119 my (undef, $iaddr) = unpack_sockaddr_in $peername
99 or $self->err(500, "unable to decode peername"); 120 or $self->err(500, "unable to decode peername");
100 121
101 $self->{remote_addr} = inet_ntoa $iaddr; 122 $self->{remote_addr} = inet_ntoa $iaddr;
123 $self->{time} = $::NOW;
102 124
103 # enter ourselves into various lists 125 # enter ourselves into various lists
104 weaken ($conn{$self->{remote_addr}}{$self*1} = $self); 126 weaken ($conn{$self->{remote_addr}}{$self*1} = $self);
105 127
128 $::conns++;
129
106 $self; 130 $self;
107} 131}
108 132
109sub DESTROY { 133sub DESTROY {
110 my $self = shift; 134 my $self = shift;
135
136 $::conns--;
137
138 $self->eoconn;
111 delete $conn{$self->{remote_addr}}{$self*1}; 139 delete $conn{$self->{remote_addr}}{$self*1};
140}
141
142# end of connection
143sub eoconn {
144 my $self = shift;
112 delete $uri{$self->{uri}}{$self*1}; 145 delete $uri{$self->{remote_addr}}{$self->{uri}}{$self*1};
113} 146}
114 147
115sub slog { 148sub slog {
116 my $self = shift; 149 my $self = shift;
117 main::slog($_[0], "$self->{remote_addr}> $_[1]"); 150 main::slog($_[0], ($self->{remote_id} || $self->{remote_addr}) ."> $_[1]");
118} 151}
119 152
120sub response { 153sub response {
121 my ($self, $code, $msg, $hdr, $content) = @_; 154 my ($self, $code, $msg, $hdr, $content) = @_;
122 my $res = "HTTP/1.0 $code $msg\015\012"; 155 my $res = "HTTP/1.1 $code $msg\015\012";
123 156
124 $res .= "Connection: close\015\012"; 157 $self->{h}{connection} ||= $hdr->{Connection};
158
125 $res .= "Date: ".(time2str $::NOW)."\015\012"; # slow? nah. :( 159 $res .= "Date: ".(time2str $::NOW)."\015\012"; # slow? nah. :(
126 160
127 while (my ($h, $v) = each %$hdr) { 161 while (my ($h, $v) = each %$hdr) {
128 $res .= "$h: $v\015\012" 162 $res .= "$h: $v\015\012"
129 } 163 }
164 $res .= "\015\012";
130 165
131 $res .= "\015\012$content" if defined $content; 166 $res .= $content if defined $content and $self->{method} ne "HEAD";
132 167
133 print STDERR "$self->{remote_addr} \"$self->{uri}\" $code ".$hdr->{"Content-Length"}." \"$self->{h}{referer}\"\n";#d# 168 my $log = "$self->{remote_addr} \"$self->{uri}\" $code ".$hdr->{"Content-Length"}." \"$self->{h}{referer}\"\n";
134 169
170 print $accesslog $log if $accesslog;
171 print STDERR $log;
172
173 $self->{written} +=
135 print {$self->{fh}} $res; 174 print {$self->{fh}} $res;
136} 175}
137 176
138sub err { 177sub err {
139 my $self = shift; 178 my $self = shift;
140 my ($code, $msg, $hdr, $content) = @_; 179 my ($code, $msg, $hdr, $content) = @_;
142 unless (defined $content) { 181 unless (defined $content) {
143 $content = "$code $msg"; 182 $content = "$code $msg";
144 $hdr->{"Content-Type"} = "text/plain"; 183 $hdr->{"Content-Type"} = "text/plain";
145 $hdr->{"Content-Length"} = length $content; 184 $hdr->{"Content-Length"} = length $content;
146 } 185 }
186 $hdr->{"Connection"} = "close";
147 187
148 $self->response($code, $msg, $hdr, $content); 188 $self->response($code, $msg, $hdr, $content);
149 189
150 die bless {}, err::; 190 die bless {}, err::;
151} 191}
152 192
153sub err_blocked { 193sub err_blocked {
154 my $self = shift; 194 my $self = shift;
155 my $ip = $self->{remote_addr}; 195 my $ip = $self->{remote_addr};
156 my $time = time2str $blocked{$ip} = $::NOW + $::BLOCKTIME; 196 my $time = time2str $blocked{$ip} = $::NOW + $::BLOCKTIME;
197
198 Coro::Event::do_timer(after => 20*rand);
199
157 $self->err(403, "too many connections", 200 $self->err(401, "too many connections",
158 { 201 {
159 "Content-Type" => "text/html", 202 "Content-Type" => "text/html",
160 "Retry-After" => $::BLOCKTIME 203 "Retry-After" => $::BLOCKTIME,
204 "Warning" => "Please do NOT retry, you have been blocked",
205 "WWW-Authenticate" => "Basic realm=\"Please do NOT retry, you have been blocked\"",
206 "Connection" => "close",
161 }, 207 },
162 <<EOF); 208 <<EOF);
163<html><p> 209<html>
210<head>
211<title>Too many connections</title>
212</head>
213<body bgcolor="#ffffff" text="#000000" link="#0000ff" vlink="#000080" alink="#ff0000">
214
164You have been blocked because you opened too many connections. You 215<p>You have been blocked because you opened too many connections. You
165may retry at</p> 216may retry at</p>
166 217
167 <p><blockquote>$time.</blockquote></p> 218 <p><blockquote>$time.</blockquote></p>
168 219
169<p>Until then, each new access will renew the block. You might want to have a 220<p>Until then, each new access will renew the block. You might want to have a
170look at the <a href="http://www.goof.com/pcg/marc/animefaq.html">FAQ</a>.</p> 221look at the <a href="http://www.goof.com/pcg/marc/animefaq.html#connectionlimit">FAQ</a>.</p>
171</html> 222
223</body></html>
172EOF 224EOF
173} 225}
174 226
175sub handle { 227sub handle {
176 my $self = shift; 228 my $self = shift;
177 my $fh = $self->{fh}; 229 my $fh = $self->{fh};
178 230
231 my $host;
232
233 $fh->timeout($::REQ_TIMEOUT);
179 #while() { 234 while() {
235 $self->{reqs}++;
236
237 # read request and parse first line
238 my $req = $fh->readline("\015\012\015\012");
239
240 unless (defined $req) {
241 if (exists $self->{version}) {
242 last;
243 } else {
244 $self->err(408, "request timeout");
245 }
246 }
247
180 $self->{h} = {}; 248 $self->{h} = {};
181 249
182 # read request and parse first line
183 $fh->timeout($::REQ_TIMEOUT);
184 my $req = $fh->readline("\015\012\015\012");
185 $fh->timeout($::RES_TIMEOUT); 250 $fh->timeout($::RES_TIMEOUT);
186
187 defined $req or
188 $self->err(408, "request timeout");
189
190 my $ip = $self->{remote_addr}; 251 my $ip = $self->{remote_addr};
191 252
192 if ($blocked{$ip}) { 253 if ($blocked{$ip}) {
193 $self->err_blocked($blocked{$ip}) 254 $self->err_blocked($blocked{$ip})
194 if $blocked{$ip} > $::NOW; 255 if $blocked{$ip} > $::NOW;
195 256
196 delete $blocked{$ip}; 257 delete $blocked{$ip};
197 } 258 }
198 259
199 if (%{$conn{$ip}} > $::MAX_CONN_IP) { 260 if (%{$conn{$ip}} > $::MAX_CONN_IP) {
200 $self->slog("blocked ip $ip"); 261 $self->slog(2, "blocked ip $ip");
201 $self->err_blocked; 262 $self->err_blocked;
202 } 263 }
203 264
204 $req =~ /^(?:\015\012)? 265 $req =~ /^(?:\015\012)?
205 (GET|HEAD) \040+ 266 (GET|HEAD) \040+
206 ([^\040]+) \040+ 267 ([^\040]+) \040+
207 HTTP\/([0-9]+\.[0-9]+) 268 HTTP\/([0-9]+\.[0-9]+)
208 \015\012/gx 269 \015\012/gx
209 or $self->err(403, "method not allowed", { Allow => "GET,HEAD" }); 270 or $self->err(405, "method not allowed", { Allow => "GET,HEAD" });
210
211 $2 ne "1.0"
212 or $self->err(506, "http protocol version not supported");
213 271
214 $self->{method} = $1; 272 $self->{method} = $1;
215 $self->{uri} = $2; 273 $self->{uri} = $2;
274 $self->{version} = $3;
275
276 $3 =~ /^1\./
277 or $self->err(506, "http protocol version $3 not supported");
216 278
217 # parse headers 279 # parse headers
218 { 280 {
219 my (%hdr, $h, $v); 281 my (%hdr, $h, $v);
220 282
231 293
232 $self->{h}{$h} = substr $v, 1 294 $self->{h}{$h} = substr $v, 1
233 while ($h, $v) = each %hdr; 295 while ($h, $v) = each %hdr;
234 } 296 }
235 297
298 # find out server name and port
299 if ($self->{uri} =~ s/^http:\/\/([^\/?#]*)//i) {
300 $host = $1;
301 } else {
302 $host = $self->{h}{host};
303 }
304
305 if (defined $host) {
236 $self->{server_port} = $self->{h}{host} =~ s/:([0-9]+)$// ? $1 : 80; 306 $self->{server_port} = $host =~ s/:([0-9]+)$// ? $1 : 80;
307 } else {
308 ($self->{server_port}, $host)
309 = unpack_sockaddr_in $self->{fh}->getsockname
310 or $self->err(500, "unable to get socket name");
311 $host = inet_ntoa $host;
312 }
237 313
314 $self->{server_name} = $host;
315
316 # remote id should be unique per user
317 $self->{remote_id} = $self->{remote_addr};
318
319 if (exists $self->{h}{"client-ip"}) {
320 $self->{remote_id} .= "[".$self->{h}{"client-ip"}."]";
321 } elsif (exists $self->{h}{"x-forwarded-for"}) {
322 $self->{remote_id} .= "[".$self->{h}{"x-forwarded-for"}."]";
323 }
324
238 weaken ($uri{$self->{uri}}{$self*1} = $self); 325 weaken ($uri{$self->{remote_addr}}{$self->{uri}}{$self*1} = $self);
239 326
327 eval {
240 $self->map_uri; 328 $self->map_uri;
241 $self->respond; 329 $self->respond;
330 };
331
332 $self->eoconn;
333
334 die if $@ && !ref $@;
335
336 last if $self->{h}{connection} =~ /close/ || $self->{version} < 1.1;
337
338 $fh->timeout($::PER_TIMEOUT);
242 #} 339 }
243} 340}
244 341
245# uri => path mapping 342# uri => path mapping
246sub map_uri { 343sub map_uri {
247 my $self = shift; 344 my $self = shift;
248 my $host = $self->{h}{host} || "default"; 345 my $host = $self->{server_name};
249 my $uri = $self->{uri}; 346 my $uri = $self->{uri};
250 347
251 # some massaging, also makes it more secure 348 # some massaging, also makes it more secure
252 $uri =~ s/%([0-9a-fA-F][0-9a-fA-F])/chr hex $1/ge; 349 $uri =~ s/%([0-9a-fA-F][0-9a-fA-F])/chr hex $1/ge;
253 $uri =~ s%//+%/%g; 350 $uri =~ s%//+%/%g;
263 $self->{path} = "$::DOCROOT/$host$uri"; 360 $self->{path} = "$::DOCROOT/$host$uri";
264 361
265 $self->access_check; 362 $self->access_check;
266} 363}
267 364
268sub server_address {
269 my $self = shift;
270 my ($port, $iaddr) = unpack_sockaddr_in $self->{fh}->getsockname
271 or $self->err(500, "unable to get socket name");
272 ((inet_ntoa $iaddr), $port);
273}
274
275sub server_host {
276 my $self = shift;
277 if (exists $self->{h}{host}) {
278 return $self->{h}{host};
279 } else {
280 return (($self->server_address)[0]);
281 }
282}
283
284sub server_hostport {
285 my $self = shift;
286 my ($host, $port);
287 if (exists $self->{h}{host}) {
288 ($host, $port) = ($self->{h}{host}, $self->{server_port});
289 } else {
290 ($host, $port) = $self->server_address;
291 }
292 $port = $port == 80 ? "" : ":$port";
293 $host.$port;
294}
295
296sub _cgi { 365sub _cgi {
297 my $self = shift; 366 my $self = shift;
298 my $path = shift; 367 my $path = shift;
299 my $fh; 368 my $fh;
300 369
301 # no two-way xxx supported 370 # no two-way xxx supported
302 if (0 == fork) { 371 if (0 == fork) {
303 open STDOUT, ">&".fileno($self->{fh}); 372 open STDOUT, ">&".fileno($self->{fh});
304 if (chdir $::DOCROOT) { 373 if (chdir $::DOCROOT) {
305 $ENV{SERVER_SOFTWARE} = "thttpd-myhttpd"; # we are thttpd-alike 374 $ENV{SERVER_SOFTWARE} = "thttpd-myhttpd"; # we are thttpd-alike
306 $ENV{HTTP_HOST} = $self->server_host; 375 $ENV{HTTP_HOST} = $self->{server_name};
307 $ENV{HTTP_PORT} = $self->{server_host}; 376 $ENV{HTTP_PORT} = $self->{server_port};
308 $ENV{SCRIPT_NAME} = $self->{name}; 377 $ENV{SCRIPT_NAME} = $self->{name};
309 exec $::INDEXPROG; 378 exec $path;
310 } 379 }
311 Coro::State::_exit(0); 380 Coro::State::_exit(0);
312 } else { 381 } else {
382 die;
313 } 383 }
384}
385
386sub server_hostport {
387 $_[0]{server_port} == 80
388 ? $_[0]{server_name}
389 : "$_[0]{server_name}:$_[0]{server_port}";
314} 390}
315 391
316sub respond { 392sub respond {
317 my $self = shift; 393 my $self = shift;
318 my $path = $self->{path}; 394 my $path = $self->{path};
319 395
320 stat $path 396 stat $path
321 or $self->err(404, "not found"); 397 or $self->err(404, "not found");
398
399 $self->{stat} = [stat _];
322 400
323 # idiotic netscape sends idiotic headers AGAIN 401 # idiotic netscape sends idiotic headers AGAIN
324 my $ims = $self->{h}{"if-modified-since"} =~ /^([^;]+)/ 402 my $ims = $self->{h}{"if-modified-since"} =~ /^([^;]+)/
325 ? str2time $1 : 0; 403 ? str2time $1 : 0;
326 404
327 if (-d _ && -r _) { 405 if (-d _ && -r _) {
328 # directory 406 # directory
329 if ($path !~ /\/$/) { 407 if ($path !~ /\/$/) {
330 # create a redirect to get the trailing "/" 408 # create a redirect to get the trailing "/"
331 my $host = $self->server_hostport; 409 # we don't try to avoid the :80
332 $self->err(301, "moved permanently", { Location => "http://$host$self->{uri}/" }); 410 $self->err(301, "moved permanently", { Location => "http://".$self->server_hostport."$self->{uri}/" });
333 } else { 411 } else {
334 $ims < (stat _)[9] 412 $ims < $self->{stat}[9]
335 or $self->err(304, "not modified"); 413 or $self->err(304, "not modified");
336 414
337 if ($self->{method} eq "GET") {
338 if (-r "$path/index.html") { 415 if (-r "$path/index.html") {
339 $self->{path} .= "/index.html"; 416 $self->{path} .= "/index.html";
340 $self->handle_file; 417 $self->handle_file;
341 } else { 418 } else {
342 $self->handle_dir; 419 $self->handle_dir;
343 }
344 } 420 }
345 } 421 }
346 } elsif (-f _ && -r _) { 422 } elsif (-f _ && -r _) {
347 -x _ and $self->err(403, "forbidden"); 423 -x _ and $self->err(403, "forbidden");
348 $self->handle_file; 424 $self->handle_file;
351 } 427 }
352} 428}
353 429
354sub handle_dir { 430sub handle_dir {
355 my $self = shift; 431 my $self = shift;
356 $self->_cgi($::INDEXPROG); 432 my $idx = $self->diridx;
433
434 $self->response(200, "ok",
435 {
436 "Content-Type" => "text/html",
437 "Content-Length" => length $idx,
438 },
439 $idx);
357} 440}
358 441
359sub handle_file { 442sub handle_file {
360 my $self = shift; 443 my $self = shift;
361 my $length = -s _; 444 my $length = -s _;
374 ($l, $h) = ($1, ($2 ne "" || $2 >= $length) ? $2 : $length - 1); 457 ($l, $h) = ($1, ($2 ne "" || $2 >= $length) ? $2 : $length - 1);
375 } else { 458 } else {
376 ($l, $h) = (0, $length - 1); 459 ($l, $h) = (0, $length - 1);
377 goto ignore; 460 goto ignore;
378 } 461 }
379 goto satisfiable if $l >= 0 && $l < $length && $h >= 0 && $h > $l; 462 goto satisfiable if $l >= 0 && $l < $length && $h >= 0 && $h >= $l;
380 } 463 }
381 $hdr->{"Content-Range"} = "bytes */$length"; 464 $hdr->{"Content-Range"} = "bytes */$length";
465 $hdr->{"Content-Length"} = $length;
466 $self->slog(9, "not satisfiable($self->{h}{range}|".$self->{h}{"user-agent"}.")");
382 $self->err(416, "not satisfiable", $hdr); 467 $self->err(416, "not satisfiable", $hdr, "");
383 468
384satisfiable: 469satisfiable:
385 # check for segmented downloads 470 # check for segmented downloads
386 if ($l && $NO_SEGMENTED) { 471 if ($l && $::NO_SEGMENTED) {
387 if (%{$uri{$self->{uri}}} > 1) { 472 my $delay = 60;
388 $self->slog("segmented download refused\n"); 473 while (%{$uri{$self->{remote_addr}}{$self->{uri}}} > 1) {
474 if ($delay <= 0) {
389 $self->err(400, "segmented downloads are not allowed"); 475 $self->err(400, "segmented downloads are not allowed",
476 { "Content-Type" => "text/html", Connection => "close" }, <<EOF);
477<html>
478<head>
479<title>Segmented downloads are not allowed</title>
480</head>
481<body bgcolor="#ffffff" text="#000000" link="#0000ff" vlink="#000080" alink="#ff0000">
482
483<p>Segmented downloads are not allowed on this server. Please refer to the
484<a href="http://www.goof.com/pcg/marc/animefaq.html#segmented_downloads">FAQ</a>.</p>
485
486</body></html>
487EOF
488 } else {
489 Coro::Event::do_timer(after => 3); $delay -= 3;
490 }
390 } 491 }
391 } 492 }
392 493
393 $hdr->{"Content-Range"} = "bytes $l-$h/$length"; 494 $hdr->{"Content-Range"} = "bytes $l-$h/$length";
394 @code = (206, "partial content"); 495 @code = (206, "partial content");
404 $hdr->{"Content-Length"} = $length; 505 $hdr->{"Content-Length"} = $length;
405 506
406 $self->response(@code, $hdr, ""); 507 $self->response(@code, $hdr, "");
407 508
408 if ($self->{method} eq "GET") { 509 if ($self->{method} eq "GET") {
409 my ($fh, $buf); 510 my ($fh, $buf, $r);
511 my $current = $Coro::current;
410 open $fh, "<", $self->{path} 512 open $fh, "<", $self->{path}
411 or die "$self->{path}: late open failure ($!)"; 513 or die "$self->{path}: late open failure ($!)";
412 514
413 if ($l) {
414 sysseek $fh, $l, 0
415 or die "$self->{path}: cannot seek to $l ($!)";
416 }
417
418 $h -= $l - 1; 515 $h -= $l - 1;
419 516
517 if (0) {
518 if ($l) {
519 sysseek $fh, $l, 0;
520 }
521 }
522
420 while ($h > 0) { 523 while ($h > 0) {
524 if (0) {
421 $h -= sysread $fh, $buf, $h > $::BUFSIZE ? $::BUFSIZE : $h; 525 sysread $fh, $buf, $h > $::BUFSIZE ? $::BUFSIZE : $h
526 or last;
527 } else {
528 undef $buf;
529 $aio_requests->down;
530 aio_read($fh, $l, ($h > $::BUFSIZE ? $::BUFSIZE : $h),
531 $buf, 0, sub {
532 $r = $_[0];
533 $current->ready;
534 });
535 &Coro::schedule;
536 $aio_requests->up;
537 last unless $r;
538 }
422 $self->{fh}->syswrite($buf) 539 my $w = $self->{fh}->syswrite($buf)
423 or last; 540 or last;
541 $::written += $w;
542 $self->{written} += $w;
543 $l += $r;
424 } 544 }
425 } 545 }
426 546
427 close $fh; 547 close $fh;
428} 548}

Diff Legend

- Removed lines
+ Added lines
< Changed lines
> Changed lines