ViewVC Help
View File | Revision Log | Show Annotations | Download File
/cvs/Coro/myhttpd/httpd.pl
Revision: 1.29
Committed: Sat Aug 25 15:14:03 2001 UTC (22 years, 10 months ago) by root
Content type: text/plain
Branch: MAIN
Changes since 1.28: +55 -41 lines
Log Message:
*** empty log message ***

File Contents

# Content
1 use Coro;
2 use Coro::Semaphore;
3 use Coro::Event;
4 use Coro::Socket;
5
6 no utf8;
7 use bytes;
8
9 # at least on my machine, this thingy serves files
10 # quite a bit faster than apache, ;)
11 # and quite a bit slower than thttpd :(
12
# A client that hangs up while we are still writing must not kill the
# whole server process.
$SIG{PIPE} = 'IGNORE';

# Append-mode handle for the access log.  Stays undefined when no
# $ACCESS_LOG is configured; code that logs checks it for truth first.
our $accesslog;

if ($ACCESS_LOG) {
    use IO::Handle;

    # Three-argument open: the configured name is always treated as a
    # plain file name, never as part of a mode or pipe specification.
    open $accesslog, ">>", $ACCESS_LOG
        or die "$ACCESS_LOG: $!";

    # every log line should hit the file immediately
    $accesslog->autoflush(1);
}
23
# Write one diagnostic line to STDOUT, prefixed with "---: ".
#
#   $level  - verbosity level of the message (accepted, currently unused)
#   $format - printf-style format when further arguments follow,
#             otherwise the literal message text
#   @_      - values for the conversions in $format
#
# Callers in this file pass an already interpolated message (which can
# contain client-supplied text such as header values) and no further
# arguments.  In that case the text is printed verbatim instead of being
# run through printf, where a stray "%" would be read as a conversion.
sub slog {
    my $level  = shift;
    my $format = shift;

    if (@_) {
        printf "---: $format\n", @_;
    } else {
        print "---: $format\n";
    }
}
29
# Counting semaphore, initialised to $MAX_CONNECTS: the accept loop takes
# one unit per connection and the handler gives it back when done.
my $connections = Coro::Semaphore->new($MAX_CONNECTS);

my @newcons;    # accepted connections waiting for a handler coroutine
my @pool;       # idle handler coroutines, parked until woken with ->ready
34
# one "execution thread"
#
# Serves queued connections from @newcons one after the other.  When the
# queue is empty the coroutine parks itself in @pool and yields; if the
# pool already holds $MAX_POOL idle coroutines it ends instead.
sub handler {
    for (;;) {
        my $job = pop @newcons;

        if (!$job) {
            # nothing to do: retire if enough idle handlers exist already,
            # otherwise wait in the pool until the accept loop wakes us
            last if @pool >= $MAX_POOL;
            push @pool, $Coro::current;
            schedule;
            next;
        }

        eval { conn->new(@$job)->handle };

        # exception objects (references) are part of normal error replies;
        # only plain string errors are worth logging
        slog(1, "$@") if $@ && !ref $@;

        # give the connection slot back to the accept loop
        $connections->up;
    }
}
52
# The listening socket all client connections arrive on.
my $http_port = Coro::Socket->new(
    LocalAddr => $SERVER_HOST,
    LocalPort => $SERVER_PORT,
    ReuseAddr => 1,
    Listen    => 50,
) or die "unable to start server";

push @listen_sockets, $http_port;
61
# the "main thread"
#
# Accepts connections forever.  Each accepted connection is queued in
# @newcons and then either an idle handler from @pool is woken or a new
# handler coroutine is started.
async {
    slog(1, "accepting connections");

    for (;;) {
        # blocks while the maximum number of connections is in use
        $connections->down;
        push @newcons, [$http_port->accept];
        #slog 3, "accepted @$connections ".scalar(@pool);

        # cached wall-clock time, used by the request handling code
        $::NOW = time;

        unless (@pool) {
            async \&handler;
            next;
        }

        (pop @pool)->ready;
    }
};
78
79 package conn;
80
81 use Socket;
82 use HTTP::Date;
83 use Convert::Scalar 'weaken';
84 use Linux::AIO;
85
# hand the configured parallelism to Linux::AIO
Linux::AIO::min_parallel($::AIO_PARALLEL);

# Bounds the number of aio_read requests in flight at any one time.
my $aio_requests = Coro::Semaphore->new($::AIO_PARALLEL * 4);

# Run Linux::AIO's poll callback whenever its poll descriptor is readable.
Event->io(
    fd    => Linux::AIO::poll_fileno(),
    poll  => 'r',
    async => 1,
    cb    => \&Linux::AIO::poll_cb,
);

our %conn;      # $conn{ip}{self} => connobj
our %uri;       # $uri{ip}{uri}{self}
our %blocked;   # $blocked{ip} => time until which that address is blocked
our %mimetype;  # lower-cased file extension => MIME type
98
# Load the extension => MIME type table from the file "mime_types" in the
# current directory into %mimetype.
#
# A useful line has the form "<extension><TAB(s)><type>".  Lines starting
# with "#" and lines of any other shape are skipped.  Extensions are
# stored lower-cased.  If the file cannot be opened a message is printed
# to STDOUT and %mimetype is left untouched.
sub read_mimetypes {
    my $fh;

    unless (open $fh, "<", "mime_types") {
        print "cannot open mime_types\n";
        return;
    }

    # a lexical line variable keeps the caller's $_ intact
    while (my $line = <$fh>) {
        # (\S+) rather than "[^#]\S+": one-letter extensions such as
        # "c", "h" or "Z" are perfectly valid entries
        if ($line =~ /^(?!#)(\S+)\t+(\S+)$/) {
            $mimetype{lc $1} = $2;
        }
    }

    close $fh;
}
111
112 read_mimetypes;
113
# Construct the connection object for a freshly accepted client.
#
#   $class    - class name
#   $peername - packed sockaddr_in of the peer
#   $fh       - the client socket
#
# Stores the peer's dotted-quad address and the current $::NOW in the
# object and registers it, through a weakened reference, in %conn under
# that address.  Returns the new object; dies if the peer name cannot be
# decoded.
sub new {
    my $class    = shift;
    my $peername = shift;
    my $fh       = shift;
    my $self     = bless { fh => $fh }, $class;

    # Count the object as soon as it exists: DESTROY decrements $::conns
    # unconditionally, so counting only at the very end would let the
    # counter drift downwards whenever the decoding below dies.
    $::conns++;

    my (undef, $iaddr) = unpack_sockaddr_in($peername)
        or $self->err(500, "unable to decode peername");

    $self->{remote_addr} = inet_ntoa($iaddr);
    $self->{time}        = $::NOW;

    # enter ourselves into various lists
    # ($self*1 is the numeric value of the reference, used as a unique key)
    weaken ($conn{$self->{remote_addr}}{$self*1} = $self);

    $self;
}
132
# Destructor: undo the bookkeeping done for this connection.
#
# Decrements the global connection counter, removes the per-URI entry via
# eoconn and removes the object from %conn.
sub DESTROY {
    my $self = shift;

    $::conns--;

    $self->eoconn;

    # an object whose construction failed early has no address and was
    # never entered into %conn
    my $ip = $self->{remote_addr};
    return unless defined $ip && exists $conn{$ip};

    delete $conn{$ip}{$self*1};

    # drop the per-address hash with its last connection, otherwise %conn
    # keeps one empty entry for every address ever seen
    delete $conn{$ip} unless %{$conn{$ip}};
}
141
# end of connection
#
# Removes this object's entry from %uri (keyed by remote address, request
# uri and object id).  Does nothing when no such entry exists, and removes
# hash levels that become empty so that %uri does not keep one entry per
# address and uri ever requested.
sub eoconn {
    my $self = shift;
    my ($ip, $req_uri) = @{$self}{qw(remote_addr uri)};

    # without an address and a uri nothing can have been registered;
    # checking first also keeps delete from autovivifying the outer levels
    return unless defined $ip && defined $req_uri;
    return unless exists $uri{$ip} && exists $uri{$ip}{$req_uri};

    delete $uri{$ip}{$req_uri}{$self*1};

    delete $uri{$ip}{$req_uri} unless %{$uri{$ip}{$req_uri}};
    delete $uri{$ip}           unless %{$uri{$ip}};

    return;
}
147
# Log a message on behalf of this connection.
#
#   $level   - log level, handed through to main::slog
#   $message - message text
#
# The line is tagged with the connection's remote id or, while that is
# not set, with its remote address.
sub slog {
    my ($self, $level, $message) = @_;
    my $who = $self->{remote_id} || $self->{remote_addr};

    main::slog($level, "$who> $message");
}
152
# Send a response head (and optionally a body) to the client and log it.
#
#   $code, $msg - status code and reason phrase for the status line
#   $hdr        - hash reference of response headers (name => value)
#   $content    - optional body; not sent for HEAD requests
#
# A "Connection" response header is remembered in $self->{h}{connection}
# unless the request already set one.  One log line is written to the
# access log (when open) and to STDERR.  Returns the connection's updated
# byte counter $self->{written}.
sub response {
    my ($self, $code, $msg, $hdr, $content) = @_;
    my $res = "HTTP/1.1 $code $msg\015\012";

    $self->{h}{connection} ||= $hdr->{Connection};

    $res .= "Date: " . time2str($::NOW) . "\015\012"; # slow? nah. :(

    while (my ($h, $v) = each %$hdr) {
        $res .= "$h: $v\015\012";
    }
    $res .= "\015\012";

    $res .= $content if defined $content and $self->{method} ne "HEAD";

    my $log = "$self->{remote_addr} \"$self->{uri}\" $code ".$hdr->{"Content-Length"}." \"$self->{h}{referer}\"\n";

    print $accesslog $log if $accesslog;
    print STDERR $log;

    # print only reports success or failure, so count the bytes ourselves;
    # the file-sending code adds byte counts to the same field
    $self->{written} += length $res
        if print {$self->{fh}} $res;

    $self->{written};
}
176
# Send an error response and abort the current request.
#
#   $code, $msg - status code and reason phrase
#   $hdr        - optional hash reference of extra response headers
#   $content    - optional body; when missing, "$code $msg" is sent as
#                 text/plain with a matching Content-Length
#
# Always adds "Connection: close" and never returns: after sending the
# response it dies with an empty object blessed into package "err".
sub err {
    my ($self, $code, $msg, $hdr, $content) = @_;

    if (!defined $content) {
        $content = "$code $msg";
        $hdr->{"Content-Type"}   = "text/plain";
        $hdr->{"Content-Length"} = length $content;
    }

    $hdr->{"Connection"} = "close";

    $self->response($code, $msg, $hdr, $content);

    die bless({}, 'err');
}
192
# Block the client's address and tell it so.
#
# (Re)starts the block for the remote address: it now lasts until
# $::NOW + $::BLOCKTIME.  After a random pause of up to 20 seconds a 401
# response explaining the block is sent through err, so this method does
# not return.
sub err_blocked {
    my $self = shift;
    my $ip   = $self->{remote_addr};

    my $until = $blocked{$ip} = $::NOW + $::BLOCKTIME;
    my $time  = time2str($until);

    # let the client wait a little before it gets its answer
    Coro::Event::do_timer(after => 20*rand);

    my %hdr = (
        "Content-Type"     => "text/html",
        "Retry-After"      => $::BLOCKTIME,
        "Warning"          => "Please do NOT retry, you have been blocked",
        "WWW-Authenticate" => "Basic realm=\"Please do NOT retry, you have been blocked\"",
        "Connection"       => "close",
    );

    $self->err(401, "too many connections", \%hdr, <<EOF);
<html>
<head>
<title>Too many connections</title>
</head>
<body bgcolor="#ffffff" text="#000000" link="#0000ff" vlink="#000080" alink="#ff0000">

<p>You have been blocked because you opened too many connections. You
may retry at</p>

<p><blockquote>$time.</blockquote></p>

<p>Until then, each new access will renew the block. You might want to have a
look at the <a href="http://www.goof.com/pcg/marc/animefaq.html#connectionlimit">FAQ</a>.</p>

</body></html>
EOF
}
226
# Serve all requests arriving on this connection.
#
# For every request: read the head, enforce the per-address block list and
# connection limit, parse the request line and the headers, work out the
# server name and port, register the request in %uri and finally map and
# answer it.  The loop ends when no further request arrives, when the
# connection is to be closed, or for protocol versions below 1.1.
#
# Errors reported through err inside map_uri/respond are exception
# objects and only end the current request; string exceptions are
# rethrown to the caller.
sub handle {
    my $self = shift;
    my $fh   = $self->{fh};

    my $host;

    # timeout for the first request on the connection
    $fh->timeout($::REQ_TIMEOUT);
    while () {
        $self->{reqs}++;

        # read request and parse first line
        my $req = $fh->readline("\015\012\015\012");

        unless (defined $req) {
            if (exists $self->{version}) {
                # an earlier request was parsed already: the client is
                # simply done with this connection
                last;
            } else {
                $self->err(408, "request timeout");
            }
        }

        $self->{h} = {};

        # timeout while processing and answering the request
        $fh->timeout($::RES_TIMEOUT);
        my $ip = $self->{remote_addr};

        if ($blocked{$ip}) {
            $self->err_blocked($blocked{$ip})
                if $blocked{$ip} > $::NOW;

            delete $blocked{$ip};
        }

        # keys() gives the real number of connections; a hash in numeric
        # context yields bucket usage on perls before 5.26
        if (keys(%{$conn{$ip}}) > $::MAX_CONN_IP) {
            $self->slog(2, "blocked ip $ip");
            $self->err_blocked;
        }

        $req =~ /^(?:\015\012)?
                  (GET|HEAD) \040+
                  ([^\040]+) \040+
                  HTTP\/([0-9]+\.[0-9]+)
                  \015\012/gx
            or $self->err(405, "method not allowed", { Allow => "GET,HEAD" });

        $self->{method}  = $1;
        $self->{uri}     = $2;
        $self->{version} = $3;

        # 505 is "HTTP Version Not Supported"
        $self->{version} =~ /^1\./
            or $self->err(505, "http protocol version $self->{version} not supported");

        # parse headers
        {
            my (%hdr, $h, $v);

            # Continues where the request-line match stopped (\G).
            # Repeated headers are joined with ","; folded lines stay part
            # of the value.  Optional whitespace is tab (\011) and space
            # (\040) -- the former "\008" meant NUL plus the digit "8" and
            # ate a leading "8" of header values.
            $hdr{lc $1} .= ",$2"
                while $req =~ /\G
                    ([^:\000-\040]+):
                    [\011\040]*
                    ((?: [^\015\012]+ | \015\012[\011\040] )*)
                    \015\012
                /gxc;

            # only the terminating empty line may be left over
            $req =~ /\G\015\012$/
                or $self->err(400, "bad request");

            # strip the leading "," added while collecting the values
            $self->{h}{$h} = substr $v, 1
                while ($h, $v) = each %hdr;
        }

        # find out server name and port
        if ($self->{uri} =~ s/^http:\/\/([^\/?#]*)//i) {
            $host = $1;
        } else {
            $host = $self->{h}{host};
        }

        if (defined $host) {
            $self->{server_port} = $host =~ s/:([0-9]+)$// ? $1 : 80;
        } else {
            # no host given at all: fall back to the local socket address
            ($self->{server_port}, $host)
                = unpack_sockaddr_in $self->{fh}->getsockname
                or $self->err(500, "unable to get socket name");
            $host = inet_ntoa $host;
        }

        $self->{server_name} = $host;

        # remote id should be unique per user
        $self->{remote_id} = $self->{remote_addr};

        if (exists $self->{h}{"client-ip"}) {
            $self->{remote_id} .= "[".$self->{h}{"client-ip"}."]";
        } elsif (exists $self->{h}{"x-forwarded-for"}) {
            $self->{remote_id} .= "[".$self->{h}{"x-forwarded-for"}."]";
        }

        weaken ($uri{$self->{remote_addr}}{$self->{uri}}{$self*1} = $self);

        eval {
            $self->map_uri;
            $self->respond;
        };

        $self->eoconn;

        die if $@ && !ref $@;

        last if $self->{h}{connection} =~ /close/ || $self->{version} < 1.1;

        # timeout while waiting for the next request on this connection
        $fh->timeout($::PER_TIMEOUT);
    }
}
341
# uri => path mapping
#
# Turns the request's server name and uri into a file system path below
# $::DOCROOT.  Stores the cleaned-up uri in $self->{name} and the path in
# $self->{path}, then runs access_check.  Requests whose host or uri could
# lead outside the intended directory are answered with 400 through err,
# which does not return.
sub map_uri {
    my $self = shift;
    my $host = $self->{server_name};
    my $uri  = $self->{uri};

    # The host is client-supplied (Host header or absolute uri) and
    # becomes a directory name below: refuse path separators, NUL bytes
    # and the special names "." and "..".
    $host =~ m%/|\000|\A\.\.?\z%
        and $self->err(400, "bad request");

    # some massaging, also makes it more secure
    $uri =~ s/%([0-9a-fA-F][0-9a-fA-F])/chr hex $1/ge;   # undo %XX escapes
    $uri =~ s%//+%/%g;                                   # collapse slashes
    $uri =~ s%/\.(?=/|$)%%g;                             # drop "/." segments
    1 while $uri =~ s%/[^/]+/\.\.(?=/|$)%%;              # resolve "/x/.."

    $uri =~ m%^/?\.\.(?=/|$)%
        and $self->err(400, "bad request");

    # A non-empty uri has to be absolute: the ".." handling above only
    # covers segments that follow a "/", so "x/../y" would otherwise climb
    # out of the host's directory.  NUL bytes have no place in a path.
    $uri =~ m%\000|^[^/]%
        and $self->err(400, "bad request");

    $self->{name} = $uri;

    # now do the path mapping
    $self->{path} = "$::DOCROOT/$host$uri";

    $self->access_check;
}
364
# Run $path as a CGI-style program that writes straight to the client.
#
#   $path - program to execute
#
# The child process gets the client socket as STDOUT, changes into
# $::DOCROOT, exports a few request details through %ENV and execs the
# program.  The parent never returns normally: it dies so that the caller
# stops handling this request itself.  A failed fork is answered with a
# 500 response through err.
sub _cgi {
    my $self = shift;
    my $path = shift;

    # no two-way xxx supported
    my $pid = fork;

    # fork returns undef on failure.  Comparing that to 0 numerically
    # would send the server itself down the child branch, where it would
    # replace its own STDOUT and exec over itself.
    defined $pid
        or $self->err(500, "unable to fork");

    if ($pid == 0) {
        # child: only exec once STDOUT really is the client socket
        if (open(STDOUT, ">&" . fileno($self->{fh})) && chdir $::DOCROOT) {
            $ENV{SERVER_SOFTWARE} = "thttpd-myhttpd"; # we are thttpd-alike
            $ENV{HTTP_HOST}       = $self->{server_name};
            $ENV{HTTP_PORT}       = $self->{server_port};
            $ENV{SCRIPT_NAME}     = $self->{name};
            exec $path;
        }

        # reached only if the setup or the exec failed
        Coro::State::_exit(0);
    }

    # parent
    die;
}
385
# Returns the server name as used in URLs: the bare name for port 80,
# "name:port" for any other port.
sub server_hostport {
    my $self = $_[0];

    return $self->{server_name} if $self->{server_port} == 80;
    return "$self->{server_name}:$self->{server_port}";
}
391
# Answer the request for $self->{path}.
#
# Readable directories are redirected to their "/"-terminated form,
# answered with 304 when not modified since If-Modified-Since, and
# otherwise served through index.html or a directory index.  Readable
# plain files are sent unless they are executable (403).  Everything else
# is a 404.  All error answers go through err, which does not return.
sub respond {
    my $self = shift;
    my $path = $self->{path};

    stat $path
        or $self->err(404, "not found");

    # the file tests below work on the result of this stat via "_"
    $self->{stat} = [stat _];

    # idiotic netscape sends idiotic headers AGAIN
    # (only the part before the first ";" is the date)
    my $ims = $self->{h}{"if-modified-since"} =~ /^([^;]+)/
            ? str2time($1) : 0;

    if (-d _ && -r _) {
        # directory

        # create a redirect to get the trailing "/"
        # we don't try to avoid the :80
        $path =~ /\/$/
            or $self->err(301, "moved permanently", { Location => "http://".$self->server_hostport."$self->{uri}/" });

        $ims < $self->{stat}[9]
            or $self->err(304, "not modified");

        # this test also makes "_" refer to index.html, which the file
        # sending code relies on
        return $self->handle_dir
            unless -r "$path/index.html";

        $self->{path} .= "/index.html";
        return $self->handle_file;
    }

    -f _ && -r _
        or $self->err(404, "not found");

    -x _ and $self->err(403, "forbidden");
    $self->handle_file;
}
429
# Send the directory index produced by diridx as a text/html 200 response.
sub handle_dir {
    my $self    = shift;
    my $listing = $self->diridx;

    my %hdr = (
        "Content-Type"   => "text/html",
        "Content-Length" => length $listing,
    );

    $self->response(200, "ok", \%hdr, $listing);
}
441
# Send the file $self->{path}, completely or as a single byte range.
#
# Expects the stat information of the file to be available through "_"
# (size and modification time are taken from there).
#
# Range handling: the first satisfiable range of a "bytes=" Range header
# is served as 206.  A range specification that cannot be parsed makes the
# whole header be ignored (plain 200).  If no range is satisfiable a 416
# is sent.  When $::NO_SEGMENTED is set, a range not starting at 0 waits
# up to 60 seconds for other requests of the same client for the same uri
# to finish and is refused with 400 if they do not.
#
# The body is only sent for GET requests; it is read with aio_read in
# chunks of at most $::BUFSIZE bytes.
sub handle_file {
    my $self   = shift;
    my $length = -s _;
    my $hdr    = {
        "Last-Modified" => time2str((stat _)[9]),
    };

    my @code = (200, "ok");

    # first and last byte to send; the whole file unless a range applies
    my ($l, $h) = (0, $length - 1);

    if ($self->{h}{range} =~ /^bytes=(.*)$/) {
        my $verdict = "unsatisfiable";

        RANGE: for my $spec (split /,/, $1) {
            my ($lo, $hi);

            if ($spec =~ /^-(\d+)$/) {
                # suffix form: the last N bytes, or the whole file when it
                # is shorter than N
                $lo = $1 < $length ? $length - $1 : 0;
                $hi = $length - 1;
            } elsif ($spec =~ /^(\d+)-(\d*)$/) {
                # an open or too large end means "up to the last byte"
                $lo = $1;
                $hi = ($2 ne "" && $2 < $length) ? $2 : $length - 1;
            } else {
                # not understood: behave as if no Range header was sent
                $verdict = "ignore";
                last RANGE;
            }

            if ($lo >= 0 && $lo < $length && $hi >= 0 && $hi >= $lo) {
                ($l, $h) = ($lo, $hi);
                $verdict = "partial";
                last RANGE;
            }
        }

        if ($verdict eq "unsatisfiable") {
            $hdr->{"Content-Range"}  = "bytes */$length";
            $hdr->{"Content-Length"} = 0;   # the body of this reply is empty
            $self->slog(9, "not satisfiable($self->{h}{range}|".$self->{h}{"user-agent"}.")");
            $self->err(416, "not satisfiable", $hdr, "");
        }

        if ($verdict eq "partial") {
            # check for segmented downloads
            if ($l && $::NO_SEGMENTED) {
                my $delay = 60;

                # keys() gives the real number of requests; a hash in
                # numeric context yields bucket usage on perls before 5.26
                while (keys(%{$uri{$self->{remote_addr}}{$self->{uri}}}) > 1) {
                    if ($delay <= 0) {
                        $self->err(400, "segmented downloads are not allowed",
                                   { "Content-Type" => "text/html", Connection => "close" }, <<EOF);
<html>
<head>
<title>Segmented downloads are not allowed</title>
</head>
<body bgcolor="#ffffff" text="#000000" link="#0000ff" vlink="#000080" alink="#ff0000">

<p>Segmented downloads are not allowed on this server. Please refer to the
<a href="http://www.goof.com/pcg/marc/animefaq.html#segmented_downloads">FAQ</a>.</p>

</body></html>
EOF
                    } else {
                        Coro::Event::do_timer(after => 3);
                        $delay -= 3;
                    }
                }
            }

            $hdr->{"Content-Range"} = "bytes $l-$h/$length";
            @code   = (206, "partial content");
            $length = $h - $l + 1;
        }
    }

    # take the extension from this match only, never from a stale $1
    my ($ext) = $self->{path} =~ /\.([^.]+)$/;
    $hdr->{"Content-Type"}   = $mimetype{lc $ext} || "application/octet-stream";
    $hdr->{"Content-Length"} = $length;

    $self->response(@code, $hdr, "");

    if ($self->{method} eq "GET") {
        my ($fh, $buf, $r);
        my $current = $Coro::current;
        open $fh, "<", $self->{path}
            or die "$self->{path}: late open failure ($!)";

        # number of bytes that still have to be sent
        my $left = $h - $l + 1;

        while ($left > 0) {
            undef $buf;

            # read the next chunk at offset $l; the callback records the
            # result and wakes this coroutine up again
            $aio_requests->down;
            aio_read($fh, $l, ($left > $::BUFSIZE ? $::BUFSIZE : $left),
                     $buf, 0, sub {
                         $r = $_[0];
                         $current->ready;
                     });
            Coro::schedule();
            $aio_requests->up;

            # stop on end of file as well as on a read error
            last unless $r > 0;

            my $w = $self->{fh}->syswrite($buf)
                or last;
            $::written       += $w;
            $self->{written} += $w;

            # advance by what was read; without reducing $left a range
            # request would keep sending until the end of the file
            $l    += $r;
            $left -= $r;
        }

        close $fh;
    }

    return;
}
549
550 1;