ViewVC Help
View File | Revision Log | Show Annotations | Download File
/cvs/Coro/myhttpd/httpd.pl
Revision: 1.29
Committed: Sat Aug 25 15:14:03 2001 UTC (22 years, 10 months ago) by root
Content type: text/plain
Branch: MAIN
Changes since 1.28: +55 -41 lines
Log Message:
*** empty log message ***

File Contents

# User Rev Content
1 root 1.1 use Coro;
2     use Coro::Semaphore;
3     use Coro::Event;
4     use Coro::Socket;
5    
6     no utf8;
7     use bytes;
8    
# at least on my machine, this thingy serves files
# quite a bit faster than apache, ;)
# and quite a bit slower than thttpd :(

# With SIGPIPE ignored, a write to a socket the peer has closed fails with
# an error instead of terminating the process.
$SIG{PIPE} = 'IGNORE';

# Append-mode handle for the access log; stays undefined when no
# $ACCESS_LOG is configured (response() checks it before printing).
our $accesslog;

if ($ACCESS_LOG) {
    use IO::Handle;
    # three-argument open: the configured path is taken literally and can
    # never be parsed as part of the open mode
    open $accesslog, ">>", $ACCESS_LOG
        or die "$ACCESS_LOG: $!";
    # write every log line through immediately
    $accesslog->autoflush(1);
}
23    
# Write one log line to STDOUT, prefixed with "---: ".
#
#   $level  - severity; accepted for interface compatibility, currently unused
#   $format - the message, or a printf format when further arguments follow
#   @_      - optional printf arguments
#
# Callers in this file pass fully formatted messages that may contain
# client-supplied text (request headers, error strings).  Such a message must
# not be interpreted as a printf format, otherwise any "%" in it is mangled.
# The format is therefore only expanded when arguments were actually given.
sub slog {
    my $level = shift;
    my $format = shift;

    if (@_) {
        printf "---: $format\n", @_;
    } else {
        print "---: $format\n";
    }
}
29    
# semaphore counting the connection slots still available; the accept loop
# takes one per accepted connection and handler() gives it back
my $connections = Coro::Semaphore->new($MAX_CONNECTS);

my @newcons;    # accepted connections ([peername, socket]) awaiting a handler
my @pool;       # handler coroutines that are parked and can be woken up
34    
# one "execution thread"
#
# Serves queued connections from @newcons one after another.  When the queue
# is empty the coroutine parks itself in @pool and yields; it ends instead
# once the pool already holds $MAX_POOL idle handlers.
sub handler {
    while () {
        if (my $job = pop @newcons) {
            # $job is [peername, socket] as pushed by the accept loop
            eval { conn->new(@$job)->handle };
            # blessed exceptions (see conn::err) are regular control flow,
            # only plain string errors are worth logging
            slog(1, "$@") if $@ && !ref $@;
            # give the connection slot back to the accept loop
            $connections->up;
            next;
        }

        last if @pool >= $MAX_POOL;

        push @pool, $Coro::current;
        schedule;
    }
}
52    
# the listening socket all connections are accepted from
my $http_port = Coro::Socket->new(
    LocalAddr => $SERVER_HOST,
    LocalPort => $SERVER_PORT,
    ReuseAddr => 1,
    Listen    => 50,
) or die "unable to start server";

push @listen_sockets, $http_port;
61    
# the "main thread"
#
# Accepts connections forever.  Each accepted connection is queued in
# @newcons and handed to an idle handler from @pool, or to a freshly started
# one when the pool is empty.
async {
    slog(1, "accepting connections");

    while () {
        # take a connection slot first; handler() releases it when done
        $connections->down;
        push @newcons, [$http_port->accept];
        #slog 3, "accepted @$connections ".scalar(@pool);
        $::NOW = time;

        if (my $idle = pop @pool) {
            $idle->ready;
        } else {
            async \&handler;
        }
    }
};
78    
79     package conn;
80    
81     use Socket;
82     use HTTP::Date;
83 root 1.2 use Convert::Scalar 'weaken';
84 root 1.16 use Linux::AIO;
85    
Linux::AIO::min_parallel($::AIO_PARALLEL);

# bounds the number of aio requests in flight (see handle_file)
my $aio_requests = Coro::Semaphore->new($::AIO_PARALLEL * 4);

# run the Linux::AIO completion callbacks whenever its poll fd is readable
Event->io(
    fd    => Linux::AIO::poll_fileno(),
    poll  => 'r',
    async => 1,
    cb    => \&Linux::AIO::poll_cb,
);

our %conn;      # $conn{ip}{self} => connobj
our %uri;       # $uri{ip}{uri}{self}
our %blocked;   # $blocked{ip} => time until which that address stays blocked
our %mimetype;  # lowercased file extension => content type
98    
# Load the extension => content-type table from the file "mime_types" in the
# current directory into %mimetype.
#
# Each useful line has the form "<extension><TAB(s)><type>".  Lines whose
# first character is "#" and lines that do not match are skipped.  Extensions
# are stored lowercased.  If the file cannot be opened a message is printed
# and %mimetype is left as it was.
#
# Uses a lexical handle and a named line variable, so neither a global
# filehandle nor the caller's $_ is touched.  One-character extensions
# (e.g. "c", "h") are accepted; the previous pattern required at least two
# characters and silently dropped them.
sub read_mimetypes {
    if (open my $fh, "<", "mime_types") {
        while (my $line = <$fh>) {
            if ($line =~ /^([^#\s]\S*)\t+(\S+)$/) {
                $mimetype{lc $1} = $2;
            }
        }
        close $fh;
    } else {
        print "cannot open mime_types\n";
    }
}

read_mimetypes();
113    
# Constructor: conn->new($peername, $fh)
#
#   $peername - packed socket address of the peer
#   $fh       - the connection's socket handle
#
# Decodes the peer address, remembers it together with the accept time
# ($::NOW), registers the object (weakly) in %conn under its address and
# bumps the global connection counter.  Returns the new object.
sub new {
    my ($class, $peername, $fh) = @_;
    my $self = bless { fh => $fh }, $class;

    my (undef, $iaddr) = unpack_sockaddr_in($peername)
        or $self->err(500, "unable to decode peername");

    my $addr = inet_ntoa($iaddr);
    @$self{qw(remote_addr time)} = ($addr, $::NOW);

    # enter ourselves into various lists; the numified reference serves as
    # a per-object key, and the entry is weak so it does not keep us alive
    weaken ($conn{$addr}{$self*1} = $self);

    $::conns++;

    return $self;
}
132    
# Destructor: undo the bookkeeping done by new() and handle().
#
# Decrements the global connection counter, drops the per-uri registration
# (eoconn) and removes this object from %conn.  When it was the last
# connection of its address the now empty per-address hash is removed as
# well; otherwise %conn would keep one empty hash for every client address
# ever seen and grow for the lifetime of the server.
sub DESTROY {
    my $self = shift;

    $::conns--;

    $self->eoconn;

    my $ip = $self->{remote_addr};
    if (my $peers = $conn{$ip}) {
        delete $peers->{$self*1};
        delete $conn{$ip} unless %$peers;
    }
}
141    
# end of connection
#
# Removes this object from %uri ($uri{ip}{uri}{self}), where handle()
# registers it for the duration of a request.  Called after every request
# and again from DESTROY.
#
# Empty intermediate hashes are pruned and nothing is created when the
# object was never registered.  A plain multi-level "delete" autovivifies
# $uri{ip}{uri} and leaves it behind, so %uri would accumulate one empty
# hash per address/uri pair for the lifetime of the server.
sub eoconn {
    my $self = shift;

    my $ip  = $self->{remote_addr};
    my $key = defined $self->{uri} ? $self->{uri} : "";

    my $by_ip = $uri{$ip}
        or return;

    if (my $by_uri = $by_ip->{$key}) {
        delete $by_uri->{$self*1};
        delete $by_ip->{$key} unless %$by_uri;
    }

    delete $uri{$ip} unless %$by_ip;

    return;
}
147    
# Log a message for this connection: $self->slog($level, $message)
#
# Prefixes the message with the connection's remote id (or its plain remote
# address while no remote id has been set) and passes it on to main::slog.
sub slog {
    my ($self, $level, $message) = @_;
    my $who = $self->{remote_id} || $self->{remote_addr};

    main::slog($level, "$who> $message");
}
152    
# Send a response head (and optional body) to the client and log the request.
#
#   $code, $msg - status code and reason phrase
#   $hdr        - hash ref of additional response headers
#   $content    - optional body; not sent for HEAD requests
#
# A "Connection" response header is remembered in $self->{h}{connection}
# (unless the request already carried one), which is what handle() consults
# to decide whether to keep the connection open.
#
# $self->{written} is advanced by the number of bytes handed to the socket,
# matching the byte accounting in handle_file.  Previously it was advanced by
# print's return value, i.e. by 1 per response.
sub response {
    my ($self, $code, $msg, $hdr, $content) = @_;
    my $res = "HTTP/1.1 $code $msg\015\012";

    $self->{h}{connection} ||= $hdr->{Connection};

    $res .= "Date: ".time2str($::NOW)."\015\012"; # slow? nah. :(

    while (my ($h, $v) = each %$hdr) {
        $res .= "$h: $v\015\012"
    }
    $res .= "\015\012";

    $res .= $content if defined $content and $self->{method} ne "HEAD";

    my $log = "$self->{remote_addr} \"$self->{uri}\" $code ".$hdr->{"Content-Length"}." \"$self->{h}{referer}\"\n";

    print $accesslog $log if $accesslog;
    print STDERR $log;

    print {$self->{fh}} $res
        and $self->{written} += length $res;
}
176    
# Send an error response and abort the current request.
#
#   $self->err($code, $msg [, $hdr [, $content]])
#
# Without $content a plain-text body "$code $msg" is generated, together
# with matching Content-Type and Content-Length headers.  The response always
# carries "Connection: close".  Never returns: it dies with an object blessed
# into "err", which callers tell apart from real errors via ref($@).
sub err {
    my ($self, $code, $msg, $hdr, $content) = @_;

    if (!defined $content) {
        $content = "$code $msg";
        $hdr->{"Content-Type"} = "text/plain";
        $hdr->{"Content-Length"} = length $content;
    }

    $hdr->{"Connection"} = "close";

    $self->response($code, $msg, $hdr, $content);

    die bless({}, 'err');
}
192    
# Block the client's address and tell it so.
#
# (Re)starts the block for $::BLOCKTIME seconds from $::NOW, pauses for a
# random time of up to 20 seconds and then sends a 401 response naming the
# time the block ends.  Does not return (see err).
sub err_blocked {
    my ($self) = @_;

    my $until = $::NOW + $::BLOCKTIME;
    $blocked{$self->{remote_addr}} = $until;
    my $time = time2str($until);

    Coro::Event::do_timer(after => 20 * rand);

    my $hdr = {
        "Content-Type" => "text/html",
        "Retry-After" => $::BLOCKTIME,
        "Warning" => "Please do NOT retry, you have been blocked",
        "WWW-Authenticate" => "Basic realm=\"Please do NOT retry, you have been blocked\"",
        "Connection" => "close",
    };

    my $body = <<EOF;
<html>
<head>
<title>Too many connections</title>
</head>
<body bgcolor="#ffffff" text="#000000" link="#0000ff" vlink="#000080" alink="#ff0000">

<p>You have been blocked because you opened too many connections. You
may retry at</p>

<p><blockquote>$time.</blockquote></p>

<p>Until then, each new access will renew the block. You might want to have a
look at the <a href="http://www.goof.com/pcg/marc/animefaq.html#connectionlimit">FAQ</a>.</p>

</body></html>
EOF

    $self->err(401, "too many connections", $hdr, $body);
}
226    
# Serve all requests arriving on this connection.
#
# For each request: read the header block, enforce the per-address block and
# connection limit, parse the request line and headers into $self->{method},
# {uri}, {version} and {h}, work out server name/port and the remote id,
# register the request in %uri and hand over to map_uri/respond.  The loop
# ends when the client or a response asked for "Connection: close", on
# HTTP versions below 1.1, or when no further request arrives.
#
# Plain string errors raised while responding are re-thrown to the caller;
# the blessed exceptions thrown by err() just end the request.
#
# Fixes relative to the previous version:
#  - header whitespace is matched as [\011\040] (tab/space).  The former
#    [\008\040] is NUL, the digit "8" and space, so values such as
#    "Host: 80.1.2.3" lost their leading "8".
#  - the connection limit counts keys explicitly; a hash in numeric context
#    yields the used-bucket count on older perls.
#  - unsupported protocol versions are answered with 505, not 506.
#  - the "close" connection token is matched case-insensitively.
sub handle {
    my $self = shift;
    my $fh = $self->{fh};

    my $host;

    $fh->timeout($::REQ_TIMEOUT);
    while () {
        $self->{reqs}++;

        # read request and parse first line
        my $req = $fh->readline("\015\012\015\012");

        unless (defined $req) {
            # nothing arrived: end quietly if a request was already served
            # on this connection, complain otherwise
            last if exists $self->{version};
            $self->err(408, "request timeout");
        }

        $self->{h} = {};

        $fh->timeout($::RES_TIMEOUT);
        my $ip = $self->{remote_addr};

        if ($blocked{$ip}) {
            $self->err_blocked($blocked{$ip})
                if $blocked{$ip} > $::NOW;

            delete $blocked{$ip};
        }

        if (scalar(keys %{$conn{$ip}}) > $::MAX_CONN_IP) {
            $self->slog(2, "blocked ip $ip");
            $self->err_blocked;
        }

        # /g leaves pos() behind the request line for the \G header match below
        $req =~ /^(?:\015\012)?
                  (GET|HEAD) \040+
                  ([^\040]+) \040+
                  HTTP\/([0-9]+\.[0-9]+)
                  \015\012/gx
            or $self->err(405, "method not allowed", { Allow => "GET,HEAD" });

        $self->{method} = $1;
        $self->{uri} = $2;
        $self->{version} = $3;

        $self->{version} =~ /^1\./
            or $self->err(505, "http protocol version $self->{version} not supported");

        # parse headers
        {
            my (%hdr, $h, $v);

            # repeated headers are joined with ","; continuation lines
            # (CRLF followed by tab or space) stay part of the value
            $hdr{lc $1} .= ",$2"
                while $req =~ /\G
                      ([^:\000-\040]+):
                      [\011\040]*
                      ((?: [^\015\012]+ | \015\012[\011\040] )*)
                      \015\012
                   /gxc;

            $req =~ /\G\015\012$/
                or $self->err(400, "bad request");

            # strip the leading "," added above
            $self->{h}{$h} = substr $v, 1
                while ($h, $v) = each %hdr;
        }

        # find out server name and port
        if ($self->{uri} =~ s/^http:\/\/([^\/?#]*)//i) {
            $host = $1;
        } else {
            $host = $self->{h}{host};
        }

        if (defined $host) {
            $self->{server_port} = $host =~ s/:([0-9]+)$// ? $1 : 80;
        } else {
            ($self->{server_port}, $host)
                = unpack_sockaddr_in $self->{fh}->getsockname
                or $self->err(500, "unable to get socket name");
            $host = inet_ntoa $host;
        }

        $self->{server_name} = $host;

        # remote id should be unique per user
        $self->{remote_id} = $self->{remote_addr};

        if (exists $self->{h}{"client-ip"}) {
            $self->{remote_id} .= "[".$self->{h}{"client-ip"}."]";
        } elsif (exists $self->{h}{"x-forwarded-for"}) {
            $self->{remote_id} .= "[".$self->{h}{"x-forwarded-for"}."]";
        }

        weaken ($uri{$self->{remote_addr}}{$self->{uri}}{$self*1} = $self);

        eval {
            $self->map_uri;
            $self->respond;
        };

        $self->eoconn;

        die if $@ && !ref $@;

        last if $self->{h}{connection} =~ /close/i || $self->{version} < 1.1;

        $fh->timeout($::PER_TIMEOUT);
    }
}
341    
# uri => path mapping
#
# Decodes and normalises $self->{uri}, stores the result in $self->{name}
# and the file system path "$::DOCROOT/<server_name><uri>" in $self->{path},
# then runs access_check.  Answers 400 (via err, which does not return) for
# requests that try to leave the document root.
#
# The server name comes from the client (Host header or absolute uri) and
# becomes a path component, so it is validated as well.  A name of "." or
# "..", or one containing "/" or NUL, is rejected; previously
# "Host: .." mapped outside of the per-host directory.  A uri containing a
# decoded NUL byte is rejected too.
sub map_uri {
    my $self = shift;
    my $host = $self->{server_name};
    my $uri = $self->{uri};

    ($host =~ /^\.\.?\z/ || $host =~ m%[/\000]%)
        and $self->err(400, "bad request");

    # some massaging, also makes it more secure
    $uri =~ s/%([0-9a-fA-F][0-9a-fA-F])/chr hex $1/ge;

    $uri =~ /\000/
        and $self->err(400, "bad request");

    $uri =~ s%//+%/%g;                       # collapse runs of slashes
    $uri =~ s%/\.(?=/|$)%%g;                 # drop "/." segments
    1 while $uri =~ s%/[^/]+/\.\.(?=/|$)%%;  # resolve "segment/.."

    # whatever ".." is left at the front would escape the root
    $uri =~ m%^/?\.\.(?=/|$)%
        and $self->err(400, "bad request");

    $self->{name} = $uri;

    # now do the path mapping
    $self->{path} = "$::DOCROOT/$host$uri";

    $self->access_check;
}
364    
# Run $path as a CGI program with its STDOUT connected to the client socket.
#
#   $self->_cgi($path)
#
# The child changes to $::DOCROOT, sets a few CGI-style environment
# variables and execs the program; it exits if any of that fails.  The
# parent always dies after forking, as in the original code.
#
# fork's result is checked for undef.  The former "0 == fork" test is also
# true when fork fails, in which case the server process itself would have
# run the child branch (redirecting its STDOUT and finally exiting).
#
# NOTE(review): "exec $path" with a single argument may go through the shell
# if $path contains shell metacharacters - confirm that callers only pass
# trusted paths.
sub _cgi {
    my $self = shift;
    my $path = shift;

    # no two-way xxx supported
    my $pid = fork;
    defined $pid
        or die "unable to fork: $!";

    if ($pid == 0) {
        # child: never run the program without the client socket as STDOUT
        open STDOUT, ">&".fileno($self->{fh})
            or Coro::State::_exit(0);
        if (chdir $::DOCROOT) {
            $ENV{SERVER_SOFTWARE} = "thttpd-myhttpd"; # we are thttpd-alike
            $ENV{HTTP_HOST} = $self->{server_name};
            $ENV{HTTP_PORT} = $self->{server_port};
            $ENV{SCRIPT_NAME} = $self->{name};
            exec $path;
        }
        Coro::State::_exit(0);
    } else {
        die;
    }
}
385    
# Returns the server name as used in urls: the bare name when the server
# port is 80, "name:port" otherwise.
sub server_hostport {
    my $conn = $_[0];

    return $conn->{server_name}
        if $conn->{server_port} == 80;

    return "$conn->{server_name}:$conn->{server_port}";
}
391    
# Answer the request for $self->{path}.
#
# Readable regular files are served by handle_file (executable ones are
# refused with 403).  Readable directories get a redirect when the path
# lacks the trailing "/", a 304 when not modified since the client's copy,
# and otherwise their index.html or a generated listing.  Everything else
# is a 404.
#
# The file tests below all work on the stat buffer "_" filled by the initial
# stat, so their order relative to other stat calls matters.
sub respond {
    my $self = shift;
    my $path = $self->{path};

    stat $path
        or $self->err(404, "not found");

    $self->{stat} = [stat _];

    # idiotic netscape sends idiotic headers AGAIN
    # (only the part in front of the first ";" is a date)
    my $ims = 0;
    $ims = str2time($1)
        if $self->{h}{"if-modified-since"} =~ /^([^;]+)/;

    unless (-d _ && -r _) {
        # not a readable directory
        $self->err(404, "not found")
            unless -f _ && -r _;
        $self->err(403, "forbidden")
            if -x _;
        return $self->handle_file;
    }

    # directory
    unless ($path =~ /\/$/) {
        # create a redirect to get the trailing "/"
        # we don't try to avoid the :80
        $self->err(301, "moved permanently", { Location => "http://".$self->server_hostport."$self->{uri}/" });
    }

    $self->err(304, "not modified")
        unless $ims < $self->{stat}[9];

    # this -r refills "_" with index.html's data, which handle_file relies on
    if (-r "$path/index.html") {
        $self->{path} .= "/index.html";
        $self->handle_file;
    } else {
        $self->handle_dir;
    }
}
429    
# Send the directory index produced by diridx as a text/html response.
sub handle_dir {
    my ($self) = @_;
    my $listing = $self->diridx;

    my $hdr = {
        "Content-Type" => "text/html",
        "Content-Length" => length $listing,
    };

    $self->response(200, "ok", $hdr, $listing);
}
441    
# Pick the first satisfiable byte range out of a Range header value.
#
#   _select_byte_range($spec, $length)
#
#   $spec   - the part after "bytes=", e.g. "0-99,200-"
#   $length - size of the file in bytes
#
# Returns one of
#   ("ok", $first, $last)  - first satisfiable range, inclusive offsets
#   ("ignore")             - a range was malformed, serve the whole file
#   ("unsatisfiable")      - well-formed, but no range lies within the file
#
# A range end at or beyond the end of the file is clamped to the last byte,
# and a suffix range longer than the file selects the whole file.
sub _select_byte_range {
    my ($spec, $length) = @_;

    for my $range (split /,/, $spec) {
        my ($first, $last);

        if ($range =~ /^-(\d+)$/) {
            # suffix range: the last $1 bytes
            ($first, $last) = ($length - $1, $length - 1);
            $first = 0 if $first < 0;
        } elsif ($range =~ /^(\d+)-(\d*)$/) {
            ($first, $last) = ($1, ($2 ne "" && $2 < $length) ? $2 : $length - 1);
        } else {
            return ("ignore");
        }

        return ("ok", $first, $last)
            if $first >= 0 && $first < $length && $last >= 0 && $last >= $first;
    }

    return ("unsatisfiable");
}

# Serve the file $self->{path}, honouring a "Range: bytes=..." header.
#
# Expects the stat buffer "_" to describe the file (set up by respond).
# Sends the response head and, for GET, streams the selected bytes with
# aio_read, keeping at most as many reads in flight as $aio_requests allows.
# An unsatisfiable range is answered with 416, and a segmented download
# (with $::NO_SEGMENTED set) with 400 after waiting up to a minute for the
# other requests for the same uri to finish.
#
# Fixes relative to the previous version:
#  - the number of bytes still to send is decremented after every chunk;
#    before, a range request kept streaming until end of file.
#  - range ends beyond the file are clamped (the old condition was inverted).
#  - the 416 response has an empty body and now says so in Content-Length.
#  - the extension lookup no longer uses a stale $1 when the path has no
#    extension.
#  - concurrent requests are counted with keys; a hash in numeric context
#    yields the used-bucket count on older perls.
#  - the file handle is closed inside the scope that opened it.
sub handle_file {
    my $self = shift;
    my $length = -s _;
    my $hdr = {
        "Last-Modified" => time2str ((stat _)[9]),
    };

    my @code = (200, "ok");
    my ($l, $h) = (0, $length - 1);

    if ($self->{h}{range} =~ /^bytes=(.*)$/) {
        my ($verdict, $first, $last) = _select_byte_range($1, $length);

        if ($verdict eq "unsatisfiable") {
            $hdr->{"Content-Range"} = "bytes */$length";
            $hdr->{"Content-Length"} = 0;
            $self->slog(9, "not satisfiable($self->{h}{range}|".$self->{h}{"user-agent"}.")");
            $self->err(416, "not satisfiable", $hdr, "");
        }

        if ($verdict eq "ok") {
            ($l, $h) = ($first, $last);

            # check for segmented downloads
            if ($l && $::NO_SEGMENTED) {
                my $delay = 60;
                while (scalar(keys %{$uri{$self->{remote_addr}}{$self->{uri}}}) > 1) {
                    if ($delay <= 0) {
                        $self->err(400, "segmented downloads are not allowed",
                                   { "Content-Type" => "text/html", Connection => "close" }, <<EOF);
<html>
<head>
<title>Segmented downloads are not allowed</title>
</head>
<body bgcolor="#ffffff" text="#000000" link="#0000ff" vlink="#000080" alink="#ff0000">

<p>Segmented downloads are not allowed on this server. Please refer to the
<a href="http://www.goof.com/pcg/marc/animefaq.html#segmented_downloads">FAQ</a>.</p>

</body></html>
EOF
                    } else {
                        Coro::Event::do_timer(after => 3); $delay -= 3;
                    }
                }
            }

            $hdr->{"Content-Range"} = "bytes $l-$h/$length";
            @code = (206, "partial content");
            $length = $h - $l + 1;
        }
        # "ignore": fall through and serve the whole file
    }

    my ($ext) = $self->{path} =~ /\.([^.\/]+)$/;
    $hdr->{"Content-Type"} = (defined $ext && $mimetype{lc $ext}) || "application/octet-stream";
    $hdr->{"Content-Length"} = $length;

    $self->response(@code, $hdr, "");

    if ($self->{method} eq "GET") {
        my ($fh, $buf, $r);
        my $current = $Coro::current;
        open $fh, "<", $self->{path}
            or die "$self->{path}: late open failure ($!)";

        # bytes still to be sent, starting at offset $l
        my $remaining = $h - $l + 1;

        while ($remaining > 0) {
            undef $buf;
            $aio_requests->down;
            aio_read($fh, $l, ($remaining > $::BUFSIZE ? $::BUFSIZE : $remaining),
                     $buf, 0, sub {
                         $r = $_[0];
                         $current->ready;
                     });
            # sleep until the completion callback above wakes us up
            Coro::schedule();
            $aio_requests->up;

            # stop on end of file and on read errors
            last unless $r > 0;

            my $w = $self->{fh}->syswrite($buf)
                or last;
            $::written += $w;
            $self->{written} += $w;
            $l += $r;
            $remaining -= $r;
        }

        close $fh;
    }
}
549    
550 root 1.2 1;