ViewVC Help
View File | Revision Log | Show Annotations | Download File
/cvs/Coro/myhttpd/httpd.pl
Revision: 1.28
Committed: Mon Aug 20 16:58:19 2001 UTC (22 years, 11 months ago) by root
Content type: text/plain
Branch: MAIN
Changes since 1.27: +18 -3 lines
Log Message:
*** empty log message ***

File Contents

# User Rev Content
1 root 1.1 use Coro;
2     use Coro::Semaphore;
3     use Coro::Event;
4     use Coro::Socket;
5    
6     no utf8;
7     use bytes;
8    
9     # at least on my machine, this thingy serves files
10     # quite a bit faster than apache, ;)
11     # and quite a bit slower than thttpd :(
12    
# A write to a socket the client already closed must not kill the server.
$SIG{PIPE} = 'IGNORE';

# Append-mode handle for the access log; remains undef when $ACCESS_LOG
# is not set, in which case nothing is written to it.
our $accesslog;

if ($ACCESS_LOG) {
    use IO::Handle;
    # three-argument open: the configured path is taken literally and is
    # never parsed for mode characters or pipe syntax
    open $accesslog, ">>", $ACCESS_LOG
        or die "$ACCESS_LOG: $!";
    $accesslog->autoflush(1);
}
23    
# Print one diagnostic line, prefixed with "---: ", to the currently
# selected output handle.
#   $level  - verbosity level given by the caller (not used for filtering)
#   $format - the message, or a printf format when more arguments follow
#   @_      - optional values substituted into $format
sub slog {
    my $level  = shift;
    my $format = shift;

    if (@_) {
        printf "---: $format\n", @_;
    }
    else {
        # Without substitution values the text is printed verbatim, so a
        # "%" inside logged data (peer supplied headers, error messages)
        # is never interpreted as a format directive.
        print "---: $format\n";
    }
}
29    
# Counts free connection slots: taken ("down") before each accept and
# released ("up") once a connection has been handled.
my $connections = Coro::Semaphore->new($MAX_CONNECTS);

# @newcons: accepted connections waiting for a handler
# @pool:    handler coroutines parked until there is work for them
my (@newcons, @pool);
34    
# one "execution thread": serves queued connections for as long as there
# are any, then parks itself in @pool - or ends when the pool already
# holds $MAX_POOL idle handlers
sub handler {
    for (;;) {
        my $job = pop @newcons;

        unless ($job) {
            last if @pool >= $MAX_POOL;
            push @pool, $Coro::current;
            schedule;
            next;
        }

        eval { conn->new(@$job)->handle };

        # conn::err throws an object after it has sent its reply; only
        # plain (string) errors are worth a log line
        slog(1, "$@") unless !$@ || ref $@;

        $connections->up;
    }
}
52    
# the listening socket all connections are accepted from
my $http_port = Coro::Socket->new(
    LocalAddr => $SERVER_HOST,
    LocalPort => $SERVER_PORT,
    ReuseAddr => 1,
    Listen    => 50,
) or die "unable to start server";

push @listen_sockets, $http_port;

# the "main thread": waits for a free connection slot, accepts a client,
# queues it and makes sure a handler coroutine picks it up
async {
    slog(1, "accepting connections");
    for (;;) {
        $connections->down;
        push @newcons, [$http_port->accept];
        #slog 3, "accepted @$connections ".scalar(@pool);
        $::NOW = time;

        if (@pool) {
            # wake up a parked handler
            my $idle = pop @pool;
            $idle->ready;
        }
        else {
            # nobody is idle: start a fresh handler
            async \&handler;
        }
    }
};
78    
79     package conn;
80    
81     use Socket;
82     use HTTP::Date;
83 root 1.2 use Convert::Scalar 'weaken';
84 root 1.16 use Linux::AIO;
85    
# hand the configured parallelism ($::AIO_PARALLEL) to Linux::AIO
Linux::AIO::min_parallel($::AIO_PARALLEL);

# call Linux::AIO's poll callback whenever its poll descriptor is readable
Event->io(
    fd    => Linux::AIO::poll_fileno(),
    poll  => 'r',
    async => 1,
    cb    => \&Linux::AIO::poll_cb,
);

our %conn;      # $conn{ip}{self} => connobj
our %uri;       # $uri{ip}{uri}{self}
our %blocked;   # $blocked{ip} => time until which this ip stays blocked
our %mimetype;  # lower-cased file extension => content type
96    
# Load the extension => content-type table from the file "mime_types" in
# the current directory into %mimetype.
#
# A useful line has the form "<extension><TAB(s)><type>". Lines starting
# with "#" and lines of any other shape are skipped. Extensions are stored
# lower-cased. When the file cannot be opened a notice is printed and
# %mimetype is left untouched.
sub read_mimetypes {
    if (open my $fh, "<", "mime_types") {
        while (my $line = <$fh>) {
            # [^#\s]\S* (instead of [^#]\S+) also accepts one-character
            # extensions such as "c" or "h"
            if ($line =~ /^([^#\s]\S*)\t+(\S+)$/) {
                $mimetype{lc $1} = $2;
            }
        }
        close $fh;
    } else {
        print "cannot open mime_types\n";
    }
}
109 root 1.1
110 root 1.10 read_mimetypes;
111    
# Construct the connection object for a freshly accepted client.
#   $class    - class to bless into
#   $peername - packed sockaddr_in of the peer
#   $fh       - the client socket
# Records the peer address and the accept time ($::NOW), registers the
# object (as a weak reference) in %conn under the peer's IP address and
# counts it in $::conns. Dies when the peer name cannot be decoded.
sub new {
    my $class    = shift;
    my $peername = shift;
    my $fh       = shift;
    my $self     = bless { fh => $fh }, $class;

    # Count the object as soon as it exists: DESTROY decrements $::conns
    # unconditionally, so dying further down must not unbalance the counter.
    $::conns++;

    my (undef, $iaddr) = unpack_sockaddr_in($peername)
        or $self->err(500, "unable to decode peername");

    $self->{remote_addr} = inet_ntoa($iaddr);
    $self->{time} = $::NOW;

    # enter ourselves into various lists
    weaken ($conn{$self->{remote_addr}}{$self*1} = $self);

    $self;
}
130    
# Destructor: uncount the connection, finish its current request
# bookkeeping and remove it from %conn.
sub DESTROY {
    my $self = shift;

    $::conns--;

    $self->eoconn;

    # remote_addr is not set when construction failed early; there is
    # nothing registered to remove then
    my $ip = $self->{remote_addr};
    return unless defined $ip && exists $conn{$ip};

    delete $conn{$ip}{$self*1};

    # drop the per-address bucket together with its last connection,
    # otherwise %conn keeps an empty hash for every address ever seen
    delete $conn{$ip} unless %{ $conn{$ip} };
}
139    
# end of connection (also called after every request): remove this
# object from the per-address, per-uri list in %uri
sub eoconn {
    my $self = shift;
    my ($ip, $uri) = @$self{qw(remote_addr uri)};

    # nothing was registered before a request line has been parsed
    return unless defined $ip && defined $uri;

    my $by_uri = $uri{$ip}      or return;
    my $set    = $by_uri->{$uri} or return;

    delete $set->{$self*1};

    # prune levels that became empty, otherwise %uri grows by one entry
    # for every address/uri combination ever requested
    delete $by_uri->{$uri} unless %$set;
    delete $uri{$ip}       unless %$by_uri;
}
145    
# Log a message through main::slog, prefixed with the peer's address.
#   $level - passed through unchanged
#   $text  - the message
sub slog {
    my ($self, $level, $text) = @_;
    main::slog($level, "$self->{remote_addr}> $text");
}
150    
# Send a complete response head (and optionally a body) to the client and
# write one access-log line.
#   $code, $msg - status code and reason phrase
#   $hdr        - hash ref of additional response headers
#   $content    - optional body; not sent for HEAD requests
# The number of bytes handed to the socket is added to $self->{written}.
sub response {
    my ($self, $code, $msg, $hdr, $content) = @_;
    my $res = "HTTP/1.1 $code $msg\015\012";

    # A Connection header chosen by the server wins over what the client
    # asked for: after announcing "close" the request loop has to stop
    # even if the client requested keep-alive.
    $self->{h}{connection} = $hdr->{Connection}
        if defined $hdr->{Connection};

    $res .= "Date: ".time2str($::NOW)."\015\012"; # slow? nah. :(

    for my $name (sort keys %$hdr) {
        $res .= "$name: $hdr->{$name}\015\012";
    }
    $res .= "\015\012";

    $res .= $content if defined $content and $self->{method} ne "HEAD";

    my $log = "$self->{remote_addr} \"$self->{uri}\" $code ".$hdr->{"Content-Length"}." \"$self->{h}{referer}\"\n";

    print $accesslog $log if $accesslog;
    print STDERR $log;

    # print returns a success flag, not a byte count, so account for the
    # length of what was sent
    $self->{written} += length $res
        if print {$self->{fh}} $res;
}
174    
# Send an error response and abort the current request.
#   $code, $msg - status code and reason phrase
#   $hdr        - optional hash ref of extra headers
#   $content    - optional body; defaults to the plain text "$code $msg"
# "Connection: close" is always added. Never returns: after the response
# has been sent an object blessed into "err" is thrown.
sub err {
    my ($self, $code, $msg, $hdr, $content) = @_;

    if (!defined $content) {
        # no body supplied: use a minimal plain-text one
        $content = "$code $msg";
        $hdr->{"Content-Type"} = "text/plain";
        $hdr->{"Content-Length"} = length $content;
    }
    $hdr->{"Connection"} = "close";

    $self->response($code, $msg, $hdr, $content);

    die bless({}, 'err');
}
190    
# Tell a client that it is blocked. Every call (re)starts the block
# period for the peer's address at $::NOW + $::BLOCKTIME. Never returns
# (ends in err()).
sub err_blocked {
    my $self = shift;
    my $ip = $self->{remote_addr};

    $blocked{$ip} = $::NOW + $::BLOCKTIME;
    my $time = time2str($blocked{$ip});

    # random delay of up to 20 seconds before the reply is sent
    # (presumably suspends only this coroutine - confirm in Coro::Event)
    Coro::Event::do_timer(after => 20*rand);

    my %hdr = (
        "Content-Type"     => "text/html",
        "Retry-After"      => $::BLOCKTIME,
        "Warning"          => "Please do NOT retry, you have been blocked",
        "WWW-Authenticate" => "Basic realm=\"Please do NOT retry, you have been blocked\"",
        "Connection"       => "close",
    );

    my $body = <<EOF;
<html>
<head>
<title>Too many connections</title>
</head>
<body bgcolor="#ffffff" text="#000000" link="#0000ff" vlink="#000080" alink="#ff0000">

<p>You have been blocked because you opened too many connections. You
may retry at</p>

<p><blockquote>$time.</blockquote></p>

<p>Until then, each new access will renew the block. You might want to have a
look at the <a href="http://www.goof.com/pcg/marc/animefaq.html#connectionlimit">FAQ</a>.</p>

</body></html>
EOF

    $self->err(401, "too many connections", \%hdr, $body);
}
224    
# Serve requests on this connection until it is closed, times out or an
# error ends it.
#
# For every request: read the header block, enforce the per-address
# block list and connection limit, parse request line and headers into
# $self->{method}, {uri}, {version} and {h} (header names lower-cased),
# then map the uri to a path and respond. Errors reported through err()
# inside map_uri/respond end only that request; any other exception is
# rethrown.
sub handle {
    my $self = shift;
    my $fh = $self->{fh};

    $fh->timeout($::REQ_TIMEOUT);
    while () {
        $self->{reqs}++;

        # read request and parse first line
        my $req = $fh->readline("\015\012\015\012");

        unless (defined $req) {
            if (exists $self->{version}) {
                # an earlier request was already parsed on this
                # connection: just stop
                last;
            } else {
                $self->err(408, "request timeout");
            }
        }

        $self->{h} = {};

        $fh->timeout($::RES_TIMEOUT);
        my $ip = $self->{remote_addr};

        if ($blocked{$ip}) {
            $self->err_blocked($blocked{$ip})
                if $blocked{$ip} > $::NOW;

            delete $blocked{$ip};
        }

        # count the keys explicitly: a hash in numeric context does not
        # yield the number of entries on every perl version
        if (scalar(keys %{ $conn{$ip} }) > $::MAX_CONN_IP) {
            $self->slog(2, "blocked ip $ip");
            $self->err_blocked;
        }

        # /g leaves pos() behind the request line for the \G matches below
        $req =~ /^(?:\015\012)?
                 (GET|HEAD) \040+
                 ([^\040]+) \040+
                 HTTP\/([0-9]+\.[0-9]+)
                 \015\012/gx
            or $self->err(405, "method not allowed", { Allow => "GET,HEAD" });

        $self->{method} = $1;
        $self->{uri} = $2;
        $self->{version} = $3;

        $self->{version} =~ /^1\./
            or $self->err(506, "http protocol version $self->{version} not supported");

        # parse headers
        {
            my %hdr;

            # Linear whitespace is tab (\011) or space (\040). The former
            # class [\008\040] meant NUL, the digit "8" and space, which
            # ate a leading "8" of header values.
            # Repeated headers are joined with ",".
            $hdr{lc $1} .= ",$2"
                while $req =~ /\G
                      ([^:\000-\040]+):
                      [\011\040]*
                      ((?: [^\015\012]+ | \015\012[\011\040] )*)
                      \015\012
                   /gxc;

            $req =~ /\G\015\012$/
                or $self->err(400, "bad request");

            # strip the leading "," added by the join above
            $self->{h}{$_} = substr $hdr{$_}, 1
                for keys %hdr;
        }

        $self->{server_port} = $self->{h}{host} =~ s/:([0-9]+)$// ? $1 : 80;

        weaken ($uri{$self->{remote_addr}}{$self->{uri}}{$self*1} = $self);

        eval {
            $self->map_uri;
            $self->respond;
        };
        # keep the error before any other code gets a chance to reset $@
        my $error = $@;

        $self->eoconn;

        # objects are thrown by err() after its reply was sent; anything
        # else is a real failure and is passed on
        die $error if $error && !ref $error;

        last if $self->{h}{connection} =~ /close/ || $self->{version} lt "1.1";

        $self->slog(9, "persistent connection [".$self->{h}{"user-agent"}."][$self->{reqs}]");
        $fh->timeout($::PER_TIMEOUT);
    }
}
313    
# uri => path mapping
#
# Decodes and normalises $self->{uri}, stores the result in
# $self->{name} and the file system path "$::DOCROOT/<host><uri>" in
# $self->{path}, then runs access_check. The host is taken from the
# Host header ("default" when there is none). Answers 400 "bad request"
# (through err(), which does not return) when host or uri would lead
# outside the document root.
sub map_uri {
    my $self = shift;
    my $host = $self->{h}{host} || "default";
    my $uri = $self->{uri};

    # The host comes straight from the client and becomes a directory
    # name: it must be a single path component and must not be "." or "..".
    $host =~ m%[/\000]% || $host =~ /^\.\.?$/
        and $self->err(400, "bad request");

    # some massaging, also makes it more secure
    $uri =~ s/%([0-9a-fA-F][0-9a-fA-F])/chr hex $1/ge;

    # an (encoded) NUL byte has no place in a file name
    $uri =~ /\000/
        and $self->err(400, "bad request");

    $uri =~ s%//+%/%g;                       # collapse runs of slashes
    $uri =~ s%/\.(?=/|$)%%g;                 # drop "/." components
    1 while $uri =~ s%/[^/]+/\.\.(?=/|$)%%;  # resolve "dir/.."

    # whatever ".." is left now would climb above the root
    $uri =~ m%^/?\.\.(?=/|$)%
        and $self->err(400, "bad request");

    $self->{name} = $uri;

    # now do the path mapping
    $self->{path} = "$::DOCROOT/$host$uri";

    $self->access_check;
}
336    
# Return (address, port) of the local end of the client socket, the
# address in dotted-quad notation. Answers 500 through err() when the
# socket name cannot be decoded.
sub server_address {
    my ($self) = @_;

    my ($port, $iaddr) = unpack_sockaddr_in($self->{fh}->getsockname)
        or $self->err(500, "unable to get socket name");

    return (inet_ntoa($iaddr), $port);
}
343    
# Name of the server as the client sees it: the Host header when one was
# sent, otherwise the local address of the socket.
sub server_host {
    my ($self) = @_;

    return exists $self->{h}{host}
        ? $self->{h}{host}
        : ($self->server_address)[0];
}
352    
# "host" or "host:port" for building absolute URLs; the port is left out
# when it is 80. Uses the Host header and the port parsed from it when
# present, otherwise the local socket address.
sub server_hostport {
    my ($self) = @_;

    my ($host, $port) = exists $self->{h}{host}
        ? ($self->{h}{host}, $self->{server_port})
        : $self->server_address;

    return $port == 80 ? $host : "$host:$port";
}
364    
# Run $path as a CGI-style program in a child process whose standard
# output is the client socket.
#   $path - the program to execute
# The child changes into $::DOCROOT and gets SERVER_SOFTWARE, HTTP_HOST,
# HTTP_PORT and SCRIPT_NAME in its environment. The parent returns
# immediately and does not wait for the child. Answers 500 through err()
# when no child can be created.
sub _cgi {
    my $self = shift;
    my $path = shift;

    # no two-way xxx supported
    my $pid = fork;

    # fork returns undef on failure; comparing that with 0 would send
    # the server itself down the child branch
    defined $pid
        or $self->err(500, "unable to fork");

    if ($pid == 0) {
        open STDOUT, ">&".fileno($self->{fh});
        if (chdir $::DOCROOT) {
            $ENV{SERVER_SOFTWARE} = "thttpd-myhttpd"; # we are thttpd-alike
            $ENV{HTTP_HOST} = $self->server_host;
            # the port lives in {server_port}; {server_host} is never set
            $ENV{HTTP_PORT} = $self->{server_port};
            $ENV{SCRIPT_NAME} = $self->{name};
            # NOTE(review): single-argument exec may go through the shell;
            # confirm callers never pass a client-controlled $path
            exec $path;
        }
        # chdir or exec failed: leave the child without running any of
        # the parent's cleanup code
        Coro::State::_exit(0);
    }
}
384    
# Answer the request for $self->{path}: redirect directories that lack
# the trailing slash, serve a directory through its index.html or a
# generated index, serve readable non-executable plain files, and answer
# 404/403/304 (through err(), which does not return) otherwise.
sub respond {
    my $self = shift;
    my $path = $self->{path};

    # every "_" file test below refers to the most recent stat
    stat($path)
        or $self->err(404, "not found");

    $self->{stat} = [stat _];

    # idiotic netscape sends idiotic headers AGAIN
    my $ims = $self->{h}{"if-modified-since"} =~ /^([^;]+)/
        ? str2time($1) : 0;

    unless (-d _ && -r _) {
        # not a readable directory: only readable plain files that are
        # not executable get served
        $self->err(404, "not found") unless -f _ && -r _;
        $self->err(403, "forbidden") if -x _;
        return $self->handle_file;
    }

    # directory
    if ($path !~ /\/$/) {
        # create a redirect to get the trailing "/"
        my $host = $self->server_hostport;
        $self->err(301, "moved permanently", { Location => "http://$host$self->{uri}/" });
    }

    $self->err(304, "not modified")
        unless $ims < $self->{stat}[9];

    # this -r stats index.html, so handle_file's "_" tests see that file
    if (-r "$path/index.html") {
        $self->{path} .= "/index.html";
        return $self->handle_file;
    }

    $self->handle_dir;
}
422    
# Send the index page produced by diridx as a "200 ok" text/html response.
sub handle_dir {
    my ($self) = @_;
    my $idx = $self->diridx;

    my %hdr = (
        "Content-Type"   => "text/html",
        "Content-Length" => length($idx),
    );

    $self->response(200, "ok", \%hdr, $idx);
}
434    
# Resolve the value of a "Range: bytes=<spec>" header against a file of
# $length bytes.
# Returns
#   ("ok", $first, $last)  for the first range of the list that can be served,
#   ("ignore")             when a range is not well-formed (the header is
#                          then to be treated as absent),
#   ("unsatisfiable")      when no range of the list can be served.
sub _resolve_range {
    my ($spec, $length) = @_;

    for my $range (split /,/, $spec) {
        my ($first, $last);

        if ($range =~ /^-(\d+)$/) {
            # suffix range: the final $1 bytes, at most the whole file
            $first = $1 < $length ? $length - $1 : 0;
            $last  = $length - 1;
        } elsif ($range =~ /^(\d+)-(\d*)$/) {
            $first = $1 + 0;
            # an open end or an end beyond the file means "up to the last byte"
            $last  = ($2 ne "" && $2 < $length) ? $2 + 0 : $length - 1;
        } else {
            return ("ignore");
        }

        return ("ok", $first, $last)
            if $first < $length && $last >= $first;
    }

    return ("unsatisfiable");
}

# Send the file $self->{path}, honouring a single byte range.
#
# Relies on the caller having stat'ed the file last ("_" is used for
# size and modification time). Sends the response head first and, for
# GET requests, streams the requested bytes in chunks of at most
# $::BUFSIZE. Answers 416 or 400 through err() (which does not return)
# for unsatisfiable ranges and for disallowed segmented downloads.
sub handle_file {
    my $self = shift;
    my $length = -s _;
    my $hdr = {
        "Last-Modified" => time2str((stat _)[9]),
    };

    my @code = (200, "ok");
    my ($l, $h) = (0, $length - 1);   # first and last byte to send

    if (my ($spec) = $self->{h}{range} =~ /^bytes=(.*)$/) {
        my ($status, $first, $last) = _resolve_range($spec, $length);

        if ($status eq "unsatisfiable") {
            $hdr->{"Content-Range"} = "bytes */$length";
            # NOTE(review): announces $length bytes although the body is
            # empty - kept as it was, confirm whether this is intended
            $hdr->{"Content-Length"} = $length;
            $self->slog(9, "not satisfiable($self->{h}{range}|".$self->{h}{"user-agent"}.")");
            $self->err(416, "not satisfiable", $hdr, "");
        }

        if ($status eq "ok") {
            ($l, $h) = ($first, $last);

            # check for segmented downloads
            if ($l && $::NO_SEGMENTED
                && scalar(keys %{ $uri{$self->{remote_addr}}{$self->{uri}} }) > 1) {
                $self->err(400, "segmented downloads are not allowed",
                           { "Content-Type" => "text/html", Connection => "close" }, <<EOF);
<html>
<head>
<title>Segmented downloads are not allowed</title>
</head>
<body bgcolor="#ffffff" text="#000000" link="#0000ff" vlink="#000080" alink="#ff0000">

<p>Segmented downloads are not allowed on this server. Please refer to the
<a href="http://www.goof.com/pcg/marc/animefaq.html#segmented_downloads">FAQ</a>.</p>

</body></html>
EOF
            }

            $hdr->{"Content-Range"} = "bytes $l-$h/$length";
            @code = (206, "partial content");
            $length = $h - $l + 1;
        }
        # status "ignore": serve the complete file as if no Range was sent
    }

    # capture the extension in list context: after a failed match $1
    # would still hold a capture from an earlier match
    my ($ext) = $self->{path} =~ /\.([^.]+)$/;
    $hdr->{"Content-Type"} = (defined $ext && $mimetype{lc $ext}) || "application/octet-stream";
    $hdr->{"Content-Length"} = $length;

    $self->response(@code, $hdr, "");

    if ($self->{method} eq "GET") {
        my ($fh, $buf, $r);
        my $current = $Coro::current;
        open $fh, "<", $self->{path}
            or die "$self->{path}: late open failure ($!)";

        my $remaining = $h - $l + 1;

        while ($remaining > 0) {
            # asynchronous read at offset $l; the callback stores the
            # result and wakes this coroutine up again
            aio_read($fh, $l, ($remaining > $::BUFSIZE ? $::BUFSIZE : $remaining),
                     $buf, 0, sub {
                         $r = $_[0];
                         $current->ready;
                     });
            &Coro::schedule;

            # stop at end of file and on read errors (negative result)
            last unless $r > 0;

            my $w = $self->{fh}->syswrite($buf)
                or last;
            $::written += $w;
            $self->{written} += $w;

            $l += $r;
            # without this a range request would be streamed up to the
            # end of the file
            $remaining -= $r;
        }

        close $fh;
    }
}
535    
536 root 1.2 1;