ViewVC Help
View File | Revision Log | Show Annotations | Download File
/cvs/cvsroot/Coro/myhttpd/httpd.pl
Revision: 1.27
Committed: Sun Aug 19 23:57:52 2001 UTC (22 years, 10 months ago) by root
Content type: text/plain
Branch: MAIN
Changes since 1.26: +23 -5 lines
Log Message:
*** empty log message ***

File Contents

# Content
1 use Coro;
2 use Coro::Semaphore;
3 use Coro::Event;
4 use Coro::Socket;
5
6 no utf8;
7 use bytes;
8
9 # at least on my machine, this thingy serves files
10 # quite a bit faster than apache, ;)
11 # and quite a bit slower than thttpd :(
12
# Ignore SIGPIPE so that a write to a closed client socket shows up as a
# failed write instead of terminating the process.
$SIG{PIPE} = 'IGNORE';

# Append-mode handle for the access log; stays undefined when $ACCESS_LOG is
# not set, which is what the "if $accesslog" test in conn::response checks.
our $accesslog;

if ($ACCESS_LOG) {
    use IO::Handle;
    # Three-argument open: the file name is never parsed as part of the mode.
    open $accesslog, ">>", $ACCESS_LOG
        or die "$ACCESS_LOG: $!";
    $accesslog->autoflush(1);
}
23
# Write one log line, prefixed with "---: ", to STDOUT.
#
#   slog $level, $format, @args
#
# $level is accepted for interface compatibility but is currently unused.
# With @args the message is formatted printf-style.  Without @args the
# message is printed verbatim, so that a literal "%" in it (for example in
# an error text or in data received from a client) is not interpreted as a
# format directive.
sub slog {
    my $level  = shift;
    my $format = shift;

    if (@_) {
        printf "---: $format\n", @_;
    } else {
        print "---: $format\n";
    }
}
29
# Counting semaphore limiting the number of connections being served at once:
# the accept loop takes one unit per accepted connection, a handler gives it
# back when the connection is finished.
my $connections = Coro::Semaphore->new($MAX_CONNECTS);

# Accepted connections waiting for a handler; each entry is the array
# reference built from the return list of accept.
my @newcons;
# Idle handler coroutines that can be woken up to serve a new connection.
my @pool;
34
# One "execution thread": serves queued connections and, when the queue is
# empty, parks itself in @pool until the accept loop wakes it up again.  The
# coroutine ends once the pool already holds $MAX_POOL idle handlers.
sub handler {
    while (1) {
        my $job = pop @newcons;

        unless ($job) {
            # nothing to do: either retire or wait to be readied
            last if @pool >= $MAX_POOL;
            push @pool, $Coro::current;
            schedule();
            next;
        }

        eval { conn->new(@$job)->handle };
        # object exceptions were already reported to the client; only plain
        # string errors are logged
        slog(1, "$@") if $@ && !ref $@;
        # give the connection slot back to the accept loop
        $connections->up;
    }
}
52
# The listening socket; creation failure is fatal.
my $http_port = Coro::Socket->new(
    LocalAddr => $SERVER_HOST,
    LocalPort => $SERVER_PORT,
    ReuseAddr => 1,
    Listen    => 50,
) or die "unable to start server";

push @listen_sockets, $http_port;
61
# the "main thread": accepts connections and hands each one to a handler
async {
    slog(1, "accepting connections");

    for (;;) {
        # take a connection slot; blocks while $MAX_CONNECTS are in use
        $connections->down;
        push @newcons, [$http_port->accept];
        #slog 3, "accepted @$connections ".scalar(@pool);
        $::NOW = time;

        # no idle handler available: start a fresh one
        unless (@pool) {
            async \&handler;
            next;
        }

        # otherwise wake up a parked handler
        (pop @pool)->ready;
    }
};
78
79 package conn;
80
81 use Socket;
82 use HTTP::Date;
83 use Convert::Scalar 'weaken';
84 use Linux::AIO;
85
Linux::AIO::min_parallel($::AIO_PARALLEL);

# run the AIO completion callbacks whenever the AIO poll descriptor
# becomes readable
Event->io(
    fd    => Linux::AIO::poll_fileno(),
    poll  => 'r',
    async => 1,
    cb    => \&Linux::AIO::poll_cb,
);

our %conn;     # $conn{ip}{self} => connobj
our %uri;      # $uri{ip}{uri}{self}
our %blocked;  # $blocked{ip} => time until which the ip stays blocked
our %mimetype; # $mimetype{extension} => content type
96
# Fill %mimetype from the file "mime_types" in the current directory.
#
# Each useful line has the form "<extension><TAB(s)><content type>"; the
# extension is stored in lower case.  Lines starting with "#" and lines that
# do not have this shape are skipped.  A missing or unreadable file is only
# reported on STDOUT; it is not fatal.
sub read_mimetypes {
    if (open my $types, "<", "mime_types") {
        while (my $line = <$types>) {
            # [^#\s]\S* also accepts one-character extensions such as "c"
            # or "h", which the former [^#]\S+ silently dropped
            if ($line =~ /^([^#\s]\S*)\t+(\S+)$/) {
                $mimetype{lc $1} = $2;
            }
        }
        close $types;
    } else {
        print "cannot open mime_types\n";
    }
}

read_mimetypes();
111
# Create the connection object for a freshly accepted socket.
#
#   conn->new($peername, $fh)
#
# $peername is the packed socket address of the client, $fh the connected
# socket.  Records the client's address and the accept time ($::NOW) and
# registers the object (as a weak reference) in %conn under its address.
# Dies if the peer name cannot be decoded.
sub new {
    my $class    = shift;
    my $peername = shift;
    my $fh       = shift;
    my $self     = bless { fh => $fh }, $class;

    # Count the object as soon as it is blessed: DESTROY decrements
    # unconditionally, so incrementing only after the code below (which can
    # die) would let the counter drift downwards on every failure.
    $::conns++;

    my (undef, $iaddr) = unpack_sockaddr_in($peername)
        or $self->err(500, "unable to decode peername");

    $self->{remote_addr} = inet_ntoa($iaddr);
    $self->{time}        = $::NOW;

    # enter ourselves into various lists
    weaken($conn{$self->{remote_addr}}{$self*1} = $self);

    $self;
}
130
# Destructor: takes the object out of the global bookkeeping.
#
# Decrements $::conns, removes the per-request registration (eoconn) and
# deletes the object from %conn.  The per-address hash is dropped once it is
# empty so that %conn does not keep one entry for every address ever seen.
sub DESTROY {
    my $self = shift;

    $::conns--;

    $self->eoconn;

    # remote_addr is unset when construction failed early; do not
    # autovivify an entry for it
    my $ip = $self->{remote_addr};
    if (defined $ip && exists $conn{$ip}) {
        delete $conn{$ip}{$self*1};
        delete $conn{$ip} unless %{ $conn{$ip} };
    }
}
139
# end of connection (more precisely: end of the current request)
#
# Removes this object from %uri, where handle registers it for the URI being
# served.  Levels of %uri that become empty are deleted as well, and nothing
# is autovivified when the object was never registered; otherwise %uri would
# keep an empty hash for every address/URI pair ever requested.
sub eoconn {
    my $self = shift;
    my ($ip, $path) = @{$self}{qw(remote_addr uri)};

    return unless defined $ip && defined $path;

    my $by_uri = $uri{$ip}         or return;
    my $users  = $by_uri->{$path}  or return;

    delete $users->{$self*1};
    delete $by_uri->{$path} unless %$users;
    delete $uri{$ip}        unless %$by_uri;

    return;
}
145
# Log a message for this connection, prefixed with the client's address.
#
#   $self->slog($level, $message)
#
# The address and the message are passed to main::slog as printf arguments
# rather than being interpolated into the format string: messages contain
# client-supplied text (for example the User-Agent header), and a "%" in it
# must not be treated as a format directive.
sub slog {
    my $self = shift;
    main::slog($_[0], "%s> %s", $self->{remote_addr}, $_[1]);
}
150
# Send a response head (and optional body) to the client and log the request.
#
#   $self->response($code, $msg, \%headers, $content)
#
# Builds the status line, a Date header from $::NOW, the given headers and
# the blank line that ends the head.  $content is appended unless it is
# undefined or the request method is HEAD.  One access-log line is written
# to $accesslog (when open) and to STDERR.  Returns the connection's running
# byte count, $self->{written}.
sub response {
    my ($self, $code, $msg, $hdr, $content) = @_;
    my $res = "HTTP/1.1 $code $msg\015\012";

    #$res .= "Connection: close\015\012";
    $res .= "Date: " . time2str($::NOW) . "\015\012"; # slow? nah. :(

    while (my ($h, $v) = each %$hdr) {
        $res .= "$h: $v\015\012";
    }
    $res .= "\015\012";

    $res .= $content if defined $content and $self->{method} ne "HEAD";

    my $log = "$self->{remote_addr} \"$self->{uri}\" $code ".$hdr->{"Content-Length"}." \"$self->{h}{referer}\"\n";

    print {$accesslog} $log if $accesslog;
    print STDERR $log;

    # print only reports success or failure, so account for the length of
    # what was sent; handle_file adds real byte counts to the same field
    $self->{written} += length $res
        if print {$self->{fh}} $res;

    return $self->{written};
}
173
# Send an error (or other terminal) response and abort request processing.
#
#   $self->err($code, $msg, \%headers, $content)
#
# Without $content a plain-text body "$code $msg" is generated and the
# matching Content-Type and Content-Length headers are set.  A
# "Connection: close" header is always added.  Never returns: after the
# response has been sent it dies with an object blessed into "err".
sub err {
    my ($self, $code, $msg, $hdr, $content) = @_;

    if (!defined $content) {
        $content = "$code $msg";
        $hdr->{"Content-Type"}   = "text/plain";
        $hdr->{"Content-Length"} = length $content;
    }

    $hdr->{"Connection"} = "close";

    $self->response($code, $msg, $hdr, $content);

    die bless({}, 'err');
}
189
# Tell a client that it has been blocked and abort the request.
#
# (Re)starts the block for the client's address: it now lasts until
# $::NOW + $::BLOCKTIME.  The reply is delayed by a random time of up to 20
# seconds and then sent through err, so this method does not return.
sub err_blocked {
    my ($self) = @_;
    my $addr = $self->{remote_addr};

    # every blocked access renews the block
    my $until = $blocked{$addr} = $::NOW + $::BLOCKTIME;
    my $time  = time2str($until);

    # slow the client down before answering
    Coro::Event::do_timer(after => 20*rand);

    my %headers = (
        "Content-Type"     => "text/html",
        "Retry-After"      => $::BLOCKTIME,
        "Warning"          => "Please do NOT retry, you have been blocked",
        "WWW-Authenticate" => "Basic realm=\"Please do NOT retry, you have been blocked\"",
    );

    my $page = <<EOF;
<html>
<head>
<title>Too many connections</title>
</head>
<body bgcolor="#ffffff" text="#000000" link="#0000ff" vlink="#000080" alink="#ff0000">

<p>You have been blocked because you opened too many connections. You
may retry at</p>

<p><blockquote>$time.</blockquote></p>

<p>Until then, each new access will renew the block. You might want to have a
look at the <a href="http://www.goof.com/pcg/marc/animefaq.html">FAQ</a>.</p>

</body></html>
EOF

    $self->err(401, "too many connections", \%headers, $page);
}
222
# Serve requests on this connection until it is closed.
#
# For every request: read the request head (terminated by an empty line),
# enforce the per-address block list and connection limit, parse the request
# line and the headers into $self->{method}, {uri}, {version} and {h}
# (header names in lower case, repeated headers joined with ","), then map
# the URI to a path and send the response.
#
# The loop ends when reading fails on a connection that already served a
# request, when the client asked for "Connection: close", or when it speaks
# a protocol version below 1.1.  Responses sent through err outside of the
# map_uri/respond step, and any plain string error, leave this method by
# exception.
sub handle {
    my $self = shift;
    my $fh   = $self->{fh};

    $fh->timeout($::REQ_TIMEOUT);
    while () {
        $self->{reqs}++;

        # read request and parse first line
        my $req = $fh->readline("\015\012\015\012");

        unless (defined $req) {
            if (exists $self->{version}) {
                # a request was already served on this connection: just
                # stop without sending anything
                last;
            } else {
                $self->err(408, "request timeout");
            }
        }

        $self->{h} = {};

        $fh->timeout($::RES_TIMEOUT);
        my $ip = $self->{remote_addr};

        if ($blocked{$ip}) {
            $self->err_blocked($blocked{$ip})
                if $blocked{$ip} > $::NOW;

            delete $blocked{$ip};
        }

        # Count the keys explicitly: a hash in numeric context yields the
        # number of used buckets, not the number of entries, on older perls.
        if (scalar(keys %{ $conn{$ip} }) > $::MAX_CONN_IP) {
            $self->slog(2, "blocked ip $ip");
            $self->err_blocked;
        }

        $req =~ /^(?:\015\012)?
                 (GET|HEAD) \040+
                 ([^\040]+) \040+
                 HTTP\/([0-9]+\.[0-9]+)
                 \015\012/gx
            or $self->err(405, "method not allowed", { Allow => "GET,HEAD" });

        $self->{method}  = $1;
        $self->{uri}     = $2;
        $self->{version} = $3;

        # 505 is "HTTP Version Not Supported" (506 means something else)
        $self->{version} =~ /^1\./
            or $self->err(505, "http protocol version $self->{version} not supported");

        # parse headers
        {
            my %hdr;

            # [\011\040] is tab and space.  The former [\008\040] was NUL,
            # the digit "8" and space (8 is not an octal digit), which
            # stripped leading "8"s from header values.
            $hdr{lc $1} .= ",$2"
                while $req =~ /\G
                               ([^:\000-\040]+):
                               [\011\040]*
                               ((?: [^\015\012]+ | \015\012[\011\040] )*)
                               \015\012
                              /gxc;

            $req =~ /\G\015\012$/
                or $self->err(400, "bad request");

            # drop the leading "," added while collecting the values
            while (my ($h, $v) = each %hdr) {
                $self->{h}{$h} = substr $v, 1;
            }
        }

        $self->{server_port} = $self->{h}{host} =~ s/:([0-9]+)$// ? $1 : 80;

        # register the request so that parallel requests for the same URI
        # from the same address can be detected
        weaken($uri{$self->{remote_addr}}{$self->{uri}}{$self*1} = $self);

        eval {
            $self->map_uri;
            $self->respond;
        };

        $self->eoconn;

        # err objects mean "response already sent"; anything else is a
        # real failure and is passed on
        die if $@ && !ref $@;

        last if $self->{h}{connection} =~ /close/ || $self->{version} lt "1.1";

        $self->slog(9, "persistent connection [".$self->{h}{"user-agent"}."][$self->{reqs}]");
        $fh->timeout($::PER_TIMEOUT);
    }
}
311
# uri => path mapping
#
# Decodes and normalises the request URI, stores the result in
# $self->{name}, sets $self->{path} to "$::DOCROOT/<host><uri>" (host taken
# from the Host header, "default" when absent) and finally runs
# $self->access_check.  Requests that could address something outside the
# host's directory are answered with "400 bad request" via err.
sub map_uri {
    my $self = shift;
    my $host = $self->{h}{host} || "default";
    my $uri  = $self->{uri};

    # The host becomes a directory name below the document root and comes
    # straight from the client: refuse path separators, NUL bytes and names
    # starting with a dot (".", "..", hidden directories).
    $host =~ m{\A\.|[/\\\000]}
        and $self->err(400, "bad request");

    # some massaging, also makes it more secure
    $uri =~ s/%([0-9a-fA-F][0-9a-fA-F])/chr hex $1/ge;

    # only absolute paths are mapped; a NUL byte would cut the path short
    # at the system call level
    $uri =~ m{\A/} && $uri !~ /\000/
        or $self->err(400, "bad request");

    $uri =~ s%//+%/%g;
    $uri =~ s%/\.(?=/|$)%%g;
    1 while $uri =~ s%/[^/]+/\.\.(?=/|$)%%;

    $uri =~ m%^/?\.\.(?=/|$)%
        and $self->err(400, "bad request");

    $self->{name} = $uri;

    # now do the path mapping
    $self->{path} = "$::DOCROOT/$host$uri";

    $self->access_check;
}
334
# Return (address, port) of the local end of the connection: the address as
# a dotted-quad string, then the port number.  Answers with a 500 error when
# the socket name cannot be decoded.
sub server_address {
    my ($self) = @_;

    my @sockaddr = unpack_sockaddr_in($self->{fh}->getsockname);
    @sockaddr
        or $self->err(500, "unable to get socket name");

    my ($port, $iaddr) = @sockaddr;
    return (inet_ntoa($iaddr), $port);
}
341
# Name of the server as seen by the client: the Host request header when one
# was sent, otherwise the local address of the connection.
sub server_host {
    my ($self) = @_;

    return (exists $self->{h}{host})
        ? $self->{h}{host}
        : ($self->server_address)[0];
}
350
# "host" or "host:port" for building absolute URLs; the port is left out
# when it is 80.  Host and port come from the Host request header when one
# was sent, otherwise from the local address of the connection.
sub server_hostport {
    my ($self) = @_;

    my ($name, $number) = exists $self->{h}{host}
        ? ($self->{h}{host}, $self->{server_port})
        : $self->server_address;

    my $suffix = $number == 80 ? "" : ":$number";
    return $name . $suffix;
}
362
# Run the program $path as a CGI-style child with its standard output
# connected to the client socket.
#
#   $self->_cgi($path)
#
# The child changes to $::DOCROOT, sets a few environment variables and
# execs $path; if anything fails it exits immediately.  The parent returns
# right after forking and does not wait for the child.  A failed fork is
# answered with a 500 error.
sub _cgi {
    my $self = shift;
    my $path = shift;

    # no two-way xxx supported
    my $pid = fork;

    # fork returns undef on failure; comparing that with 0 would send the
    # server itself down the child branch
    defined $pid
        or $self->err(500, "unable to fork");

    return if $pid; # parent

    # child
    if (open STDOUT, ">&".fileno($self->{fh}) and chdir $::DOCROOT) {
        $ENV{SERVER_SOFTWARE} = "thttpd-myhttpd"; # we are thttpd-alike
        $ENV{HTTP_HOST}       = $self->server_host;
        $ENV{HTTP_PORT}       = $self->{server_port};
        $ENV{SCRIPT_NAME}     = $self->{name};
        # indirect-object form: $path is never handed to a shell
        exec { $path } $path;
    }
    Coro::State::_exit(0);
}
382
# Send the response for the path computed by map_uri.
#
# Readable directories are redirected to the URL with a trailing "/" when it
# is missing, otherwise answered with their index.html or a generated
# listing (or "304 not modified").  Readable, non-executable regular files
# are sent as they are; executable files give 403, everything else 404.
#
# The stat and file test calls below share the "_" stat cache with
# handle_file, so their order matters.
sub respond {
    my $self = shift;
    my $path = $self->{path};

    stat $path
        or $self->err(404, "not found");

    $self->{stat} = [stat _];

    # idiotic netscape sends idiotic headers AGAIN
    my $ims = 0;
    if ($self->{h}{"if-modified-since"} =~ /^([^;]+)/) {
        $ims = str2time($1);
    }

    unless (-d _ && -r _) {
        if (-f _ && -r _) {
            # plain file
            -x _ and $self->err(403, "forbidden");
            return $self->handle_file;
        }
        return $self->err(404, "not found");
    }

    # directory
    if ($path !~ /\/$/) {
        # create a redirect to get the trailing "/"
        my $host = $self->server_hostport;
        return $self->err(301, "moved permanently", { Location => "http://$host$self->{uri}/" });
    }

    $ims < $self->{stat}[9]
        or $self->err(304, "not modified");

    if (-r "$path/index.html") {
        $self->{path} .= "/index.html";
        return $self->handle_file;
    }

    return $self->handle_dir;
}
420
# Answer a directory request with the HTML index produced by diridx.
sub handle_dir {
    my ($self) = @_;

    my $listing = $self->diridx;
    my %headers = (
        "Content-Type"   => "text/html",
        "Content-Length" => length $listing,
    );

    $self->response(200, "ok", \%headers, $listing);
}
432
# Send the regular file $self->{path} to the client.
#
# Size and modification time are taken from the "_" stat cache, so the
# caller must have stat'ed (or file-tested) exactly this file last.
#
# A "Range: bytes=..." header is honoured for a single range: the first
# satisfiable range in the list is served as "206 partial content".  If no
# range is satisfiable the answer is 416; if a range specification cannot
# be parsed the header is ignored and the whole file is sent.  With
# $::NO_SEGMENTED set, a range not starting at byte 0 is refused while
# another request for the same URI from the same address is registered.
#
# For GET requests the data is read with aio_read in chunks of at most
# $::BUFSIZE bytes and written to the client; both $::written and
# $self->{written} are updated.
sub handle_file {
    my $self   = shift;
    # -s yields an empty string for an empty file; use a real 0 instead
    my $length = (-s _) || 0;
    my $hdr    = {
        "Last-Modified" => time2str((stat _)[9]),
    };

    my @code = (200, "ok");
    my ($first, $last) = (0, $length - 1);

    if ($self->{h}{range} =~ /^bytes=(.*)$/) {
        my $usable = 1; # cleared when a range spec cannot be parsed
        my $found  = 0; # set when a satisfiable range was found
        my ($lo, $hi);

        for my $spec (split /,/, $1) {
            if ($spec =~ /^-(\d+)$/) {
                # the last N bytes; a suffix longer than the file means
                # the whole file
                my $n = $1 > $length ? $length : $1;
                ($lo, $hi) = ($length - $n, $length - 1);
            } elsif ($spec =~ /^(\d+)-(\d*)$/) {
                # an absent end, or one beyond the file, means "to the end"
                ($lo, $hi) = ($1, ($2 ne "" && $2 < $length) ? $2 : $length - 1);
            } else {
                $usable = 0;
                last;
            }

            if ($lo >= 0 && $lo < $length && $hi >= 0 && $hi >= $lo) {
                $found = 1;
                last;
            }
        }

        if ($usable) {
            unless ($found) {
                $hdr->{"Content-Range"}  = "bytes */$length";
                # the body of this reply is empty
                $hdr->{"Content-Length"} = 0;
                $self->slog(9, "not satisfiable($self->{h}{range}|".$self->{h}{"user-agent"}.")");
                $self->err(416, "not satisfiable", $hdr, "");
            }

            # check for segmented downloads
            if ($lo && $::NO_SEGMENTED) {
                if (scalar(keys %{ $uri{$self->{remote_addr}}{$self->{uri}} }) > 1) {
                    $self->err(400, "segmented downloads are not allowed");
                }
            }

            ($first, $last) = ($lo, $hi);
            $hdr->{"Content-Range"} = "bytes $first-$last/$length";
            @code   = (206, "partial content");
            $length = $last - $first + 1;
        }
    }

    # capture the extension from this match only; $1 would otherwise still
    # hold the capture of an earlier match when the path has no extension
    my ($ext) = $self->{path} =~ /\.([^.]+)$/;
    $hdr->{"Content-Type"}   = (defined $ext && $mimetype{lc $ext}) || "application/octet-stream";
    $hdr->{"Content-Length"} = $length;

    $self->response(@code, $hdr, "");

    if ($self->{method} eq "GET") {
        my ($buf, $r);
        my $current = $Coro::current;

        open my $fh, "<", $self->{path}
            or die "$self->{path}: late open failure ($!)";

        my $offset = $first;
        my $left   = $last - $first + 1; # bytes still to be sent

        while ($left > 0) {
            my $chunk = $left > $::BUFSIZE ? $::BUFSIZE : $left;

            # start the read and sleep until the callback wakes us up
            aio_read($fh, $offset, $chunk, $buf, 0, sub {
                $r = $_[0];
                $current->ready;
            });
            Coro::schedule();

            # stop at end of file and on read errors
            last unless $r && $r > 0;

            my $w = $self->{fh}->syswrite($buf)
                or last;
            $::written       += $w;
            $self->{written} += $w;

            $offset += $r;
            # without this the loop ran to end of file even for a range
            $left   -= $r;
        }

        close $fh;
    }

    return;
}
520
521 1;