ViewVC Help
View File | Revision Log | Show Annotations | Download File
/cvs/Coro/myhttpd/httpd.pl
Revision: 1.26
Committed: Sun Aug 19 22:59:35 2001 UTC (22 years, 10 months ago) by root
Content type: text/plain
Branch: MAIN
Changes since 1.25: +6 -6 lines
Log Message:
*** empty log message ***

File Contents

# Content
1 use Coro;
2 use Coro::Semaphore;
3 use Coro::Event;
4 use Coro::Socket;
5
6 no utf8;
7 use bytes;
8
9 # at least on my machine, this thingy serves files
10 # quite a bit faster than apache, ;)
11 # and quite a bit slower than thttpd :(
12
# Writing to a socket whose peer has gone away must show up as a failed
# write in the writing code, not as a fatal SIGPIPE for the whole server.
$SIG{PIPE} = 'IGNORE';

# slog LEVEL, FORMAT [, ARGS...]
#
# Print one log line, prefixed with "---: ", to the currently selected
# output handle.  LEVEL is accepted but not used for filtering here.
#
# FORMAT is only interpreted as a printf template when ARGS are supplied.
# Callers in this file pass fully composed messages that contain
# client-controlled text (addresses, user-agents, error strings); treating
# such a message as a template would mangle any "%" in it, so a call
# without ARGS prints the message verbatim.
sub slog {
    my ($level, $format, @args) = @_;

    my $message = @args ? sprintf($format, @args) : $format;
    print "---: $message\n";
}
20
# Semaphore sized by $MAX_CONNECTS: the acceptor takes a slot ("down")
# before accepting and a handler gives it back ("up") when it is done
# with the connection.
my $connections = Coro::Semaphore->new($MAX_CONNECTS);

# @newcons: accepted connections (array refs holding the accept() result)
#           that no handler has picked up yet.
# @pool:    handler coroutines that are parked waiting for work.
my (@newcons, @pool);
25
# One "execution thread": the body of every handler coroutine.
#
# Repeatedly takes a pending connection off @newcons, wraps it in a conn
# object and runs its request loop.  Plain-string exceptions are logged;
# exception objects (conn::err dies with one after it has already sent the
# error response) are dropped silently.  Either way the connection's
# semaphore slot is released afterwards.
#
# With nothing to do, the coroutine parks itself in @pool and yields until
# the acceptor readies it again -- unless the pool already holds $MAX_POOL
# idle handlers, in which case this coroutine ends.
sub handler {
    while () {
        if (my $new = pop @newcons) {
            eval {
                conn->new(@$new)->handle;
            };
            # The error text is data, not a printf template: pass it as an
            # argument so a "%" in it (e.g. from a path) is logged verbatim.
            slog(1, "%s", "$@") if $@ && !ref $@;
            $connections->up;
        } else {
            last if @pool >= $MAX_POOL;
            push @pool, $Coro::current;
            schedule;
        }
    }
}
43
# The listening socket, bound to $SERVER_HOST:$SERVER_PORT.  Startup is
# aborted when it cannot be created.
my $http_port = Coro::Socket->new(
    LocalAddr => $SERVER_HOST,
    LocalPort => $SERVER_PORT,
    ReuseAddr => 1,
    Listen    => 50,
) or die "unable to start server";

# Record the listener in the global list of listening sockets.
push @listen_sockets, $http_port;
52
# The "main thread": accepts connections and hands them to handlers.
#
# Each iteration first takes a slot from the connection semaphore, then
# queues the result of accept() on @newcons, refreshes the cached clock
# $::NOW, and finally wakes a parked handler -- or starts a new handler
# coroutine when none is parked.
async {
    slog(1, "accepting connections");

    for (;;) {
        $connections->down;
        push @newcons, [ $http_port->accept ];
        #slog 3, "accepted @$connections ".scalar(@pool);
        $::NOW = time;

        unless (@pool) {
            async \&handler;
            next;
        }

        (pop @pool)->ready;
    }
};
69
70 package conn;
71
72 use Socket;
73 use HTTP::Date;
74 use Convert::Scalar 'weaken';
75 use Linux::AIO;
76
# Configure Linux::AIO with the parallelism given by $::AIO_PARALLEL.
Linux::AIO::min_parallel($::AIO_PARALLEL);

# Run Linux::AIO's poll callback whenever its poll file descriptor becomes
# readable, so completed requests get their callbacks invoked.
Event->io(
    fd    => Linux::AIO::poll_fileno(),
    poll  => 'r',
    async => 1,
    cb    => \&Linux::AIO::poll_cb,
);

# Package-wide bookkeeping:
#   %conn      $conn{ip}{self} => connobj
#   %uri       $uri{ip}{uri}{self}
#   %blocked   $blocked{ip} => time until which that address is blocked
#   %mimetype  lower-cased key from the mime_types file => content type
our (%conn, %uri, %blocked, %mimetype);
87
# Load %mimetype from the file "mime_types" in the current directory.
#
# Each usable line has the form "<key><TAB(s)><type>"; keys are stored
# lower-cased.  Lines whose first character is "#" or whitespace, and lines
# that do not fit the pattern, are skipped.  A missing or unreadable file
# is reported on the selected output handle and otherwise ignored.
sub read_mimetypes {
    if (open my $types, "<", "mime_types") {
        # A lexical line variable keeps the caller's $_ intact.
        while (my $line = <$types>) {
            # The key may be a single character ("c", "h", "z"); the
            # earlier pattern needed at least two and dropped those.
            $mimetype{lc $1} = $2
                if $line =~ /^([^#\s]\S*)\t+(\S+)$/;
        }
        close $types;
    } else {
        print "cannot open mime_types\n";
    }
}

read_mimetypes();
102
# conn->new($peername, $fh)
#
# Create the object for one accepted connection.  $peername is the packed
# socket address of the peer, $fh the connected socket handle.
#
# The object records the peer's dotted-quad address ("remote_addr") and
# the cached clock value $::NOW ("time"), and registers itself, through a
# weak reference, in %conn under its peer address.
#
# Dies if the peer name cannot be decoded.
sub new {
    my ($class, $peername, $fh) = @_;
    my $self = bless { fh => $fh }, $class;

    # Count the object as soon as it exists: DESTROY decrements $::conns
    # unconditionally, so a failure below must not leave the counter one
    # too low.
    $::conns++;

    my (undef, $iaddr) = unpack_sockaddr_in($peername)
        or $self->err(500, "unable to decode peername");

    $self->{remote_addr} = inet_ntoa($iaddr);
    $self->{time}        = $::NOW;

    # enter ourselves into various lists
    weaken($conn{$self->{remote_addr}}{$self*1} = $self);

    $self;
}
121
# Destructor: undo the bookkeeping done for this connection.
#
# Decrements $::conns, removes any per-URI registration (eoconn) and
# removes the object from %conn.  The per-address hash in %conn is deleted
# once its last connection is gone, so %conn does not keep one empty hash
# for every address that ever connected.
sub DESTROY {
    my $self = shift;

    $::conns--;

    $self->eoconn;

    # No address is recorded when construction failed early; there is
    # nothing to unregister then (and nothing should be autovivified).
    my $ip = $self->{remote_addr};
    return unless defined $ip;

    if (my $peers = $conn{$ip}) {
        delete $peers->{$self*1};
        delete $conn{$ip} unless %$peers;
    }

    return;
}
130
# End of request: drop this connection's registration in %uri
# ($uri{remote_addr}{uri}{self}).
#
# Levels of %uri that become empty are removed as well; the keys come from
# remote input (peer addresses and request URIs), so leaving them behind
# would let the table grow without bound.  Nothing is touched -- and
# nothing autovivified -- when the connection has no address or has not
# parsed a request yet (DESTROY calls this unconditionally).
sub eoconn {
    my $self = shift;

    my ($ip, $uri) = @$self{qw(remote_addr uri)};
    return unless defined $ip && defined $uri;

    my $by_uri  = $uri{$ip}       or return;
    my $holders = $by_uri->{$uri} or return;

    delete $holders->{$self*1};
    delete $by_uri->{$uri} unless %$holders;
    delete $uri{$ip}       unless %$by_uri;

    return;
}
136
# $conn->slog($level, $message)
#
# Log $message through main::slog, prefixed with "<remote_addr>> ".
#
# The composed line contains client-controlled text, so it is handed over
# as the argument of a "%s" template instead of as the template itself.
sub slog {
    my ($self, $level, $message) = @_;
    main::slog($level, "%s", "$self->{remote_addr}> $message");
}
141
# $conn->response($code, $msg, \%hdr, $content)
#
# Send a response head -- status line "HTTP/1.1 $code $msg", a Date header
# built from $::NOW and every header in %hdr -- followed by $content when
# it is defined and the request method is not HEAD.  One access-log line
# is written to STDERR.
#
# Adds the number of bytes handed to the socket to $self->{written} and
# returns the updated total.
sub response {
    my ($self, $code, $msg, $hdr, $content) = @_;
    my $res = "HTTP/1.1 $code $msg\015\012";

    #$res .= "Connection: close\015\012";
    $res .= "Date: " . time2str($::NOW) . "\015\012"; # slow? nah. :(

    while (my ($h, $v) = each %$hdr) {
        $res .= "$h: $v\015\012";
    }
    $res .= "\015\012";

    $res .= $content if defined $content and $self->{method} ne "HEAD";

    print STDERR "$self->{remote_addr} \"$self->{uri}\" $code ".$hdr->{"Content-Length"}." \"$self->{h}{referer}\"\n";

    # print() returns a success flag, not a byte count; account for the
    # length of what was sent.
    my $sent = print {$self->{fh}} $res;
    $self->{written} += $sent ? length $res : 0;
}
161
# $conn->err($code, $msg [, \%hdr [, $content]])
#
# Send an error (or redirect / not-modified) response and abort the
# current request by dying with an object blessed into "err".
#
# Without $content, a text/plain body "$code $msg" is generated together
# with its Content-Length -- except for status codes that must not carry a
# body (1xx, 204, 304): for those no body and no body headers are
# produced, otherwise the stray bytes would be read as the start of the
# next response on a persistent connection.  "Connection: close" is always
# added.  The caller's %hdr is modified in place.
sub err {
    my $self = shift;
    my ($code, $msg, $hdr, $content) = @_;

    my $bodyless = $code == 204 || $code == 304
                || ($code >= 100 && $code < 200);

    if ($bodyless) {
        undef $content;
    } elsif (!defined $content) {
        $content = "$code $msg";
        $hdr->{"Content-Type"}   = "text/plain";
        $hdr->{"Content-Length"} = length $content;
    }
    $hdr->{"Connection"} = "close";

    $self->response($code, $msg, $hdr, $content);

    die bless {}, 'err';
}
177
# $conn->err_blocked
#
# Refuse a client that is (or has just become) blocked.  The block for the
# client's address is (re)started so that it expires $::BLOCKTIME seconds
# after $::NOW, the coroutine then waits a random time of up to 20 seconds,
# and finally a 401 response naming the expiry time is sent through err(),
# which does not return.  Arguments other than the object are ignored.
sub err_blocked {
    my ($self) = @_;

    my $ip = $self->{remote_addr};
    $blocked{$ip} = $::NOW + $::BLOCKTIME;
    my $time = time2str($blocked{$ip});

    my %headers = (
        "Content-Type"     => "text/html",
        "Retry-After"      => $::BLOCKTIME,
        "Warning"          => "Please do NOT retry, you have been blocked",
        "WWW-Authenticate" => "Basic realm=\"Please do NOT retry, you have been blocked\"",
    );

    my $page = <<EOF;
<html><p>
You have been blocked because you opened too many connections. You
may retry at</p>

<p><blockquote>$time.</blockquote></p>

<p>Until then, each new access will renew the block. You might want to have a
look at the <a href="http://www.goof.com/pcg/marc/animefaq.html">FAQ</a>.</p>
</html>
EOF

    Coro::Event::do_timer(after => 20 * rand());

    $self->err(401, "too many connections", \%headers, $page);
}
204
# $conn->handle
#
# The request loop of one connection.  For every request it:
#   - reads the request head (up to the empty line); a read that yields
#     nothing ends the loop on a connection that has already served a
#     request and is answered with 408 otherwise;
#   - refuses clients that are blocked or that hold more than
#     $::MAX_CONN_IP connections;
#   - parses the request line (only GET and HEAD, only HTTP/1.x) and the
#     header fields into $self->{method,uri,version,h};
#   - registers itself in %uri, then maps the URI and sends the response.
#
# The loop ends when the client asked for "Connection: close", speaks a
# version below 1.1, or the request ended in an error response (which
# announces "Connection: close").  Plain-string exceptions raised while
# responding are re-thrown to the caller.
sub handle {
    my $self = shift;
    my $fh = $self->{fh};

    $fh->timeout($::REQ_TIMEOUT);
    while () {
        $self->{reqs}++;

        # read request and parse first line
        my $req = $fh->readline("\015\012\015\012");

        unless (defined $req) {
            last if exists $self->{version};
            $self->err(408, "request timeout");
        }

        $self->{h} = {};

        $fh->timeout($::RES_TIMEOUT);
        my $ip = $self->{remote_addr};

        if ($blocked{$ip}) {
            $self->err_blocked($blocked{$ip})
                if $blocked{$ip} > $::NOW;

            delete $blocked{$ip};
        }

        # Count keys explicitly: a hash in numeric context yields the number
        # of used buckets, not of entries, on perls older than 5.26.
        if (scalar(keys %{ $conn{$ip} || {} }) > $::MAX_CONN_IP) {
            $self->slog(2, "blocked ip $ip");
            $self->err_blocked;
        }

        # /g leaves pos($req) after the request line for the \G matches below
        $req =~ /^(?:\015\012)?
                 (GET|HEAD) \040+
                 ([^\040]+) \040+
                 HTTP\/([0-9]+\.[0-9]+)
                 \015\012/gx
            or $self->err(405, "method not allowed", { Allow => "GET,HEAD" });

        $self->{method}  = $1;
        $self->{uri}     = $2;
        $self->{version} = $3;

        # 505 is "HTTP Version Not Supported"
        $self->{version} =~ /^1\./
            or $self->err(505, "http protocol version $self->{version} not supported");

        # parse headers
        {
            my (%hdr, $h, $v);

            # Optional whitespace after the colon and at the start of a
            # continuation line is TAB (\011) or SPACE (\040).  Repeated
            # fields are joined with ","; the leading "," is cut off below.
            $hdr{lc $1} .= ",$2"
                while $req =~ /\G
                    ([^:\000-\040]+):
                    [\011\040]*
                    ((?: [^\015\012]+ | \015\012[\011\040] )*)
                    \015\012
                /gxc;

            $req =~ /\G\015\012$/
                or $self->err(400, "bad request");

            $self->{h}{$h} = substr $v, 1
                while ($h, $v) = each %hdr;
        }

        $self->{server_port} = $self->{h}{host} =~ s/:([0-9]+)$// ? $1 : 80;

        weaken ($uri{$self->{remote_addr}}{$self->{uri}}{$self*1} = $self);

        eval {
            $self->map_uri;
            $self->respond;
        };
        my $error = $@;    # keep it safe from anything eoconn might do

        $self->eoconn;

        die $error if $error && !ref $error;

        # An exception object means an error response went out, and that
        # response said "Connection: close" -- so do close.
        last if ref $error;

        last if $self->{h}{connection} =~ /close/i || $self->{version} lt "1.1";

        $self->slog(9, "persistent connection [".$self->{h}{"user-agent"}."][$self->{reqs}]");
        $fh->timeout($::PER_TIMEOUT);
    }
}
293
# uri => path mapping
#
# Derives the filesystem path for the current request from the Host header
# ("default" when absent) and the request URI, stores the cleaned-up URI in
# $self->{name} and the path ("$::DOCROOT/<host><uri>") in $self->{path},
# then runs the access check.
#
# Answers 400 (through err, which does not return) when the URI still
# climbs above its root after normalisation, or when the Host value could
# change the directory being served.
sub map_uri {
    my $self = shift;
    my $host = $self->{h}{host} || "default";
    my $uri = $self->{uri};

    # The host name becomes a directory name below the document root and is
    # supplied by the client: it must not contain a path separator or NUL,
    # nor start with a dot ("..", hidden directories).
    if ($host =~ m{[/\\\000]} || $host =~ /^\./) {
        $self->err(400, "bad request");
    }

    # some massaging, also makes it more secure
    $uri =~ s/%([0-9a-fA-F][0-9a-fA-F])/chr hex $1/ge;   # decode %XX first
    $uri =~ s%//+%/%g;                                   # collapse slashes
    $uri =~ s%/\.(?=/|$)%%g;                             # drop "/." segments
    1 while $uri =~ s%/[^/]+/\.\.(?=/|$)%%;              # resolve "dir/.."

    $uri =~ m%^/?\.\.(?=/|$)%
        and $self->err(400, "bad request");

    $self->{name} = $uri;

    # now do the path mapping
    $self->{path} = "$::DOCROOT/$host$uri";

    $self->access_check;
}
316
# Returns (dotted-quad address, port) of the local end of the connection,
# decoded from the socket's own name.  Answers 500 through err() when
# decoding yields nothing.
sub server_address {
    my ($self) = @_;

    my @decoded = unpack_sockaddr_in($self->{fh}->getsockname);
    @decoded
        or $self->err(500, "unable to get socket name");

    my ($port, $iaddr) = @decoded;
    return (inet_ntoa($iaddr), $port);
}
323
# Host name of this server as the client sees it: the request's Host header
# when one was sent, otherwise the local address of the socket.
sub server_host {
    my ($self) = @_;

    return exists $self->{h}{host}
        ? $self->{h}{host}
        : ($self->server_address)[0];
}
332
# "host" or "host:port" for building absolute URLs: taken from the Host
# header and the port parsed from it when the header was sent, otherwise
# from the socket's local address.  Port 80 is left out.
sub server_hostport {
    my ($self) = @_;

    my ($host, $port) = exists $self->{h}{host}
        ? ($self->{h}{host}, $self->{server_port})
        : $self->server_address;

    return $port == 80 ? $host . "" : $host . ":$port";
}
344
# $conn->_cgi($path)
#
# Run the program at $path in a child process whose standard output is the
# client socket (no two-way communication is supported).  The child changes
# into $::DOCROOT and gets SERVER_SOFTWARE, HTTP_HOST, HTTP_PORT and
# SCRIPT_NAME in its environment.  The parent returns immediately and does
# not wait for the child here.
#
# Dies with a plain string when no child could be created.
sub _cgi {
    my $self = shift;
    my $path = shift;

    # fork returns undef on failure, and undef == 0 is true: the failure
    # case has to be told apart, or the server itself would go on to
    # redirect its STDOUT and exec the program.
    my $pid = fork;
    defined $pid
        or die "unable to fork for $path: $!";

    if ($pid == 0) {
        if (open(STDOUT, ">&", fileno($self->{fh})) && chdir $::DOCROOT) {
            $ENV{SERVER_SOFTWARE} = "thttpd-myhttpd"; # we are thttpd-alike
            $ENV{HTTP_HOST}       = $self->server_host;
            $ENV{HTTP_PORT}       = $self->{server_port};
            $ENV{SCRIPT_NAME}     = $self->{name};
            # indirect-object form: never hand the path to a shell
            exec { $path } $path;
        }
        # setup or exec failed; leave the child without running the
        # parent's cleanup code
        Coro::State::_exit(0);
    }

    return;
}
364
# $conn->respond
#
# Answer the current request from $self->{path}:
#   - nothing there, or neither a readable directory nor a readable plain
#     file: 404;
#   - readable directory without trailing "/": 301 to the same URI with
#     the slash appended;
#   - readable directory with trailing "/": 304 unless it was modified
#     after the If-Modified-Since time; otherwise its index.html (when
#     readable) or a generated listing;
#   - readable plain file: 403 when it is executable, otherwise the file.
#
# The stat result is kept in $self->{stat}.  The order of the stat and
# file-test operations matters: handle_file reads the "_" stat buffer left
# behind here.
sub respond {
    my ($self) = @_;
    my $path = $self->{path};

    unless (stat $path) {
        $self->err(404, "not found");
    }

    $self->{stat} = [stat _];

    # idiotic netscape sends idiotic headers AGAIN
    my $ims = 0;
    if ($self->{h}{"if-modified-since"} =~ /^([^;]+)/) {
        $ims = str2time($1);
    }

    if (-d _ && -r _) {
        # directory
        if ($path =~ /\/$/) {
            unless ($ims < $self->{stat}[9]) {
                $self->err(304, "not modified");
            }

            if (-r "$path/index.html") {
                $self->{path} .= "/index.html";
                $self->handle_file;
            } else {
                $self->handle_dir;
            }
        } else {
            # create a redirect to get the trailing "/"
            my $host = $self->server_hostport;
            $self->err(301, "moved permanently", { Location => "http://$host$self->{uri}/" });
        }
    } elsif (-f _ && -r _) {
        $self->err(403, "forbidden") if -x _;
        $self->handle_file;
    } else {
        $self->err(404, "not found");
    }
}
402
# $conn->handle_dir
#
# Send the directory index produced by diridx as a 200 text/html response.
sub handle_dir {
    my ($self) = @_;

    my $listing = $self->diridx;
    my %headers = (
        "Content-Type"   => "text/html",
        "Content-Length" => length $listing,
    );

    $self->response(200, "ok", \%headers, $listing);
}
414
# $conn->handle_file
#
# Send the file at $self->{path}.  Size and modification time are taken
# from the "_" stat buffer, i.e. from the caller's most recent stat or file
# test, so nothing may stat another file before the first two statements.
#
# A "Range: bytes=..." header is honoured for the first satisfiable range
# in its list (206); a list containing an unparsable entry before any
# satisfiable one is ignored (200, whole file); a list without any
# satisfiable range is answered with 416.  With $::NO_SEGMENTED set, a
# range that does not start at 0 is refused (400) while the same client has
# another request for the same URI in progress.
#
# For GET the data is read with aio_read in pieces of at most $::BUFSIZE
# bytes and written to the client; $::written and $self->{written} are
# advanced by the bytes written.  Dies with a plain string when the file
# can no longer be opened after the response head went out.
sub handle_file {
    my $self = shift;
    my $length = -s _;
    my $hdr = {
        "Last-Modified" => time2str((stat _)[9]),
    };

    my @code = (200, "ok");
    my ($l, $h) = (0, $length - 1);    # first and last byte to send

    if ($self->{h}{range} =~ /^bytes=(.*)$/) {
        my $verdict = "unsatisfiable";

        for my $spec (split /,/, $1) {
            my ($first, $last);

            if ($spec =~ /^-(\d+)$/) {
                # the last N bytes; N larger than the file means all of it
                $first = $1 > $length ? 0 : $length - $1;
                $last  = $length - 1;
            } elsif ($spec =~ /^(\d+)-(\d*)$/) {
                # an open or too large end is clamped to the last byte
                $first = $1;
                $last  = ($2 ne "" && $2 < $length) ? $2 : $length - 1;
            } else {
                $verdict = "ignore";
                last;
            }

            if ($first >= 0 && $first < $length && $last >= 0 && $last >= $first) {
                ($l, $h) = ($first, $last);
                $verdict = "partial";
                last;
            }
        }

        if ($verdict eq "unsatisfiable") {
            $hdr->{"Content-Range"}  = "bytes */$length";
            # the body sent with this response is empty
            $hdr->{"Content-Length"} = 0;
            $self->slog(9, "not satisfiable($self->{h}{range}|".$self->{h}{"user-agent"}.")");
            $self->err(416, "not satisfiable", $hdr, "");
        }

        if ($verdict eq "partial") {
            # check for segmented downloads
            if ($l && $::NO_SEGMENTED) {
                my $same = $uri{$self->{remote_addr}}{$self->{uri}} || {};
                if (keys(%$same) > 1) {
                    $self->err(400, "segmented downloads are not allowed");
                }
            }

            $hdr->{"Content-Range"} = "bytes $l-$h/$length";
            @code = (206, "partial content");
            $length = $h - $l + 1;
        }
    }

    # Capture into a variable: after a failed match $1 would still hold
    # whatever an earlier match (e.g. on the range) left in it.
    my ($ext) = $self->{path} =~ /\.([^.\/]+)$/;
    $hdr->{"Content-Type"} = (defined $ext && $mimetype{lc $ext})
                          || "application/octet-stream";
    $hdr->{"Content-Length"} = $length;

    $self->response(@code, $hdr, "");

    if ($self->{method} eq "GET") {
        my $current = $Coro::current;
        open my $fh, "<", $self->{path}
            or die "$self->{path}: late open failure ($!)";

        my $remaining = $h - $l + 1;
        my ($buf, $r);

        while ($remaining > 0) {
            my $want = $remaining > $::BUFSIZE ? $::BUFSIZE : $remaining;

            # read at offset $l; the callback stores the result and wakes
            # this coroutine, which sleeps in schedule until then
            aio_read($fh, $l, $want, $buf, 0, sub {
                $r = $_[0];
                $current->ready;
            });
            Coro::schedule();
            last unless $r > 0;    # end of file or read error

            my $w = $self->{fh}->syswrite($buf)
                or last;
            $::written       += $w;
            $self->{written} += $w;

            $l         += $r;
            # without this, a range ending before the end of the file
            # would be followed by the rest of the file
            $remaining -= $r;
        }

        close $fh;
    }
}
502
503 1;