ViewVC Help
View File | Revision Log | Show Annotations | Download File
/cvs/Coro/myhttpd/httpd.pl
Revision: 1.24
Committed: Sat Aug 18 13:32:17 2001 UTC (22 years, 10 months ago) by root
Content type: text/plain
Branch: MAIN
Changes since 1.23: +8 -3 lines
Log Message:
*** empty log message ***

File Contents

# Content
1 use Coro;
2 use Coro::Semaphore;
3 use Coro::Event;
4 use Coro::Socket;
5
6 no utf8;
7 use bytes;
8
9 # at least on my machine, this thingy serves files
10 # quite a bit faster than apache, ;)
11 # and quite a bit slower than thttpd :(
12
13 $SIG{PIPE} = 'IGNORE';
14
# Print one log line to STDOUT, prefixed with "---: ".
#
# Arguments:
#   $level  - log level; accepted but not used for filtering here
#   $format - printf-style format string
#   @args   - values for the conversions in $format
sub slog {
    my ($level, $format, @args) = @_;
    printf "---: $format\n", @args;
}
20
# Semaphore initialised with $MAX_CONNECTS; the accept loop takes one unit
# per accepted connection and a handler gives it back when it is done.
my $connections = Coro::Semaphore->new($MAX_CONNECTS);

# Accepted connections waiting for a handler; each entry is an array
# reference holding whatever accept returned.
my @newcons;

# Handler coroutines that ran out of work and are waiting to be woken up.
my @pool;
26 # one "execution thread"
# Body of one handler coroutine.
#
# Repeatedly takes a pending connection off @newcons, serves it and releases
# the connection semaphore.  When there is no work the coroutine parks itself
# in @pool and yields, unless the pool already holds $MAX_POOL idle handlers,
# in which case it terminates.
sub handler {
    while () {
        my $new = pop @newcons;
        if ($new) {
            eval {
                conn->new(@$new)->handle;
            };
            # Exceptions that are references are deliberate (the connection
            # code dies with a blessed object after sending an error
            # response); only plain strings are logged.  The text is passed
            # as an argument, never as the format, so a "%" in the message
            # cannot be interpreted by printf.
            slog(1, "%s", "$@") if $@ && !ref $@;
            $connections->up;
        } else {
            last if @pool >= $MAX_POOL;
            push @pool, $Coro::current;
            schedule;
        }
    }
}
43
# Create the listening socket on the configured address and port.
my $http_port = Coro::Socket->new(
    LocalAddr => $SERVER_HOST,
    LocalPort => $SERVER_PORT,
    ReuseAddr => 1,
    Listen    => 50,
) or die "unable to start server";

push @listen_sockets, $http_port;
52
53 # the "main thread"
async {
    slog 1, "accepting connections";

    while () {
        # wait until we are allowed to take on another connection
        $connections->down;

        # queue whatever accept returns for a handler coroutine
        push @newcons, [$http_port->accept];
        #slog 3, "accepted @$connections ".scalar(@pool);

        # cached timestamp read by the connection code
        $::NOW = time;

        # wake an idle handler if there is one, otherwise start a new one
        unless (@pool) {
            async \&handler;
            next;
        }
        (pop @pool)->ready;
    }
};
69
70 package conn;
71
72 use Socket;
73 use HTTP::Date;
74 use Convert::Scalar 'weaken';
75 use Linux::AIO;
76
# Configure Linux::AIO with the requested parallelism
# (see the Linux::AIO documentation for the exact meaning of min_parallel).
Linux::AIO::min_parallel($::AIO_PARALLEL);

# Have the event loop call Linux::AIO::poll_cb whenever the AIO poll
# descriptor becomes readable.
Event->io(
    fd    => Linux::AIO::poll_fileno(),
    poll  => 'r',
    async => 1,
    cb    => \&Linux::AIO::poll_cb,
);

our %conn;      # $conn{ip}{fh} => connobj
our %blocked;   # ip => time until which that address stays blocked
our %mimetype;  # lower-cased file extension => content type
86
# Load the extension => content-type table from the file "mime_types" in the
# current directory into %mimetype.
#
# Each usable line has the form "<extension><TAB(s)><type>".  Lines starting
# with "#" or whitespace, and lines that do not match, are skipped.  Keys are
# stored lower-cased.  If the file cannot be opened a message is printed and
# the table is left as it is.
sub read_mimetypes {
    if (open my $fh, "<", "mime_types") {
        # a lexical line variable keeps the caller's $_ intact
        while (my $line = <$fh>) {
            # \S* (not \S+) so that one-character extensions such as "c" or
            # "h" are accepted; \s* tolerates trailing blanks and CRLF
            if ($line =~ /^([^#\s]\S*)\t+(\S+)\s*$/) {
                $mimetype{lc $1} = $2;
            }
        }
        close $fh;
    } else {
        print "cannot open mime_types\n";
    }
}

read_mimetypes();
101
# Constructor for one client connection.
#
# Arguments:
#   $class    - class to bless into
#   $peername - packed sockaddr_in of the peer
#   $fh       - the connection's socket handle
#
# Records the peer's dotted-quad address and the current cached time,
# registers the object (weakly) in %conn under its address and counts it in
# $::conns.  Returns the new object.
sub new {
    my ($class, $peername, $fh) = @_;
    my $self = bless { fh => $fh }, $class;

    # Count the object as soon as it exists: DESTROY decrements the counter
    # unconditionally, so incrementing only after the calls below (which can
    # die) would leave the counter one too low for every failed construction.
    $::conns++;

    my (undef, $iaddr) = unpack_sockaddr_in($peername)
        or $self->err(500, "unable to decode peername");

    $self->{remote_addr} = inet_ntoa($iaddr);
    $self->{time}        = $::NOW;

    # enter ourselves into various lists; the reference is weak so that the
    # registry does not keep the connection alive
    weaken($conn{$self->{remote_addr}}{$self*1} = $self);

    $self;
}
120
# Destructor: uncount the connection and remove it from the registries.
sub DESTROY {
    my $self = shift;

    $::conns--;

    $self->eoconn;

    # remote_addr is unset when construction failed early; do not create
    # entries for it
    my $ip = $self->{remote_addr};
    return unless defined $ip && $conn{$ip};

    delete $conn{$ip}{$self*1};

    # drop the per-address hash once its last connection is gone, otherwise
    # %conn keeps one empty hash for every address ever seen
    delete $conn{$ip} unless %{$conn{$ip}};
}
129
130 # end of connection
# Remove this connection from the per-address, per-URI registry %uri.
#
# Safe to call more than once and before any request has been parsed.
sub eoconn {
    # the object must be taken from @_; without this line the lookup below
    # would use an unrelated, undefined package variable and delete nothing
    my $self = shift;

    my ($ip, $uri) = @$self{qw(remote_addr uri)};
    return unless defined $ip && defined $uri;

    my $by_uri  = $uri{$ip}       or return;
    my $by_conn = $by_uri->{$uri} or return;

    delete $by_conn->{$self*1};

    # prune levels that became empty so the registry does not grow with
    # every address and URI ever requested
    delete $by_uri->{$uri} unless %$by_conn;
    delete $uri{$ip}       unless %$by_uri;

    return;
}
134
# Log a message for this connection, prefixed with the peer address.
#
# Arguments: log level, message text.  The message is plain text, not a
# printf format.
sub slog {
    my ($self, $level, $msg) = @_;

    # Messages contain client-supplied data (Range and User-Agent headers),
    # so they are handed to the printf-based logger as arguments rather than
    # as part of the format string.
    main::slog($level, "%s> %s", $self->{remote_addr}, $msg);
}
139
# Send a status line, headers and (optionally) a body to the client.
#
# Arguments:
#   $code, $msg - status code and reason phrase
#   $hdr        - hash reference of extra response headers
#   $content    - body; left out when undefined or when the request method
#                 is HEAD
#
# A Date header built from the cached time $::NOW is always added.  The
# number of bytes handed to the socket is added to $self->{written}.
sub response {
    my ($self, $code, $msg, $hdr, $content) = @_;
    my $res = "HTTP/1.1 $code $msg\015\012";

    #$res .= "Connection: close\015\012";
    $res .= "Date: ".time2str($::NOW)."\015\012"; # slow? nah. :(

    # keys (unlike each) always starts from the beginning of the hash
    for my $name (keys %$hdr) {
        $res .= "$name: $hdr->{$name}\015\012";
    }
    $res .= "\015\012";

    $res .= $content if defined $content and $self->{method} ne "HEAD";

    print STDERR "$self->{remote_addr} \"$self->{uri}\" $code ".$hdr->{"Content-Length"}." \"$self->{h}{referer}\"\n";#d#

    # print returns a success flag, not a byte count, so account for the
    # length of what was sent
    print {$self->{fh}} $res
        and $self->{written} += length $res;
}
159
# Send an error response and abort the current request.
#
# Arguments: status code, reason phrase, optional header hash reference,
# optional body.  Without a body, a plain-text "<code> <message>" body with
# matching Content-Type and Content-Length is generated.  "Connection: close"
# is always set.  Never returns: dies with an object blessed into "err".
sub err {
    my ($self, $code, $msg, $hdr, $content) = @_;

    if (!defined $content) {
        $content = "$code $msg";
        $hdr->{"Content-Type"}   = "text/plain";
        $hdr->{"Content-Length"} = length $content;
    }
    $hdr->{"Connection"} = "close";

    $self->response($code, $msg, $hdr, $content);

    die bless {}, 'err';
}
175
# Block the peer's address for $::BLOCKTIME seconds (counted from $::NOW),
# wait a random time of up to 20 seconds, then send the "blocked" error page.
# Never returns, because err() dies.
sub err_blocked {
    my ($self) = @_;
    my $ip = $self->{remote_addr};

    # every call renews the block
    my $until = $::NOW + $::BLOCKTIME;
    $blocked{$ip} = $until;
    my $time = time2str($until);

    Coro::Event::do_timer(after => 20*rand);

    my %hdr = (
        "Content-Type" => "text/html",
        "Retry-After" => $::BLOCKTIME,
        "Warning" => "Please do NOT retry, you have been blocked",
        "WWW-Authenticate" => "Basic realm=\"Please do NOT retry, you have been blocked\"",
    );

    my $page = <<EOF;
<html><p>
You have been blocked because you opened too many connections. You
may retry at</p>

<p><blockquote>$time.</blockquote></p>

<p>Until then, each new access will renew the block. You might want to have a
look at the <a href="http://www.goof.com/pcg/marc/animefaq.html">FAQ</a>.</p>
</html>
EOF

    $self->err(401, "too many connections", \%hdr, $page);
}
202
# Serve all requests arriving on this connection.
#
# For each request: read the header block, enforce the per-address block list
# and connection limit, parse the request line and headers into
# $self->{method,uri,version,h}, register the request in %uri, then map the
# URI and send the response.  The loop ends when the client stops sending,
# asks for "Connection: close", or speaks a version below 1.1.
#
# Error responses are produced via err(), which dies with an object; such
# exceptions raised while mapping/responding are swallowed here, anything
# else is re-thrown.
sub handle {
    my $self = shift;
    my $fh = $self->{fh};

    $fh->timeout($::REQ_TIMEOUT);
    while () {
        $self->{reqs}++;

        # read request and parse first line
        my $req = $fh->readline("\015\012\015\012");

        unless (defined $req) {
            if (exists $self->{version}) {
                # at least one request was served already: just end quietly
                last;
            } else {
                $self->err(408, "request timeout");
            }
        }

        $self->{h} = {};

        $fh->timeout($::RES_TIMEOUT);
        my $ip = $self->{remote_addr};

        if ($blocked{$ip}) {
            $self->err_blocked($blocked{$ip})
                if $blocked{$ip} > $::NOW;

            delete $blocked{$ip};
        }

        # count the keys explicitly: a hash in scalar context is not the
        # number of entries on older perls
        if (scalar(keys %{$conn{$ip}}) > $::MAX_CONN_IP) {
            $self->slog(2, "blocked ip $ip");
            $self->err_blocked;
        }

        # /g leaves pos() after the request line for the \G matches below
        $req =~ /^(?:\015\012)?
                 (GET|HEAD) \040+
                 ([^\040]+) \040+
                 HTTP\/([0-9]+\.[0-9]+)
                 \015\012/gx
            or $self->err(405, "method not allowed", { Allow => "GET,HEAD" });

        $self->{method} = $1;
        $self->{uri} = $2;
        $self->{version} = $3;

        # 505 is "HTTP Version Not Supported"
        $self->{version} =~ /^1\./
            or $self->err(505, "http protocol version $self->{version} not supported");

        # parse headers
        {
            my (%hdr, $h, $v);

            # Optional whitespace after the colon and at the start of a
            # continuation line is tab (\011) or space (\040).  Repeated
            # headers are joined with commas.
            $hdr{lc $1} .= ",$2"
                while $req =~ /\G
                      ([^:\000-\040]+):
                      [\011\040]*
                      ((?: [^\015\012]+ | \015\012[\011\040] )*)
                      \015\012
                   /gxc;

            $req =~ /\G\015\012$/
                or $self->err(400, "bad request");

            # strip the leading comma added by the join above
            $self->{h}{$h} = substr $v, 1
                while ($h, $v) = each %hdr;
        }

        $self->{server_port} = $self->{h}{host} =~ s/:([0-9]+)$// ? $1 : 80;

        weaken ($uri{$self->{remote_addr}}{$self->{uri}}{$self*1} = $self);

        eval {
            $self->map_uri;
            $self->respond;
        };

        die if $@ && !ref $@;

        $self->eoconn;

        last if $self->{h}{connection} =~ /close/ || $self->{version} lt "1.1";

        $self->slog(9, "persistent connection [".$self->{h}{"user-agent"}."][$self->{reqs}]");
        $fh->timeout($::PER_TIMEOUT);
    }
}
291
292 # uri => path mapping
# Translate the request's Host header and URI into a filesystem path.
#
# Sets $self->{name} (the normalised URI) and $self->{path}
# ("$::DOCROOT/<host><uri>", with "default" used when no host was sent),
# then runs the access check.  Requests that could leave the document root
# are refused with 400 via err().
sub map_uri {
    my $self = shift;
    my $host = $self->{h}{host} || "default";
    my $uri = $self->{uri};

    # The host name is client-supplied and becomes a directory name, so it
    # must be a single, ordinary path component.
    if ($host =~ m{[/\000]} || $host =~ /^\.\.?$/) {
        $self->err(400, "bad request");
    }

    # some massaging, also makes it more secure
    $uri =~ s/%([0-9a-fA-F][0-9a-fA-F])/chr hex $1/ge;

    # a decoded NUL would truncate the path at the system call level, and a
    # URI without a leading slash would be glued onto the host directory name
    if ($uri =~ /\000/ || $uri !~ m%^/%) {
        $self->err(400, "bad request");
    }

    $uri =~ s%//+%/%g;
    $uri =~ s%/\.(?=/|$)%%g;
    1 while $uri =~ s%/[^/]+/\.\.(?=/|$)%%;

    $uri =~ m%^/?\.\.(?=/|$)%
        and $self->err(400, "bad request");

    $self->{name} = $uri;

    # now do the path mapping
    $self->{path} = "$::DOCROOT/$host$uri";

    $self->access_check;
}
314
# Return the local end of the connection as (dotted-quad address, port).
# Reports a 500 error via err() if the socket name yields nothing.
sub server_address {
    my ($self) = @_;

    my @sockaddr = unpack_sockaddr_in($self->{fh}->getsockname);
    @sockaddr
        or $self->err(500, "unable to get socket name");

    my ($port, $iaddr) = @sockaddr;
    return (inet_ntoa($iaddr), $port);
}
321
# Return the host the client addressed: the Host header if one was sent,
# otherwise the local address of the socket.
sub server_host {
    my ($self) = @_;

    return exists $self->{h}{host}
        ? $self->{h}{host}
        : ($self->server_address)[0];
}
330
# Return "host" or "host:port" for use in absolute URLs; the port is left
# out when it is 80.  Host and port come from the request's Host header when
# present, otherwise from the socket's local address.
sub server_hostport {
    my ($self) = @_;

    my ($host, $port) = exists $self->{h}{host}
        ? ($self->{h}{host}, $self->{server_port})
        : $self->server_address;

    return $host . ($port == 80 ? "" : ":$port");
}
342
# Run the program at $path as a CGI-style child process whose standard
# output is the client socket.
#
# The child changes into $::DOCROOT, sets a few environment variables and
# execs $path; it exits if that is not possible.  The parent returns right
# after forking.  A failed fork is reported to the client as a 500 error.
sub _cgi {
    my $self = shift;
    my $path = shift;

    # no two-way xxx supported
    my $pid = fork;

    # fork returns undef on failure; comparing that to 0 would make the
    # parent run the child branch
    defined $pid
        or $self->err(500, "unable to fork");

    if ($pid == 0) {
        open STDOUT, ">&".fileno($self->{fh});
        if (chdir $::DOCROOT) {
            $ENV{SERVER_SOFTWARE} = "thttpd-myhttpd"; # we are thttpd-alike
            $ENV{HTTP_HOST} = $self->server_host;
            # the port parsed from the Host header is kept in server_port
            $ENV{HTTP_PORT} = $self->{server_port};
            $ENV{SCRIPT_NAME} = $self->{name};
            exec $path;
        }
        Coro::State::_exit(0);
    }
}
362
# Decide how to answer the request for $self->{path} and send the response.
#
#  - missing or unreadable paths, and paths that are neither a directory nor
#    a plain file: 404
#  - readable directory without trailing slash: 301 to the same URI plus "/"
#  - readable directory: 304 if not modified since the If-Modified-Since
#    time; for GET, its index.html if readable, otherwise a generated index
#  - readable plain file: 403 if executable, otherwise the file itself
#
# The stat result is stored in $self->{stat}.  The file tests below and the
# file handler rely on perl's cached stat buffer ("_"), so the order of the
# tests matters.
sub respond {
    my $self = shift;
    my $path = $self->{path};

    unless (stat $path) {
        $self->err(404, "not found");
    }

    $self->{stat} = [stat _];

    # idiotic netscape sends idiotic headers AGAIN
    my $ims = 0;
    if ($self->{h}{"if-modified-since"} =~ /^([^;]+)/) {
        $ims = str2time($1);
    }

    if (-d _ && -r _) {
        # directory
        unless ($path =~ /\/$/) {
            # create a redirect to get the trailing "/"
            my $host = $self->server_hostport;
            $self->err(301, "moved permanently", { Location => "http://$host$self->{uri}/" });
        }

        # err() does not return, so the path ends in "/" from here on
        unless ($ims < $self->{stat}[9]) {
            $self->err(304, "not modified");
        }

        return unless $self->{method} eq "GET";

        if (-r "$path/index.html") {
            $self->{path} .= "/index.html";
            $self->handle_file;
        } else {
            $self->handle_dir;
        }
        return;
    }

    if (-f _ && -r _) {
        $self->err(403, "forbidden") if -x _;
        $self->handle_file;
        return;
    }

    $self->err(404, "not found");
}
402
# Send the generated directory index as a text/html 200 response.
sub handle_dir {
    my ($self) = @_;

    my $idx = $self->diridx;
    my %hdr = (
        "Content-Type"   => "text/html",
        "Content-Length" => length $idx,
    );

    $self->response(200, "ok", \%hdr, $idx);
}
414
# Send the file at $self->{path}, honouring a "Range: bytes=..." header.
#
# Relies on perl's cached stat buffer ("_") still describing the file, i.e.
# the caller must have stat'ed or file-tested it last.
#
# Range handling:
#   - the first satisfiable range in the header is used (206 partial content)
#   - a syntactically invalid range makes the whole header be ignored (200)
#   - if no range is satisfiable, 416 is sent
#   - with $::NO_SEGMENTED set, a range not starting at 0 is refused while
#     another connection from the same address is registered for the same URI
#
# Headers are sent for every method; the body only for GET.  Bytes written
# are added to $::written and $self->{written}.
sub handle_file {
    my $self = shift;
    my $length = -s _;
    my $hdr = {
        "Last-Modified" => time2str((stat _)[9]),
    };

    my @code = (200, "ok");

    # first and last byte to send; the whole file unless a range applies
    my ($l, $h) = (0, $length - 1);

    if ($self->{h}{range} =~ /^bytes=(.*)$/) {
        my ($satisfiable, $malformed);

        for (split /,/, $1) {
            if (/^-(\d+)$/) {
                # suffix range: the last N bytes, or the whole file if it is
                # shorter than N
                ($l, $h) = ($1 < $length ? $length - $1 : 0, $length - 1);
            } elsif (/^(\d+)-(\d*)$/) {
                # an open or too large end is clamped to the last byte
                ($l, $h) = ($1 + 0, ($2 ne "" && $2 < $length) ? $2 + 0 : $length - 1);
            } else {
                $malformed = 1;
                last;
            }

            # >= so that single-byte ranges such as "0-0" are accepted
            if ($l < $length && $h >= $l) {
                $satisfiable = 1;
                last;
            }
        }

        if ($malformed) {
            # ignore the header altogether
            ($l, $h) = (0, $length - 1);
        } elsif (!$satisfiable) {
            $hdr->{"Content-Range"} = "bytes */$length";
            # the body of this response is empty
            $hdr->{"Content-Length"} = 0;
            $self->slog(9, "not satisfiable($self->{h}{range}|".$self->{h}{"user-agent"}.")");
            $self->err(416, "not satisfiable", $hdr, "");
        } else {
            # check for segmented downloads
            if ($l && $::NO_SEGMENTED) {
                if (scalar(keys %{$uri{$self->{remote_addr}}{$self->{uri}}}) > 1) {
                    Coro::Event::do_timer(after => 15);

                    $self->err(400, "segmented downloads are not allowed");
                }
            }

            $hdr->{"Content-Range"} = "bytes $l-$h/$length";
            @code = (206, "partial content");
            $length = $h - $l + 1;
        }
    }

    # take the extension from this match only; a failed match must not pick
    # up a capture left over from an earlier regex
    my ($ext) = $self->{path} =~ /\.([^.\/]+)$/;
    $hdr->{"Content-Type"} = (defined $ext && $mimetype{lc $ext}) || "application/octet-stream";
    $hdr->{"Content-Length"} = $length;

    $self->response(@code, $hdr, "");

    if ($self->{method} eq "GET") {
        my ($buf, $r);
        my $current = $Coro::current;
        open my $fh, "<", $self->{path}
            or die "$self->{path}: late open failure ($!)";

        # number of bytes still to be sent
        my $left = $h - $l + 1;

        while ($left > 0) {
            # start the read, then sleep until the callback wakes us up
            aio_read($fh, $l, ($left > $::BUFSIZE ? $::BUFSIZE : $left),
                     $buf, 0, sub {
                         $r = $_[0];
                         $current->ready;
                     });
            Coro::schedule();

            # stop on end of file and on read errors
            last unless $r > 0;

            my $w = $self->{fh}->syswrite($buf)
                or last;
            $::written += $w;
            $self->{written} += $w;
            $l += $r;
            # without this the loop would run on to the end of the file,
            # sending more than the announced Content-Length
            $left -= $r;
        }

        close $fh;
    }
}
504
505 1;