ViewVC Help
View File | Revision Log | Show Annotations | Download File
/cvs/Coro/myhttpd/httpd.pl
Revision: 1.85
Committed: Mon Feb 18 17:48:00 2008 UTC (16 years, 4 months ago) by root
Content type: text/plain
Branch: MAIN
CVS Tags: rel-4_741, rel-4_742, rel-4_74, rel-4_71, rel-4_72, rel-4_73, rel-4_50, rel-4_51, rel-4_45, rel-4_49, rel-4_48, rel-4_47, rel-4_46, rel-4_7
Changes since 1.84: +3 -0 lines
Log Message:
*** empty log message ***

File Contents

# Content
1 use Coro;
2 use Coro::Semaphore;
3 use Coro::EV;
4 use Coro::Socket;
5 use Coro::Signal;
6 use Coro::AIO ();
7
8 use HTTP::Date;
9 use POSIX ();
10
11 use Compress::Zlib ();
12
13 no utf8;
14 use bytes;
15
16 # at least on my machine, this thingy serves files
17 # quite a bit faster than apache, ;)
18 # and quite a bit slower than thttpd :(
19
# Ignore SIGPIPE so that writing to a connection the peer already closed
# makes the write fail instead of terminating the process.
$SIG{PIPE} = 'IGNORE';

# Log file handles; each stays undefined unless its path is configured.
our $accesslog;
our $errorlog;

# Cached current time (epoch seconds and HTTP date string), refreshed by
# the $update_time watcher below.
our $NOW;
our $HTTP_NOW;

# Log file paths. They are tested right after being declared here, so they
# are presumably set by configuration loaded before this file - TODO confirm.
our $ERROR_LOG;
our $ACCESS_LOG;

# Periodic watcher with an interval of 1 that refreshes the cached time.
our $update_time = EV::periodic 0, 1, undef, sub {
    $NOW      = time;
    $HTTP_NOW = time2str $NOW;
};
$update_time->invoke;    # fill in $NOW/$HTTP_NOW right away

use IO::Handle;

# Open the logs in append mode. The three-argument form of open keeps the
# configured path from ever being interpreted as part of the open mode.
if ($ERROR_LOG) {
    open $errorlog, ">>", $ERROR_LOG
        or die "$ERROR_LOG: $!";
    $errorlog->autoflush (1);
}

if ($ACCESS_LOG) {
    open $accesslog, ">>", $ACCESS_LOG
        or die "$ACCESS_LOG: $!";
    $accesslog->autoflush (1);
}
50
# Write a timestamped message to the currently selected output handle and,
# when the error log is open, to the error log as well.
#
#   $level  - severity; accepted but not used here
#   $format - printf-style format string
#   @args   - values for the format string
sub slog {
    my ($level, $format, @args) = @_;

    my $stamp = POSIX::strftime "%Y-%m-%d %H:%M:%S", gmtime $::NOW;
    my $line  = "$stamp: $format\n";

    printf ($line, @args);
    printf {$errorlog} $line, @args if $errorlog;
}
58
# Semaphore counting free connection slots ($MAX_CONNECTS, default 250).
our $connections = Coro::Semaphore->new ($MAX_CONNECTS || 250);
# Signal that is broadcast whenever a request or connection finishes.
our $httpevent = Coro::Signal->new;

# Transfer queues: one for regular files, one (size 10) for index files.
our $queue_file  = transferqueue->new ($MAX_TRANSFERS);
our $queue_index = transferqueue->new (10);

# Top-level rate limiter ($TBF_RATE, default 100000).
our $tbf_top = tbf->new (rate => $TBF_RATE || 100000);

# Bookkeeping for unused_bandwidth.
my $unused_bytes = 0;
my $unused_last  = time;
69
# Account for $_[0] bytes of bandwidth that went unused. Once more than 30
# seconds have passed since the last reset and the average exceeds 50000
# bytes per second, reset the counters and force the next queued file
# transfer to start.
sub unused_bandwidth {
    $unused_bytes += $_[0];

    if ($unused_last < $NOW - 30
        && $unused_bytes / ($NOW - $unused_last) > 50000
    ) {
        ($unused_last, $unused_bytes) = ($NOW, 0);
        $queue_file->force_wake_next;
        slog (1, "forced filetransfer due to unused bandwidth");
    }
}
79
# Accepted connections ([socket, peername] pairs) waiting for a handler.
my @newcons;
# Handler coroutines that are idle and can be woken for a new connection.
my @pool;

# Body of one worker coroutine: serve queued connections; when none are
# queued, park in @pool until woken, or exit if the pool already holds
# $MAX_POOL idle workers.
sub handler {
    while (1) {
        unless (@newcons) {
            last if @pool >= $MAX_POOL;
            push @pool, $Coro::current;
            schedule;
            next;
        }

        eval {
            conn->new (@{ pop @newcons })->handle;
        };
        # object exceptions are already-answered errors; only log strings
        slog (1, "$@") if $@ && !ref $@;

        $httpevent->broadcast; # only for testing, but doesn't matter much

        # give the connection slot back to the accept loop
        $connections->up;
    }
}
102
# Start accepting connections on the given listening socket.
#
# Remembers the socket in @listen_sockets and starts a coroutine that
# takes a connection slot, accepts a client, queues it in @newcons and
# then wakes an idle handler or starts a new one.
sub listen_on {
    my ($listen) = @_;

    push @listen_sockets, $listen;

    # the accept loop
    async {
        slog (1, "accepting connections");

        while (1) {
            $connections->down;
            push @newcons, [$listen->accept];

            if (@pool) {
                my $idle = pop @pool;
                $idle->ready;
            } else {
                async \&handler;
            }
        }
    };
}
123
# Primary listening socket.
my $http_port = Coro::Socket->new (
    LocalAddr => $SERVER_HOST,
    LocalPort => $SERVER_PORT,
    ReuseAddr => 1,
    Listen    => 50,
) or die "unable to start server";

listen_on ($http_port);

# Optional second port on the same address.
if ($SERVER_PORT2) {
    my $second_port = Coro::Socket->new (
        LocalAddr => $SERVER_HOST,
        LocalPort => $SERVER_PORT2,
        ReuseAddr => 1,
        Listen    => 50,
    ) or die "unable to start server";

    listen_on ($second_port);
}
143
144 package conn;
145
146 use strict;
147 use bytes;
148
149 use Socket;
150 use HTTP::Date;
151 use Convert::Scalar 'weaken';
152 use IO::AIO;
153
IO::AIO::min_parallel ($::AIO_PARALLEL);

# Run IO::AIO's poll callback whenever its poll descriptor is readable.
our $AIO_WATCHER = EV::io (IO::AIO::poll_fileno (), EV::READ (), \&IO::AIO::poll_cb);

our %conn;     # $conn{ip}{self} => connobj
our %uri;      # $uri{ip}{uri}{self}
our %blocked;  # $blocked{id} = [blocked-until time, reason]
our %mimetype; # lowercased file extension => mime type
162
# Load the extension => mime type table from the file "mime_types" in the
# current directory into %mimetype. Only lines of the form
# "<ext><tabs><type>" whose first character is not "#" are used; keys are
# lowercased. Prints a notice if the file cannot be opened.
sub read_mimetypes {
    if (open my $types, "<", "mime_types") {
        while (my $line = <$types>) {
            next unless $line =~ /^([^#]\S+)\t+(\S+)$/;
            $mimetype{lc $1} = $2;
        }
    } else {
        print "cannot open mime_types\n";
    }
}

read_mimetypes ();
176
# Create the connection object for an accepted client.
#
#   $fh       - the client socket
#   $peername - packed peer address as returned by accept
#
# Records the peer's dotted-quad address as both remote_addr and the
# initial remote_id, stores the creation time, attaches a weak reference
# to the object to the current coroutine and updates the global
# connection counters.
sub new {
    my ($class, $fh, $peername) = @_;
    my $self = bless { fh => $fh }, $class;

    my (undef, $iaddr) = unpack_sockaddr_in $peername
        or $self->err (500, "unable to decode peername");

    my $addr = inet_ntoa $iaddr;
    $self->{remote_id}   = $addr;
    $self->{remote_addr} = $addr;

    $self->{time} = $::NOW;

    weaken ($Coro::current->{conn} = $self);

    ++$::conns;
    $::maxconns = $::conns if $::conns > $::maxconns;

    $self
}
197
# Destructor: one connection less is alive.
sub DESTROY {
    --$::conns;
}
203
# Recursively delete empty nested hashes from the hash referenced by
# $_[0]. Values that are not plain hash references are left untouched.
sub prune_cache {
    my ($cache) = @_;

    for my $key (keys %$cache) {
        my $entry = $cache->{$key};
        next unless ref ($entry) eq "HASH";

        prune_cache ($entry);
        delete $cache->{$key}
            unless scalar keys %$entry;
    }
}
216
# Housekeeping: drop empty sub-hashes from %conn and %uri and forget
# block entries whose expiry time is no longer in the future.
sub prune_caches {
    prune_cache (\%conn);
    prune_cache (\%uri);

    for my $id (keys %blocked) {
        next if $blocked{$id}[0] > $::NOW;
        delete $blocked{$id};
    }
}

# Timer that runs the housekeeping (first after 60, repeating every 60).
our $PRUNE_WATCHER = EV::timer 60, 60, \&prune_caches;
227
# Log a message through main::slog, prefixed with this connection's
# remote id.
#
#   $level   - severity passed through to main::slog
#   $message - format string passed through after the prefix
sub slog {
    my ($self, $level, $message) = @_;

    main::slog ($level, "$self->{remote_id}> $message");
}
232
# Send a complete HTTP response (status line, headers and optional body)
# to the client and write an access log line.
#
#   $code, $msg - status code and reason phrase
#   $hdr        - hash ref of response headers; modified in place
#                 (Connection, Content-Encoding and Content-Length may
#                 be set or replaced)
#   $content    - response body, or undef; never sent for HEAD requests
#
# Side effects: may set $self->{h}{connection} to "close", which ends the
# keep-alive loop in handle; adds the number of bytes sent to
# $self->{written}.
sub response {
    my ($self, $code, $msg, $hdr, $content) = @_;
    my $res = "HTTP/1.1 $code $msg\015\012";
    my $GZ  = "";

    # decide whether the connection persists after this response
    if (exists $hdr->{Connection}) {
        if ($hdr->{Connection} =~ /close/) {
            $self->{h}{connection} = "close";
        }
    } else {
        if ($self->{version} < 1.1) {
            # before HTTP/1.1 persistence has to be requested explicitly
            if ($self->{h}{connection} =~ /keep-alive/i) {
                $hdr->{Connection} = "Keep-Alive";
            } else {
                $self->{h}{connection} = "close";
            }
        }
    }

    # gzip in-memory bodies over 400 bytes if the client accepts it; the
    # Content-Length comparison makes sure $content is the whole body
    if ($self->{method} ne "HEAD"
        && $self->{h}{"accept-encoding"} =~ /\bgzip\b/
        && 400 < length $content
        && $hdr->{"Content-Length"} == length $content
        && !exists $hdr->{"Content-Encoding"}
    ) {
        my $orig = length $content;
        $hdr->{"Content-Encoding"} = "gzip";
        $content = Compress::Zlib::memGzip (\$content);
        $hdr->{"Content-Length"} = length $content;
        # log suffix: percentage saved by compression
        $GZ = sprintf "GZ%02d", 100 - 100*((length $content) / $orig);
    }

    $res .= "Date: $HTTP_NOW\015\012";
    $res .= "Server: $::NAME\015\012";

    while (my ($h, $v) = each %$hdr) {
        $res .= "$h: $v\015\012"
    }
    $res .= "\015\012";

    $res .= $content if defined $content and $self->{method} ne "HEAD";

    my $log = (POSIX::strftime "%Y-%m-%d %H:%M:%S", gmtime $::NOW).
              " $self->{remote_id} \"$self->{uri}\" $code ".$hdr->{"Content-Length"}.$GZ.
              " \"$self->{h}{referer}\"\n";

    print $::accesslog $log if $::accesslog;
    print STDERR $log;

    $tbf_top->request (length $res, 1e6);

    # print only reports success or failure, so count the bytes ourselves
    $self->{written} += length $res
        if print {$self->{fh}} $res;
}
285
# Send an error response and abort the current request by throwing an
# object blessed into "err".
#
#   $code, $msg - status code and reason phrase
#   $hdr        - optional hash ref of extra headers
#   $content    - optional body; when undefined a plain-text body
#                 "$code $msg\n" with matching headers is generated
#
# The response always carries "Connection: close". Never returns.
sub err {
    my ($self, $code, $msg, $hdr, $content) = @_;

    if (!defined $content) {
        $content = "$code $msg\n";
        $hdr->{"Content-Type"}   = "text/plain";
        $hdr->{"Content-Length"} = length $content;
    }

    $hdr->{"Connection"} = "close";

    $self->response ($code, $msg, $hdr, $content);

    die bless {}, "err";
}
301
# Serve requests on this connection until it is closed.
#
# For every request: read the header block, parse the request line and
# the headers, derive the client id, refuse blocked clients, determine
# the server name and port, then map the URI and respond. The loop ends
# when reading a follow-up request fails or when the connection is marked
# "close". Errors already answered (object exceptions thrown by err) are
# swallowed; string exceptions are rethrown to the caller.
sub handle {
    my $self = shift;
    my $fh   = $self->{fh};

    my $host;

    $fh->timeout ($::REQ_TIMEOUT);
    while () {
        $self->{reqs}++;

        # read request and parse first line
        my $req = $fh->readline ("\015\012\015\012");

        unless (defined $req) {
            if (exists $self->{version}) {
                # a request was already served on this connection:
                # just end the keep-alive loop
                last;
            } else {
                $self->err (408, "request timeout");
            }
        }

        $self->{h} = {};

        $fh->timeout ($::RES_TIMEOUT);

        # /g leaves the match position after the request line so the
        # header parser below can continue from there with \G
        $req =~ /^(?:\015\012)?
                  (GET|HEAD) \040+
                  ([^\040]+) \040+
                  HTTP\/([0-9]+\.[0-9]+)
                  \015\012/gx
            or $self->err (405, "method not allowed", { Allow => "GET,HEAD" });

        $self->{method}  = $1;
        $self->{uri}     = $2;
        $self->{version} = $3;

        # 505 is "HTTP Version Not Supported"
        $self->{version} =~ /^1\./
            or $self->err (505, "http protocol version $self->{version} not supported");

        # parse headers
        {
            my (%hdr, $h, $v);

            # repeated headers are joined with ","; continuation lines
            # stay part of the value
            $hdr{lc $1} .= ",$2"
                while $req =~ /\G
                    ([^:\000-\040]+):
                    [\011\040]*
                    ((?: [^\015\012]+ | \015\012[\011\040] )*)
                    \015\012
                /gxc;

            # only the terminating empty line may be left
            $req =~ /\G\015\012$/
                or $self->err (400, "bad request");

            # strip the leading "," added by the accumulation above
            $self->{h}{$h} = substr $v, 1
                while ($h, $v) = each %hdr;
        }

        # remote id should be unique per user
        my $id = $self->{remote_addr};

        if (exists $self->{h}{"client-ip"}) {
            $id .= "[".$self->{h}{"client-ip"}."]";
        } elsif (exists $self->{h}{"x-forwarded-for"}) {
            $id .= "[".$self->{h}{"x-forwarded-for"}."]";
        }

        $self->{remote_id} = $id;

        # register this connection under its id; "local" removes the entry
        # again when this loop iteration is left, and the reference is weak
        # so the registry does not keep the object alive
        weaken (local $conn{$id}{$self*1} = $self);

        if ($blocked{$id}) {
            $self->err_blocked
                if $blocked{$id}[0] > $::NOW;

            # the block has expired
            delete $blocked{$id};
        }

        # find out server name and port
        if ($self->{uri} =~ s/^http:\/\/([^\/?#]*)//i) {
            $host = $1;
        } else {
            $host = $self->{h}{host};
        }

        if (defined $host) {
            $self->{server_port} = $host =~ s/:([0-9]+)$// ? $1 : 80;
        } else {
            # no host given: fall back to the local socket address
            ($self->{server_port}, $host)
                = unpack_sockaddr_in $self->{fh}->sockname
                or $self->err (500, "unable to get socket name");
            $host = inet_ntoa $host;
        }

        $self->{server_name} = $host;

        # same registration scheme as %conn, keyed by id and uri
        weaken (local $uri{$id}{$self->{uri}}{$self*1} = $self);

        eval {
            $self->map_uri;
            $self->respond;
        };

        # rethrow anything that is not an exception object
        die if $@ && !ref $@;

        last if $self->{h}{connection} =~ /close/i;

        $httpevent->broadcast;

        $fh->timeout ($::PER_TIMEOUT);
    }
}
414
# Block this connection's remote id and answer with the "blocked" error.
#
#   $duration - how long the block lasts, added to the current time
#   $reason   - stored together with the expiry time
sub block {
    my ($self, $duration, $reason) = @_;
    my $id = $self->{remote_id};

    $blocked{$id} = [$::NOW + $duration, $reason];
    $self->slog (2, "blocked ip $id");
    $self->err_blocked;
}
422
423 # uri => path mapping
# Translate the request URI into a filesystem path below
# "$::DOCROOT/<server name>" and run the access check.
#
# Sets $self->{name} (decoded, normalised URI) and $self->{path}.
# Answers 400 (via err, which does not return) for host names or URIs
# that could lead outside the per-host document directory.
sub map_uri {
    my $self = shift;
    my $host = $self->{server_name};
    my $uri  = $self->{uri};

    # the host name becomes a path component, so it must not contain a
    # path separator or NUL and must not be "." or ".." ("Host: .."
    # would otherwise map to the parent of the document root)
    $host =~ /[\/\\\000]/ || $host =~ /^\.\.?$/
        and $self->err (400, "bad request");

    # some massaging, also makes it more secure
    $uri =~ s/%([0-9a-fA-F][0-9a-fA-F])/chr hex $1/ge; # decode %XX
    $uri =~ /\000/                                     # no NUL in paths
        and $self->err (400, "bad request");
    $uri =~ s%//+%/%g;                                 # collapse slashes
    $uri =~ s%/\.(?=/|$)%%g;                           # drop "/." segments
    1 while $uri =~ s%/[^/]+/\.\.(?=/|$)%%;            # resolve "x/.."

    # whatever ".." is left at the front would leave the directory
    $uri =~ m%^/?\.\.(?=/|$)%
        and $self->err (400, "bad request");

    $self->{name} = $uri;

    # now do the path mapping
    $self->{path} = "$::DOCROOT/$host$uri";

    $self->access_check;
}
448
# Run the program at $path as a one-way CGI: a forked child gets the
# client socket as its standard output and execs the program from within
# $::DOCROOT.
#
# The parent always leaves via an exception: a 500 error response if the
# fork fails, otherwise a plain die once the child has been started.
sub _cgi {
    my ($self, $path) = @_;

    # fork returns undef on failure; comparing that to 0 directly would
    # send the server process itself down the child branch
    my $pid = fork;
    defined $pid
        or $self->err (500, "unable to fork");

    # no two-way xxx supported
    if ($pid == 0) {
        open STDOUT, ">&".fileno ($self->{fh});
        if (chdir $::DOCROOT) {
            $ENV{SERVER_SOFTWARE} = "thttpd-myhttpd"; # we are thttpd-alike
            $ENV{HTTP_HOST}       = $self->{server_name};
            $ENV{HTTP_PORT}       = $self->{server_port};
            $ENV{SCRIPT_NAME}     = $self->{name};
            exec $path;
        }
        # only reached when chdir or exec failed
        Coro::State::_exit (0);
    } else {
        die;
    }
}
469
# Return the server name, followed by ":port" unless the port is 80.
sub server_hostport {
    my ($self) = @_;

    return $self->{server_name}
        if $self->{server_port} == 80;

    "$self->{server_name}:$self->{server_port}"
}
475
# Produce the response for the already mapped request.
#
# Names below /internal/ are dispatched to the handlers in %::internal.
# Anything else is looked up on disk: readable directories get a redirect
# (missing trailing slash), their index.html or a generated listing;
# readable, non-executable regular files are transferred, subject to the
# per-client transfer limit. Everything else is answered with an error.
sub respond {
    my $self = shift;
    my $path = $self->{path};

    if ($self->{name} =~ s%^/internal/([^/]+)%%) {
        my $internal = $::internal{$1};

        if ($internal) {
            $internal->($self);
        } else {
            $self->err (404, "not found");
        }
    } else {
        stat $path
            or $self->err (404, "not found");

        # keep a copy; the tests below use the "_" stat buffer
        $self->{stat} = [stat _];

        # idiotic netscape sends idiotic headers AGAIN
        my $ims = $self->{h}{"if-modified-since"} =~ /^([^;]+)/
                  ? str2time ($1)
                  : 0;

        if (-d _ && -r _) {
            # directory
            if ($path !~ /\/$/) {
                # create a redirect to get the trailing "/"
                # we don't try to avoid the :80
                my $location = "http://".$self->server_hostport."$self->{uri}/";
                $self->err (301, "moved permanently", { Location => $location });
            } else {
                $ims < $self->{stat}[9]
                    or $self->err (304, "not modified");

                if (-r "$path/index.html") {
                    # replace directory "size" by index.html filesize
                    $self->{stat} = [stat ($self->{path} .= "/index.html")];
                    $self->handle_file ($queue_index, $tbf_top);
                } else {
                    $self->handle_dir;
                }
            }
        } elsif (-f _ && -r _) {
            -x _ and $self->err (403, "forbidden");

            # too many connections from this client: wait for one of them
            # to finish, and block the client once the deadline passes
            my $timeout = $::NOW + 10;
            while (keys %{$conn{$self->{remote_id}}} > $::MAX_TRANSFERS_IP) {
                if ($timeout < $::NOW) {
                    $self->block ($::BLOCKTIME, "too many connections");
                } else {
                    $httpevent->wait;
                }
            }

            $self->handle_file ($queue_file, $tbf_top);
        } else {
            $self->err (404, "not found");
        }
    }
}
535
# Answer a directory request with the listing produced by diridx, sent as
# UTF-8 HTML with the directory's modification time as Last-Modified.
sub handle_dir {
    my ($self) = @_;
    my $listing = $self->diridx;

    my %headers = (
        "Content-Type"   => "text/html; charset=utf-8",
        "Content-Length" => length $listing,
        "Last-Modified"  => time2str ($self->{stat}[9]),
    );

    $self->response (200, "ok", \%headers, $listing);
}
548
# Send the file at $self->{path}, honouring a single byte range.
#
#   $queue - transfer queue used to schedule this transfer
#   $tbf   - rate limiter asked before every chunk is written
#
# Range handling: the first satisfiable range of a "bytes=" Range header
# is served with 206; a header containing a malformed range is ignored
# and the whole file is sent; a header with no satisfiable range is
# answered with 416. For GET requests the body is then copied to the
# client in chunks. Size and modification time come from $self->{stat}.
sub handle_file {
    my ($self, $queue, $tbf) = @_;
    my $length = $self->{stat}[7];
    my $hdr = {
        # use the saved stat result: the global "_" stat buffer may have
        # been overwritten by another coroutine while this one waited
        "Last-Modified" => time2str ($self->{stat}[9]),
        "Accept-Ranges" => "bytes",
    };

    my @code = (200, "ok");
    my ($offset, $last) = (0, $length - 1);   # first and last byte to send

    if ($self->{h}{range} =~ /^bytes=(.*)$/) {
        my ($range, $malformed);

        for my $spec (split /,/, $1) {
            my ($from, $to);

            if ($spec =~ /^-(\d+)$/) {
                # suffix range: the last N bytes, at most the whole file
                my $suffix = $1 > $length ? $length : $1 + 0;
                ($from, $to) = ($length - $suffix, $length - 1);
            } elsif ($spec =~ /^(\d+)-(\d*)$/) {
                # a missing end, or one beyond the file, means "to the end"
                ($from, $to) = ($1 + 0, ($2 ne "" && $2 < $length) ? $2 + 0 : $length - 1);
            } else {
                $malformed = 1;
                last;
            }

            if ($from >= 0 && $from < $length && $to >= 0 && $to >= $from) {
                $range = [$from, $to];
                last;
            }
        }

        if ($malformed) {
            # ignore the header and send the whole file
        } elsif ($range) {
            ($offset, $last) = @$range;

            # check for segmented downloads
            if ($offset && $::NO_SEGMENTED) {
                my $timeout = $::NOW + 15;
                while (keys %{$uri{$self->{remote_id}}{$self->{uri}}} > 1) {
                    if ($timeout <= $::NOW) {
                        $self->block ($::BLOCKTIME, "segmented downloads are forbidden");
                        #$self->err_segmented_download;
                    } else {
                        $httpevent->wait;
                    }
                }
            }

            $hdr->{"Content-Range"} = "bytes $offset-$last/$length";
            @code = (206, "partial content");
            $length = $last - $offset + 1;
        } else {
            $hdr->{"Content-Range"}  = "bytes */$length";
            $hdr->{"Content-Length"} = 0;   # the error reply has no body
            $self->err (416, "not satisfiable", $hdr, "");
        }
    }

    $self->{path} =~ /\.([^.]+)$/;
    $hdr->{"Content-Type"}   = $mimetype{lc $1} || "application/octet-stream";
    $hdr->{"Content-Length"} = $length;

    $self->response (@code, $hdr, "");

    if ($self->{method} eq "GET") {
        $self->{time}    = $::NOW;
        $self->{written} = 0;

        open my $fh, "<", $self->{path}
            or die "$self->{path}: late open failure ($!)";

        my $remaining = $last - $offset + 1;   # bytes still to be sent

        my $transfer = $queue->start_transfer ($remaining);
        my $locked;
        my $bufsize = $::WAIT_BUFSIZE; # initial buffer size

        while ($remaining > 0) {
            # until the queue grants the transfer, keep using the small
            # buffer; afterwards switch to the full one and restart the
            # per-connection statistics
            unless ($locked) {
                if ($locked ||= $transfer->try ($::WAIT_INTERVAL)) {
                    $bufsize = $::BUFSIZE;
                    $self->{time}    = $::NOW;
                    $self->{written} = 0;
                }
            }

            # the client got blocked in the meantime: abort the transfer
            if ($blocked{$self->{remote_id}}) {
                $self->{h}{connection} = "close";
                die bless {}, "err";
            }

            my $want = $remaining > $bufsize ? $bufsize : $remaining;
            my $buf;
            my $got = Coro::AIO::aio_read ($fh, $offset, $want, $buf, 0);
            last unless $got > 0;   # end of file or read error

            $tbf->request (length $buf);
            my $w = syswrite $self->{fh}, $buf
                or last;

            $::written       += $w;
            $self->{written} += $w;
            $offset          += $w;
            # without this the loop would run on to the end of the file
            # even for a range that ends earlier
            $remaining       -= $w;
        }

        close $fh;
    }
}
646
647 1
648