ViewVC Help
View File | Revision Log | Show Annotations | Download File
/cvs/Coro/myhttpd/httpd.pl
Revision: 1.67
Committed: Sun May 19 21:00:47 2002 UTC (22 years, 1 month ago) by root
Content type: text/plain
Branch: MAIN
Changes since 1.66: +9 -5 lines
Log Message:
*** empty log message ***

File Contents

# Content
1 use Coro;
2 use Coro::Semaphore;
3 use Coro::Event;
4 use Coro::Socket;
5 use Coro::Signal;
6
7 use HTTP::Date;
8 use POSIX ();
9
10 use Compress::Zlib ();
11
12 no utf8;
13 use bytes;
14
15 # at least on my machine, this thingy serves files
16 # quite a bit faster than apache, ;)
17 # and quite a bit slower than thttpd :(
18
# Ignore SIGPIPE so that writing to a connection the peer already closed
# fails with an error instead of terminating the whole server process.
$SIG{PIPE} = 'IGNORE';

our $accesslog;   # append handle for the access log; stays undef when $ACCESS_LOG is unset
our $errorlog;    # append handle for the error log; stays undef when $ERROR_LOG is unset

our $NOW;         # cached epoch time, refreshed by the timer below
our $HTTP_NOW;    # $NOW formatted with HTTP::Date::time2str

# Refresh the cached clock on a one-second interval so request handling can
# read $NOW / $HTTP_NOW instead of calling time/time2str itself.
# NOTE(review): ->now presumably triggers the watcher once right away so both
# values are populated before the first request - confirm against Event docs.
Event->timer(interval => 1, hard => 1, cb => sub {
    $NOW      = time;
    $HTTP_NOW = time2str $NOW;
})->now;

# The log files are opened with three-argument open so that nothing in the
# configured path (leading '>', '|', '&', surrounding whitespace) can be
# interpreted as part of the open mode.
if ($ERROR_LOG) {
    use IO::Handle;
    open $errorlog, ">>", $ERROR_LOG
        or die "$ERROR_LOG: $!";
    $errorlog->autoflush(1);
}

if ($ACCESS_LOG) {
    use IO::Handle;
    open $accesslog, ">>", $ACCESS_LOG
        or die "$ACCESS_LOG: $!";
    $accesslog->autoflush(1);
}
45
# Write one timestamped log line.
#
#   $level  - severity given by the caller; accepted but not evaluated here
#   $format - printf-style format string
#   @args   - values for the directives in $format
#
# The line is printed to the currently selected output handle and, when the
# error log is open, to $errorlog as well. The timestamp is the cached
# $::NOW rendered in UTC.
sub slog {
    my ($level, $format, @args) = @_;

    my $stamp       = POSIX::strftime("%Y-%m-%d %H:%M:%S", gmtime $::NOW);
    my $line_format = "$stamp: $format\n";

    printf $line_format, @args;
    printf {$errorlog} $line_format, @args if $errorlog;
}
53
# Limits how many connections are in flight: the accept loop takes one unit
# before accepting, a handler gives it back when its connection is done.
our $connections = Coro::Semaphore->new($MAX_CONNECTS || 250);

# Broadcast after every finished request; coroutines waiting for a
# per-client limit to clear wake up on it and re-check their condition.
our $httpevent = Coro::Signal->new;

# Transfer queues handed to handle_file: one for regular files, one for
# index.html served in place of a directory.
our $queue_file  = transferqueue->new($MAX_TRANSFERS);
our $queue_index = transferqueue->new(10);

# Rate limiter consulted before response data is written.
our $tbf_top = tbf->new(rate => 200000);

my @newcons;   # accepted connections ([accept result]) not yet picked up by a handler
my @pool;      # handler coroutines that are idle and waiting to be readied
64
# one "execution thread"
#
# Body of a worker coroutine. While accepted connections are queued in
# @newcons it serves them one at a time; when the queue is empty it parks
# itself in @pool and yields, or terminates if the pool already holds
# $MAX_POOL idle workers.
sub handler {
    while () {
        if (@newcons) {
            eval {
                conn->new(@{pop @newcons})->handle;
            };
            # Blessed exceptions are the normal "response already sent"
            # signal and are not logged. Plain-string errors are logged, but
            # never as the printf format itself: the text can contain
            # request-derived data (e.g. a file path), and a stray '%' in it
            # would be interpreted as a conversion.
            slog(1, "%s", "$@") if $@ && !ref $@;

            $httpevent->broadcast; # only for testing, but doesn't matter much

            # this connection is done, let the accept loop take another one
            $connections->up;
        } else {
            last if @pool >= $MAX_POOL;
            push @pool, $Coro::current;
            schedule;
        }
    }
}
84
# Start accepting connections on the given listening socket.
#
#   $_[0] - listening socket object providing ->accept
#
# The socket is recorded in @listen_sockets and an accept coroutine is
# started for it. Returns whatever async returns for that coroutine.
sub listen_on {
    my ($socket) = @_;

    push @listen_sockets, $socket;

    # the "main thread"
    async {
        slog(1, "accepting connections");
        while () {
            # wait until the connection limit leaves room for one more
            $connections->down;
            push @newcons, [$socket->accept];
            #slog 3, "accepted @$connections ".scalar(@pool);

            # wake an idle worker if there is one, otherwise start a new one
            if (my $idle = pop @pool) {
                $idle->ready;
            } else {
                async \&handler;
            }
        }
    };
}
106
# Primary listening socket; the server cannot run without it.
my $http_port = Coro::Socket->new(
    LocalAddr => $SERVER_HOST,
    LocalPort => $SERVER_PORT,
    ReuseAddr => 1,
    Listen    => 50,
) or die "unable to start server";

listen_on($http_port);

# Optional second port on the same address.
if ($SERVER_PORT2) {
    my $second_port = Coro::Socket->new(
        LocalAddr => $SERVER_HOST,
        LocalPort => $SERVER_PORT2,
        ReuseAddr => 1,
        Listen    => 50,
    ) or die "unable to start server";

    listen_on($second_port);
}
126
127 package conn;
128
129 use Socket;
130 use HTTP::Date;
131 use Convert::Scalar 'weaken';
132 use Linux::AIO;
133
# NOTE(review): min_parallel presumably sets the minimum number of parallel
# AIO workers to the configured value - confirm against Linux::AIO docs.
Linux::AIO::min_parallel($::AIO_PARALLEL);

# Run Linux::AIO's completion callback whenever its poll descriptor
# becomes readable.
Event->io(
    fd    => Linux::AIO::poll_fileno(),
    poll  => 'r',
    async => 1,
    cb    => \&Linux::AIO::poll_cb,
);

our %conn;      # $conn{ip}{self} => connobj
our %uri;       # $uri{ip}{uri}{self}
our %blocked;   # $blocked{id} => [time the block expires, reason]
our %mimetype;  # lower-cased file extension => content type
144
# Load the extension => content-type table from the file "mime_types" in
# the current directory into %mimetype.
#
# A line is used when it consists of an extension (not starting with '#'),
# one or more tabs, and the content type; every other line is skipped.
# Extensions are stored lower-cased. If the file cannot be opened a notice
# is printed and the table is left as it is.
#
# Uses a lexical filehandle, three-argument open and a lexical line
# variable so that neither a global handle nor the caller's $_ is touched.
sub read_mimetypes {
    my $fh;
    unless (open $fh, "<", "mime_types") {
        print "cannot open mime_types\n";
        return;
    }

    while (my $line = <$fh>) {
        if ($line =~ /^([^#]\S+)\t+(\S+)$/) {
            $mimetype{lc $1} = $2;
        }
    }

    close $fh;
}

read_mimetypes();
159
# Construct a connection object for an accepted socket.
#
#   $class    - class to bless into
#   $fh       - the connected socket handle
#   $peername - packed sockaddr_in of the remote end
#
# Stores the peer's dotted-quad address as both remote_addr and remote_id,
# stamps the object with the cached time, publishes a weak reference to it
# in the current coroutine's {conn} slot and updates the global connection
# counters ($::conns, $::maxconns). Returns the new object.
sub new {
    my ($class, $fh, $peername) = @_;
    my $self = bless { fh => $fh }, $class;

    my (undef, $iaddr) = unpack_sockaddr_in($peername)
        or $self->err(500, "unable to decode peername");

    my $ip = inet_ntoa($iaddr);
    $self->{remote_id}   = $ip;
    $self->{remote_addr} = $ip;

    $self->{time} = $::NOW;

    # weak, so the coroutine's bookkeeping does not keep the object alive
    weaken($Coro::current->{conn} = $self);

    ++$::conns;
    $::maxconns = $::conns if $::conns > $::maxconns;

    return $self;
}
180
# Destructor: one connection fewer is alive.
sub DESTROY {
    --$::conns;
}
185
# Log a message on behalf of this connection, prefixed with its remote id.
#
#   $level   - severity, passed through to main::slog
#   $message - text to log; logged literally
#
# The remote id can contain client-supplied header text (Client-IP /
# X-Forwarded-For), so the combined text is handed to main::slog as the
# argument of a "%s" format and never as the printf format itself. This
# method never forwarded format arguments, so directives in $message had
# nothing to consume anyway.
sub slog {
    my ($self, $level, $message) = @_;

    main::slog($level, "%s", "$self->{remote_id}> $message");
}
190
# Send a response (status line, headers, optional body) and log it.
#
#   $code, $msg - status code and reason phrase
#   $hdr        - hash ref of response headers; may be modified here
#   $content    - body, or undef for none
#
# Decides connection persistence, gzips bodies longer than 400 bytes when
# the client accepts it and Content-Length matches the body, writes one
# access-log line (also to STDERR), asks $tbf_top for bandwidth, and prints
# the response to the client handle. The value returned by that print is
# added to $self->{written}. The body is omitted for HEAD requests.
sub response {
    my ($self, $code, $msg, $hdr, $content) = @_;

    # Connection handling: an explicit Connection header wins; otherwise
    # clients older than HTTP/1.1 only stay connected if they asked for it.
    if (exists $hdr->{Connection}) {
        $self->{h}{connection} = "close"
            if $hdr->{Connection} =~ /close/;
    } elsif ($self->{version} < 1.1) {
        if ($self->{h}{connection} =~ /keep-alive/i) {
            $hdr->{Connection} = "Keep-Alive";
        } else {
            $self->{h}{connection} = "close";
        }
    }

    # Optional gzip; $gz_note ends up in the log as "GZ<percent saved>".
    my $gz_note = "";
    my $compressible =
           $self->{method} ne "HEAD"
        && $self->{h}{"accept-encoding"} =~ /\bgzip\b/
        && 400 < length($content)
        && $hdr->{"Content-Length"} == length($content)
        && !exists $hdr->{"Content-Encoding"};

    if ($compressible) {
        my $plain_size = length $content;
        $hdr->{"Content-Encoding"} = "gzip";
        $content = Compress::Zlib::memGzip(\$content);
        $hdr->{"Content-Length"} = length $content;
        $gz_note = sprintf "GZ%02d", 100 - 100 * (length($content) / $plain_size);
    }

    # Assemble status line, headers and body.
    my $res = "HTTP/1.1 $code $msg\015\012"
            . "Date: $HTTP_NOW\015\012";

    while (my ($name, $value) = each %$hdr) {
        $res .= "$name: $value\015\012";
    }
    $res .= "\015\012";

    if (defined $content and $self->{method} ne "HEAD") {
        $res .= $content;
    }

    # Access log entry.
    my $stamp = POSIX::strftime("%Y-%m-%d %H:%M:%S", gmtime $::NOW);
    my $log = $stamp
            . " $self->{remote_id} \"$self->{uri}\" $code " . $hdr->{"Content-Length"} . $gz_note
            . " \"$self->{h}{referer}\"\n";

    print {$::accesslog} $log if $::accesslog;
    print STDERR $log;

    $tbf_top->request(length($res), 1e6);
    $self->{written} += print {$self->{fh}} $res;
}
242
# Send an error response and abort the current request.
#
#   $code, $msg - status code and reason phrase
#   $hdr        - optional hash ref of extra headers
#   $content    - optional body; when undefined a plain-text "$code $msg"
#                 body with matching Content-Type/Content-Length is used
#
# Always forces "Connection: close". Never returns: after the response has
# been sent it dies with an object blessed into class "err", which callers
# recognise (via ref $@) as "response already sent".
sub err {
    my ($self, $code, $msg, $hdr, $content) = @_;

    if (!defined $content) {
        $content = "$code $msg\n";
        $hdr->{"Content-Type"}   = "text/plain";
        $hdr->{"Content-Length"} = length $content;
    }
    $hdr->{"Connection"} = "close";

    $self->response($code, $msg, $hdr, $content);

    die bless {}, 'err';
}
258
# Serve requests on this connection until it is closed.
#
# For every request: read the header block, parse the request line and the
# headers, derive the per-client id, enforce active blocks, work out server
# name and port, then map the URI and respond. Errors reported through
# ->err arrive as blessed exceptions and only end the current request;
# any other exception is re-thrown to the caller. The loop ends when the
# connection is to be closed or a follow-up request never arrives.
sub handle {
    my $self = shift;
    my $fh = $self->{fh};

    my $host;

    $fh->timeout($::REQ_TIMEOUT);
    while () {
        $self->{reqs}++;

        # read request and parse first line
        my $req = $fh->readline("\015\012\015\012");

        unless (defined $req) {
            if (exists $self->{version}) {
                # an earlier request was already parsed on this connection:
                # just stop instead of reporting a timeout
                last;
            } else {
                $self->err(408, "request timeout");
            }
        }

        $self->{h} = {};

        $fh->timeout($::RES_TIMEOUT);

        # The request target must not contain control characters: CR/LF in
        # it would otherwise end up verbatim in the access log and in the
        # Location header of directory redirects. This is the same
        # character class the header-name pattern below uses.
        # /g leaves pos() after the request line for the \G header parser.
        $req =~ /^(?:\015\012)?
                  (GET|HEAD) \040+
                  ([^\000-\040]+) \040+
                  HTTP\/([0-9]+\.[0-9]+)
                  \015\012/gx
            or $self->err(405, "method not allowed", { Allow => "GET,HEAD" });

        $self->{method} = $1;
        $self->{uri} = $2;
        $self->{version} = $3;

        $3 =~ /^1\./
            or $self->err(506, "http protocol version $3 not supported");

        # parse headers
        {
            my (%hdr, $h, $v);

            # repeated headers are joined with ","; every value gets a
            # leading "," here which is stripped again below
            $hdr{lc $1} .= ",$2"
                while $req =~ /\G
                    ([^:\000-\040]+):
                    [\011\040]*
                    ((?: [^\015\012]+ | \015\012[\011\040] )*)
                    \015\012
                /gxc;

            # the header block must end exactly here
            $req =~ /\G\015\012$/
                or $self->err(400, "bad request");

            $self->{h}{$h} = substr $v, 1
                while ($h, $v) = each %hdr;
        }

        # remote id should be unique per user
        my $id = $self->{remote_addr};

        if (exists $self->{h}{"client-ip"}) {
            $id .= "[".$self->{h}{"client-ip"}."]";
        } elsif (exists $self->{h}{"x-forwarded-for"}) {
            $id .= "[".$self->{h}{"x-forwarded-for"}."]";
        }

        $self->{remote_id} = $id;

        # register this connection under its id; "local" removes the entry
        # again when this loop iteration is left, however that happens
        weaken (local $conn{$id}{$self*1} = $self);

        if ($blocked{$id}) {
            $self->err_blocked
                if $blocked{$id}[0] > $::NOW;

            # the block has expired
            delete $blocked{$id};
        }

        # find out server name and port
        if ($self->{uri} =~ s/^http:\/\/([^\/?#]*)//i) {
            $host = $1;
        } else {
            $host = $self->{h}{host};
        }

        if (defined $host) {
            $self->{server_port} = $host =~ s/:([0-9]+)$// ? $1 : 80;
        } else {
            # no host given by the client: fall back to the local address
            ($self->{server_port}, $host)
                = unpack_sockaddr_in $self->{fh}->sockname
                    or $self->err(500, "unable to get socket name");
            $host = inet_ntoa $host;
        }

        $self->{server_name} = $host;

        # same registration per (id, uri), also limited to this iteration
        weaken (local $uri{$id}{$self->{uri}}{$self*1} = $self);

        eval {
            $self->map_uri;
            $self->respond;
        };

        # blessed exceptions mean "response already sent"; anything else is
        # a real error and is passed on
        die if $@ && !ref $@;

        last if $self->{h}{connection} =~ /close/i;

        $httpevent->broadcast;

        $fh->timeout($::PER_TIMEOUT);
    }
}
371
# Block this client and end the current request.
#
#   $_[0] - how long the block lasts, in seconds from now
#   $_[1] - reason, stored alongside the expiry time
#
# Records [expiry, reason] in %blocked under the connection's remote id,
# logs the fact and hands over to ->err_blocked.
sub block {
    my ($self, $duration, $reason) = @_;
    my $id = $self->{remote_id};

    $blocked{$id} = [$::NOW + $duration, $reason];
    $self->slog(2, "blocked ip $id");
    $self->err_blocked;
}
379
# uri => path mapping
#
# Translates the request's server name and URI into a filesystem path
# below $::DOCROOT ("$::DOCROOT/<host><uri>"), stores the cleaned URI in
# {name} and the path in {path}, then runs ->access_check.
# Answers 400 (through ->err, which does not return) when host or URI
# would lead outside the document root.
sub map_uri {
    my $self = shift;
    my $host = $self->{server_name};
    my $uri = $self->{uri};

    # The host comes from the client (Host header or absolute request URI)
    # and becomes a directory name below the document root, so it must not
    # be able to act as a path: no slashes, no NUL, and not "." or "..".
    ($host =~ m%[/\000]% or $host =~ m%^\.\.?$%)
        and $self->err(400, "bad request");

    # some massaging, also makes it more secure
    $uri =~ s/%([0-9a-fA-F][0-9a-fA-F])/chr hex $1/ge;  # decode %XX escapes
    $uri =~ s%//+%/%g;                                  # collapse repeated slashes
    $uri =~ s%/\.(?=/|$)%%g;                            # drop "/." segments
    1 while $uri =~ s%/[^/]+/\.\.(?=/|$)%%;             # resolve "/segment/.."

    # whatever ".." is left at the front would climb out of the host directory
    $uri =~ m%^/?\.\.(?=/|$)%
        and $self->err(400, "bad request");

    # a decoded NUL byte has no place in a file name
    $uri =~ m%\000%
        and $self->err(400, "bad request");

    $self->{name} = $uri;

    # now do the path mapping
    $self->{path} = "$::DOCROOT/$host$uri";

    $self->access_check;
}
402
# Run an external program with its standard output connected to the
# client socket.
#
#   $path - program to execute
#
# The child redirects STDOUT to the client, changes into $::DOCROOT, sets a
# few CGI-style environment variables and execs $path; if chdir or exec
# fails it exits. The parent never returns normally: it dies (plain "die"),
# which makes the caller give up this connection while the child keeps
# writing to the socket. A failed fork dies with an explanatory message
# instead of being mistaken for the child branch.
sub _cgi {
    my $self = shift;
    my $path = shift;

    # fork returns undef on failure; "0 == undef" would be true, so the
    # failure case has to be separated before comparing against 0
    my $pid = fork;
    defined $pid
        or die "unable to fork: $!";

    # no two-way xxx supported
    if ($pid == 0) {
        open STDOUT, ">&".fileno($self->{fh});
        if (chdir $::DOCROOT) {
            $ENV{SERVER_SOFTWARE} = "thttpd-myhttpd"; # we are thttpd-alike
            $ENV{HTTP_HOST} = $self->{server_name};
            $ENV{HTTP_PORT} = $self->{server_port};
            $ENV{SCRIPT_NAME} = $self->{name};
            exec $path;
        }
        # only reached when chdir or exec failed
        Coro::State::_exit(0);
    } else {
        die;
    }
}
423
# Return the server name as it should appear in a URL: the bare name when
# the port is 80, "name:port" otherwise.
sub server_hostport {
    my ($self) = @_;
    my ($name, $port) = @{$self}{qw(server_name server_port)};

    return $name if $port == 80;
    return "$name:$port";
}
429
# Produce the response for the already mapped request.
#
# Names below /internal/ are dispatched through %::internal. Everything
# else is looked up on disk: readable directories are redirected to their
# slash-terminated form, answered with 304 when not modified, or served
# through index.html / a generated listing; readable non-executable files
# are served after the per-client transfer limit has been enforced.
# Anything else is a 404. All error answers go through ->err, which does
# not return.
#
# The file tests rely on the "_" stat buffer filled by the initial stat,
# so their order relative to other stat calls matters.
sub respond {
    my $self = shift;
    my $path = $self->{path};

    # built-in handlers
    if ($self->{name} =~ s%^/internal/([^/]+)%%) {
        my $internal = $::internal{$1}
            or $self->err(404, "not found");
        return $internal->($self);
    }

    stat $path
        or $self->err(404, "not found");

    $self->{stat} = [stat _];

    # idiotic netscape sends idiotic headers AGAIN
    my $ims = 0;
    if ($self->{h}{"if-modified-since"} =~ /^([^;]+)/) {
        $ims = str2time($1);
    }

    if (-d _ && -r _) {
        # directory
        if ($path !~ /\/$/) {
            # create a redirect to get the trailing "/"
            # we don't try to avoid the :80
            $self->err(301, "moved permanently", { Location => "http://".$self->server_hostport."$self->{uri}/" });
        }

        $ims < $self->{stat}[9]
            or $self->err(304, "not modified");

        if (-r "$path/index.html") {
            # replace directory "size" by index.html filesize
            $self->{stat} = [stat ($self->{path} .= "/index.html")];
            return $self->handle_file($queue_index, $tbf_top);
        }

        return $self->handle_dir;
    }

    if (-f _ && -r _) {
        -x _ and $self->err(403, "forbidden");

        # Too many connections from this client: give the others up to ten
        # seconds to finish, then block the client.
        my $timeout = $::NOW + 10;
        while (keys %{$conn{$self->{remote_id}}} > $::MAX_TRANSFERS_IP) {
            if ($timeout < $::NOW) {
                $self->block($::BLOCKTIME, "too many connections");
            } else {
                $httpevent->wait;
            }
        }

        return $self->handle_file($queue_file, $tbf_top);
    }

    $self->err(404, "not found");
}
489
# Answer a directory request with the listing produced by ->diridx,
# sent as text/html with the directory's cached mtime as Last-Modified.
sub handle_dir {
    my ($self) = @_;
    my $listing = $self->diridx;

    my %headers = (
        "Content-Type"   => "text/html",
        "Content-Length" => length($listing),
        "Last-Modified"  => time2str ($self->{stat}[9]),
    );

    $self->response(200, "ok", \%headers, $listing);
}
502
# Send the file at $self->{path}, honouring a "Range: bytes=..." header.
#
#   $queue - transfer queue; ->start_transfer(bytes) yields the slot object
#            whose ->try is polled while the transfer runs
#   $tbf   - rate limiter; ->request(bytes) is called before every write
#
# Expects $self->{stat} to hold the stat list of the file (size at [7],
# mtime at [9]). Sends the headers through ->response and, for GET
# requests, streams the selected bytes using Linux::AIO reads.
#
# Range handling: the comma-separated specs are tried in order and the
# first satisfiable one is served as 206. If none is satisfiable the answer
# is 416; if a spec is syntactically invalid the Range header is ignored
# and the whole file is sent with 200.
#
# Dies with a plain string if the file can no longer be opened, and with an
# "err" object if the client gets blocked during the transfer.
sub handle_file {
    my ($self, $queue, $tbf) = @_;
    my $length = $self->{stat}[7];
    my $hdr = {
        # Taken from the cached stat list, not from the shared "_" stat
        # buffer: callers may wait (and let other coroutines stat other
        # files) between their stat and this call.
        "Last-Modified" => time2str ($self->{stat}[9]),
    };

    my @code = (200, "ok");

    # first and last byte to send, inclusive; defaults to the whole file
    my ($ofs, $end) = (0, $length - 1);

    if ($self->{h}{range} =~ /^bytes=(.*)$/) {
        my ($satisfiable, $malformed);

        for my $spec (split /,/, $1) {
            my ($first, $last);

            if ($spec =~ /^-(\d+)$/) {
                # suffix range: the last N bytes; a suffix longer than the
                # file selects the whole file
                ($first, $last) = ($length - $1, $length - 1);
                $first = 0 if $first < 0;
            } elsif ($spec =~ /^(\d+)-(\d*)$/) {
                # open-ended, or ending beyond the file: stop at the last byte
                ($first, $last) = ($1, ($2 eq "" || $2 >= $length) ? $length - 1 : $2);
            } else {
                $malformed = 1;
                last;
            }

            if ($first >= 0 && $first < $length && $last >= 0 && $last >= $first) {
                ($ofs, $end, $satisfiable) = ($first, $last, 1);
                last;
            }
        }

        if ($malformed) {
            # invalid syntax: behave as if no Range header had been sent
        } elsif (!$satisfiable) {
            $hdr->{"Content-Range"} = "bytes */$length";
            # the 416 answer carries an empty body
            $hdr->{"Content-Length"} = 0;
            $self->err(416, "not satisfiable", $hdr, "");
        } else {
            # check for segmented downloads
            if ($ofs && $::NO_SEGMENTED) {
                my $timeout = $::NOW + 15;
                while (keys %{$uri{$self->{remote_id}}{$self->{uri}}} > 1) {
                    if ($timeout <= $::NOW) {
                        $self->block($::BLOCKTIME, "segmented downloads are forbidden");
                        #$self->err_segmented_download;
                    } else {
                        $httpevent->wait;
                    }
                }
            }

            $hdr->{"Content-Range"} = "bytes $ofs-$end/$length";
            @code = (206, "partial content");
            $length = $end - $ofs + 1;
        }
    }

    # content type by file extension; capture into a lexical so that a path
    # without extension cannot pick up a stale $1 from an earlier match
    my ($ext) = $self->{path} =~ /\.([^.]+)$/;
    $hdr->{"Content-Type"} = $mimetype{lc $ext} || "application/octet-stream";
    $hdr->{"Content-Length"} = $length;

    $self->response(@code, $hdr, "");

    if ($self->{method} eq "GET") {
        $self->{time} = $::NOW;

        my $current = $Coro::current;

        my ($fh, $buf, $r);

        open $fh, "<", $self->{path}
            or die "$self->{path}: late open failure ($!)";

        # number of bytes still to be sent
        my $remaining = $end - $ofs + 1;

        my $transfer = $queue->start_transfer($remaining);
        my $locked;
        my $bufsize = $::WAIT_BUFSIZE; # initial buffer size

        while ($remaining > 0) {
            # until the queue slot is obtained keep using the small buffer
            unless ($locked) {
                if ($locked ||= $transfer->try($::WAIT_INTERVAL)) {
                    $bufsize = $::BUFSIZE;
                    $self->{time} = $::NOW;
                }
            }

            # the client got blocked in the meantime: give up
            if ($blocked{$self->{remote_id}}) {
                $self->{h}{connection} = "close";
                die bless {}, err::;
            }

            # asynchronous read at the current offset; the callback stores
            # the result and wakes this coroutine up again
            aio_read($fh, $ofs, ($remaining > $bufsize ? $bufsize : $remaining),
                     $buf, 0, sub {
                         $r = $_[0];
                         Coro::ready($current);
                     });
            &Coro::schedule;
            # stop on end of file as well as on a read error
            last unless $r > 0;

            $tbf->request(length $buf);
            my $w = syswrite $self->{fh}, $buf
                or last;
            $::written += $w;
            $self->{written} += $w;

            # advance; without reducing $remaining a partial range would
            # keep streaming until end of file
            $ofs += $r;
            $remaining -= $r;
        }

        close $fh;
    }
}
617
618 1;