ViewVC Help
View File | Revision Log | Show Annotations | Download File
/cvs/cvsroot/Coro/myhttpd/httpd.pl
Revision: 1.47
Committed: Tue Nov 20 01:56:21 2001 UTC (22 years, 7 months ago) by root
Content type: text/plain
Branch: MAIN
Changes since 1.46: +4 -1 lines
Log Message:
*** empty log message ***

File Contents

# Content
1 use Coro;
2 use Coro::Semaphore;
3 use Coro::Event;
4 use Coro::Socket;
5 use Coro::Signal;
6
7 use HTTP::Date;
8 use POSIX ();
9
10 no utf8;
11 use bytes;
12
13 # at least on my machine, this thingy serves files
14 # quite a bit faster than apache, ;)
15 # and quite a bit slower than thttpd :(
16
17 $SIG{PIPE} = 'IGNORE';
18
# Handle of the access log.  It stays undefined when no access log is
# configured; code that writes log entries checks it before printing.
our $accesslog;

# Open the access log for appending when $ACCESS_LOG is set.
# NOTE(review): $ACCESS_LOG is not assigned anywhere in this file; presumably
# it comes from a configuration file loaded before this one - confirm.
if ($ACCESS_LOG) {
    use IO::Handle;    # provides the autoflush method used below

    # Three-argument open: the configured value is always treated as a plain
    # file name and is never scanned for mode characters or pipe symbols.
    open $accesslog, ">>", $ACCESS_LOG
        or die "$ACCESS_LOG: $!";

    # Flush after every print so entries are not held back in a buffer.
    $accesslog->autoflush(1);
}
27
# Print one formatted log line on standard output.
#
#   $level  - level given by the caller; accepted but not used here
#   $format - printf-style format string
#   @args   - values substituted into $format
#
# The line is prefixed with "---: " and terminated with a newline.
sub slog {
    my ($level, $format, @args) = @_;

    printf "---: $format\n", @args;
}
33
# Semaphore taken before each accept and released once a connection has
# been handled; bounds the number of connections in progress.
our $connections = Coro::Semaphore->new($MAX_CONNECTS || 250);

# Signal broadcast whenever a connection finishes a request; coroutines that
# wait for per-client limits to clear block on it.
our $httpevent = Coro::Signal->new;

# Weight given to the previous value when a transfer queue's second element
# is updated after waiting for a transfer slot.
our $wait_factor = 0.95;

# Transfer queues: index 0 is used for files below $TRANSFER_SMALL bytes,
# index 1 for everything else.  Each entry is [semaphore, number].
our @transfers = (
    [Coro::Semaphore->new($MAX_TRANSFERS_SMALL || 50), 1],
    [Coro::Semaphore->new($MAX_TRANSFERS_LARGE || 50), 1],
);

# Accepted connections ([filehandle, peername]) not yet picked up by a handler.
my @newcons;

# Idle handler coroutines waiting to be woken for a new connection.
my @pool;
46
# One "execution thread": the body of a handler coroutine.
#
# Repeatedly takes a pending connection from @newcons, builds a conn object
# for it and runs its request loop.  When no connection is pending the
# coroutine parks itself in @pool and yields, unless the pool already holds
# $MAX_POOL coroutines, in which case it terminates.
sub handler {
    while () {
        if (@newcons) {
            eval {
                conn->new(@{pop @newcons})->handle;
            };

            # Object exceptions (references) are part of normal error
            # handling and are not logged.  String errors are logged through
            # an explicit "%s" format so that a "%" inside the message (for
            # example from a file name) is never interpreted by printf.
            slog 1, "%s", "$@" if $@ && !ref $@;

            # Release the slot taken by the accept loop for this connection.
            $connections->up;
        } else {
            last if @pool >= $MAX_POOL;
            push @pool, $Coro::current;
            schedule;
        }
    }
}
63
# Start accepting connections on the given listening socket.
#
#   $_[0] - listening socket object providing an accept method
#
# The socket is recorded in @listen_sockets and a new coroutine is started
# that accepts connections forever.
sub listen_on {
    my ($socket) = @_;

    push @listen_sockets, $socket;

    # the "main thread"
    async {
        slog 1, "accepting connections";

        while () {
            # Wait for a free connection slot before accepting.
            $connections->down;

            my @accepted = $socket->accept;
            push @newcons, \@accepted;
            #slog 3, "accepted @$connections ".scalar(@pool);

            # Wake an idle handler if there is one, otherwise start another.
            if (my $idle = pop @pool) {
                $idle->ready;
            } else {
                async \&handler;
            }
        }
    };
}
85
# Primary listening socket; the server cannot run without it.
my $http_port = Coro::Socket->new(
    LocalAddr => $SERVER_HOST,
    LocalPort => $SERVER_PORT,
    ReuseAddr => 1,
    Listen    => 50,
) or die "unable to start server";

listen_on($http_port);

# Optional second listening port on the same address.
if ($SERVER_PORT2) {
    my $http_port = Coro::Socket->new(
        LocalAddr => $SERVER_HOST,
        LocalPort => $SERVER_PORT2,
        ReuseAddr => 1,
        Listen    => 50,
    ) or die "unable to start server";

    listen_on($http_port);
}
105
# Cached current time (epoch seconds) and the same instant formatted by
# time2str; both are refreshed by the timer below.
our $NOW;
our $HTTP_NOW;

# Refresh the cached clock once per second; ->now runs the callback right
# away so both values are set before the first request is served.
Event->timer(
    interval => 1,
    hard     => 1,
    cb       => sub {
        $NOW      = time;
        $HTTP_NOW = time2str($NOW);
    },
)->now;
113
114 package conn;
115
116 use Socket;
117 use HTTP::Date;
118 use Convert::Scalar 'weaken';
119 use Linux::AIO;
120
# Pass the configured $::AIO_PARALLEL value to Linux::AIO.
Linux::AIO::min_parallel($::AIO_PARALLEL);

# Run Linux::AIO's poll callback whenever its poll file descriptor becomes
# readable.
Event->io(
    fd    => Linux::AIO::poll_fileno(),
    poll  => 'r',
    async => 1,
    cb    => \&Linux::AIO::poll_cb,
);

our %conn;      # $conn{ip}{self} => connobj
our %uri;       # $uri{ip}{uri}{self}
our %blocked;   # id => time; compared against $::NOW in handle
our %mimetype;  # lower-cased file extension => content type
131
# Load the extension => content-type table from the file "mime_types" in
# the current directory into %mimetype.
#
# Each useful line has the form "<extension><TAB(s)><type>".  Lines starting
# with "#" and lines that do not match this form are skipped.  Extensions
# are stored lower-cased.  If the file cannot be opened a message is printed
# and %mimetype is left unchanged.
sub read_mimetypes {
    if (open my $fh, "<", "mime_types") {
        # A lexical line variable keeps the caller's $_ untouched.
        while (my $line = <$fh>) {
            # The extension is one or more non-space characters not starting
            # with "#", so one-letter extensions such as "c" are accepted.
            if ($line =~ /^([^#\s]\S*)\t+(\S+)$/) {
                $mimetype{lc $1} = $2;
            }
        }
        close $fh;
    } else {
        print "cannot open mime_types\n";
    }
}

read_mimetypes;
146
# Construct a connection object.
#
#   $class    - class to bless into
#   $fh       - client socket handle
#   $peername - packed socket address of the peer
#
# Returns the new object with fh, remote_addr (dotted-quad peer address) and
# time (current $::NOW) set.  If the peer address cannot be decoded the
# exception propagates to the caller.
sub new {
    my $class    = shift;
    my $fh       = shift;
    my $peername = shift;
    my $self     = bless { fh => $fh }, $class;

    # Count the connection as soon as the object exists.  DESTROY always
    # decrements $::conns, so incrementing only after the fallible address
    # decoding below would let the counter drift whenever decoding fails.
    $::conns++;

    my (undef, $iaddr) = unpack_sockaddr_in $peername
        or $self->err(500, "unable to decode peername");

    $self->{remote_addr} = inet_ntoa $iaddr;
    $self->{time}        = $::NOW;

    $self;
}
162
# Destructor: decrement the global connection counter and remove this
# connection from the bookkeeping tables via eoconn.
sub DESTROY {
    my ($self) = @_;

    --$::conns;
    $self->eoconn;
}
168
# End of connection (also called at the end of every request): remove this
# object from the per-client tables %conn and %uri and wake all coroutines
# waiting on $httpevent.
#
# Sub-hashes that become empty are removed as well, so the tables do not
# keep one entry for every client id and URI ever seen.  Nothing is touched
# when no remote_id was assigned yet (no request has been parsed), which
# also avoids creating table entries as a side effect.
sub eoconn {
    my $self = shift;
    my $id   = $self->{remote_id};

    # clean up hints
    if (defined $id) {
        my $key = $self*1;    # numeric form of the reference, used as hash key

        if (my $by_conn = $conn{$id}) {
            delete $by_conn->{$key};
            delete $conn{$id} unless %$by_conn;
        }

        if (my $by_uri = $uri{$id}) {
            my $name  = $self->{uri};
            my $users = defined $name ? $by_uri->{$name} : undef;

            if ($users) {
                delete $users->{$key};
                delete $by_uri->{$name} unless %$users;
            }
            delete $uri{$id} unless %$by_uri;
        }
    }

    $httpevent->broadcast;
}
179
# Log a message for this connection through main::slog, prefixed with the
# client's remote_id (or remote_addr when no id has been set yet).
#
#   $_[0] - log level (after $self has been shifted off)
#   $_[1] - message text
#
# The text is passed as an argument to a fixed "%s" format, never as the
# format itself: the prefix can contain request header values, and a "%" in
# it must not be interpreted as a printf directive.
sub slog {
    my $self = shift;
    main::slog($_[0], "%s", ($self->{remote_id} || $self->{remote_addr}) ."> $_[1]");
}
184
# Send the status line, headers and optional body of a response, and write
# an access-log entry.
#
#   $code    - numeric status code
#   $msg     - reason phrase
#   $hdr     - hash reference of response headers (may be modified here)
#   $content - body text; omitted from the output for HEAD requests
#
# Connection handling: a "close" in the supplied Connection header, or a
# pre-1.1 request that did not ask for keep-alive, marks the connection to
# be closed by setting $self->{h}{connection} to "close".
sub response {
    my ($self, $code, $msg, $hdr, $content) = @_;
    my $res = "HTTP/1.1 $code $msg\015\012";

    if (exists $hdr->{Connection}) {
        if ($hdr->{Connection} =~ /close/) {
            $self->{h}{connection} = "close"
        }
    } else {
        if ($self->{version} < 1.1) {
            if ($self->{h}{connection} =~ /keep-alive/i) {
                $hdr->{Connection} = "Keep-Alive";
            } else {
                $self->{h}{connection} = "close"
            }
        }
    }

    $res .= "Date: $HTTP_NOW\015\012";

    while (my ($h, $v) = each %$hdr) {
        $res .= "$h: $v\015\012"
    }
    $res .= "\015\012";

    $res .= $content if defined $content and $self->{method} ne "HEAD";

    my $log = (POSIX::strftime "%Y-%m-%d %H:%M:%S", gmtime $NOW).
              " $self->{remote_addr} \"$self->{uri}\" $code ".$hdr->{"Content-Length"}." \"$self->{h}{referer}\"\n";

    print $accesslog $log if $accesslog;
    print STDERR $log;

    # print returns only a success flag, so the byte counter is advanced by
    # the length of what was sent, and only when the print succeeded.
    my $ok = print {$self->{fh}} $res;
    $self->{written} += length $res if $ok;
}
221
# Send an error response and abort processing of the current request.
#
#   $code    - numeric status code
#   $msg     - reason phrase
#   $hdr     - optional hash reference of extra response headers
#   $content - optional body; when undefined a plain-text "<code> <msg>"
#              body with matching Content-Type/Content-Length is generated
#
# The response always carries "Connection: close".  This method never
# returns: it dies with an object blessed into class "err".
sub err {
    my ($self, $code, $msg, $hdr, $content) = @_;

    if (!defined $content) {
        $content = "$code $msg\n";
        $hdr->{"Content-Type"}   = "text/plain";
        $hdr->{"Content-Length"} = length $content;
    }
    $hdr->{"Connection"} = "close";

    $self->response($code, $msg, $hdr, $content);

    die bless {}, "err";
}
237
# Request loop for one connection.
#
# For every request on the connection: read and parse the request line and
# headers, derive a per-client id, enforce the blocked list and the
# per-client connection limit, determine server name and port, register the
# request in %conn/%uri, then map the URI and send the response.  The loop
# ends when the connection is marked "close" or when reading a follow-up
# request fails.  Errors are reported through $self->err, which dies.
sub handle {
    my $self = shift;
    my $fh = $self->{fh};

    my $host;

    $fh->timeout($::REQ_TIMEOUT);
    while () {
        $self->{reqs}++;

        # read request and parse first line
        my $req = $fh->readline("\015\012\015\012");

        unless (defined $req) {
            if (exists $self->{version}) {
                # A request was already served on this connection: just stop.
                last;
            } else {
                $self->err(408, "request timeout");
            }
        }

        $self->{h} = {};

        $fh->timeout($::RES_TIMEOUT);

        $req =~ /^(?:\015\012)?
                 (GET|HEAD) \040+
                 ([^\040]+) \040+
                 HTTP\/([0-9]+\.[0-9]+)
                 \015\012/gx
            or $self->err(405, "method not allowed", { Allow => "GET,HEAD" });

        $self->{method} = $1;
        $self->{uri} = $2;
        $self->{version} = $3;

        # 505 is the status code for an unsupported protocol version.
        $3 =~ /^1\./
            or $self->err(505, "http protocol version $3 not supported");

        # parse headers
        {
            my (%hdr, $h, $v);

            # Optional whitespace after the colon and at the start of a
            # continuation line is TAB (\011) or space (\040).  Repeated
            # headers are joined with commas.
            $hdr{lc $1} .= ",$2"
                while $req =~ /\G
                    ([^:\000-\040]+):
                    [\011\040]*
                    ((?: [^\015\012]+ | \015\012[\011\040] )*)
                    \015\012
                /gxc;

            $req =~ /\G\015\012$/
                or $self->err(400, "bad request");

            # Drop the leading comma added by the accumulation above.
            $self->{h}{$h} = substr $v, 1
                while ($h, $v) = each %hdr;
        }

        # remote id should be unique per user
        my $id = $self->{remote_addr};

        if (exists $self->{h}{"client-ip"}) {
            $id .= "[".$self->{h}{"client-ip"}."]";
        } elsif (exists $self->{h}{"x-forwarded-for"}) {
            $id .= "[".$self->{h}{"x-forwarded-for"}."]";
        }

        $self->{remote_id} = $id;

        if ($blocked{$id}) {
            $self->err_blocked($blocked{$id})
                if $blocked{$id} > $::NOW;

            delete $blocked{$id};
        }

        # Count registered connections with keys(): a hash evaluated in
        # numeric context is not a key count on older perls.
        if (scalar(keys %{ $conn{$id} || {} }) >= $::MAX_CONN_IP) {
            my $delay = $::PER_TIMEOUT + $::NOW + 15;
            while (scalar(keys %{ $conn{$id} || {} }) >= $::MAX_CONN_IP) {
                if ($delay < $::NOW) {
                    $self->slog(2, "blocked ip $id");
                    $self->err_blocked;
                } else {
                    $httpevent->wait;
                }
            }
        }

        # find out server name and port
        if ($self->{uri} =~ s/^http:\/\/([^\/?#]*)//i) {
            $host = $1;
        } else {
            $host = $self->{h}{host};
        }

        if (defined $host) {
            $self->{server_port} = $host =~ s/:([0-9]+)$// ? $1 : 80;
        } else {
            # No host given by the client: fall back to the local address.
            ($self->{server_port}, $host)
                = unpack_sockaddr_in $self->{fh}->sockname
                or $self->err(500, "unable to get socket name");
            $host = inet_ntoa $host;
        }

        $self->{server_name} = $host;

        # enter ourselves into various lists
        weaken ($conn{$id}{$self*1} = $self);
        weaken ($uri{$id}{$self->{uri}}{$self*1} = $self);

        eval {
            $self->map_uri;
            $self->respond;
        };

        $self->eoconn;

        # Object exceptions come from err and mean the response was already
        # sent; anything else is a real error and is re-thrown.
        die if $@ && !ref $@;

        # Connection options are case-insensitive.
        last if $self->{h}{connection} =~ /close/i;

        $httpevent->broadcast;

        $fh->timeout($::PER_TIMEOUT);
    }
}
364
# uri => path mapping
#
# Decodes and normalises the request URI, stores the result in
# $self->{name}, builds the file system path "$::DOCROOT/<host><uri>" in
# $self->{path} and finally calls access_check.  Requests whose host or URI
# could make the path leave the per-host directory are answered with
# 400 (err does not return).
sub map_uri {
    my $self = shift;
    my $host = $self->{server_name};
    my $uri = $self->{uri};

    # The host name can come straight from the request and becomes a path
    # component below: refuse separators, NUL bytes and the special
    # directory names so it cannot point outside $::DOCROOT.
    $self->err(400, "bad request")
        if $host =~ m{[/\000]} or $host =~ /\A\.\.?\z/;

    # some massaging, also makes it more secure
    $uri =~ s/%([0-9a-fA-F][0-9a-fA-F])/chr hex $1/ge;

    # A decoded NUL byte has no place in a file name.
    $uri =~ /\000/
        and $self->err(400, "bad request");

    $uri =~ s%//+%/%g;                          # collapse repeated slashes
    $uri =~ s%/\.(?=/|$)%%g;                    # drop "/." components
    1 while $uri =~ s%/[^/]+/\.\.(?=/|$)%%;     # resolve "/name/.." pairs

    # Anything still starting with ".." would climb above the root.
    $uri =~ m%^/?\.\.(?=/|$)%
        and $self->err(400, "bad request");

    $self->{name} = $uri;

    # now do the path mapping
    $self->{path} = "$::DOCROOT/$host$uri";

    $self->access_check;
}
387
# Run an external program with its standard output connected to the client
# socket.
#
#   $path - program to execute
#
# The child changes into $::DOCROOT, sets a few CGI-style environment
# variables and execs $path.  The parent always dies after a successful
# fork, which unwinds the current request.
# NOTE(review): presumably the parent dies so that the server sends nothing
# further on this connection - confirm.
sub _cgi {
    my $self = shift;
    my $path = shift;

    # fork returns undef on failure.  Comparing that with 0 would be true
    # and make the server process itself run the child branch, so failure
    # is detected explicitly first.
    my $pid = fork;
    defined $pid
        or die "unable to fork for $path: $!";

    # no two-way xxx supported
    if ($pid == 0) {
        # Only exec when stdout really points at the client socket and the
        # working directory could be changed.
        if (open(STDOUT, ">&".fileno($self->{fh})) && chdir $::DOCROOT) {
            $ENV{SERVER_SOFTWARE} = "thttpd-myhttpd"; # we are thttpd-alike
            $ENV{HTTP_HOST} = $self->{server_name};
            $ENV{HTTP_PORT} = $self->{server_port};
            $ENV{SCRIPT_NAME} = $self->{name};
            exec $path;
        }
        # Reached only when setup or exec failed: leave the child at once.
        Coro::State::_exit(0);
    } else {
        die;
    }
}
408
# Return the server name for use in URLs: just the name when the port is
# 80, otherwise "name:port".
#
#   $_[0] - hash reference (or object) with server_name and server_port
sub server_hostport {
    my ($self) = @_;
    my ($name, $port) = @{$self}{qw(server_name server_port)};

    return $port == 80 ? $name : "$name:$port";
}
414
# Produce the response for the already mapped path in $self->{path}.
#
# - nonexistent or unreadable paths: 404
# - readable directory without trailing slash: 301 redirect adding the slash
# - readable directory: 304 if not modified since the client's
#   If-Modified-Since time, otherwise its index.html (if readable) or a
#   generated directory index
# - readable regular file: 403 if it is executable, otherwise the file
#
# All error paths go through err, which does not return.
sub respond {
    my $self = shift;
    my $path = $self->{path};

    stat $path
        or $self->err(404, "not found");

    $self->{stat} = [stat _];

    # idiotic netscape sends idiotic headers AGAIN
    # (only the text before the first ";" is parsed as a date)
    my $ims = $self->{h}{"if-modified-since"} =~ /^([^;]+)/
        ? str2time $1 : 0;

    if (-d _ && -r _) {
        # directory
        if ($path !~ /\/$/) {
            # create a redirect to get the trailing "/"
            # we don't try to avoid the :80
            $self->err(301, "moved permanently", { Location => "http://".$self->server_hostport."$self->{uri}/" });
        } else {
            # A 304 response must not carry a body: pass an explicit empty
            # body so err does not generate its default text.
            $ims < $self->{stat}[9]
                or $self->err(304, "not modified", {}, "");

            if (-r "$path/index.html") {
                # replace directory "size" by index.html filesize
                $self->{stat}[7] = (stat ($self->{path} .= "/index.html"))[7];
                $self->handle_file;
            } else {
                $self->handle_dir;
            }
        }
    } elsif (-f _ && -r _) {
        # Executable files are never served as content.
        -x _ and $self->err(403, "forbidden");
        $self->handle_file;
    } else {
        $self->err(404, "not found");
    }
}
453
# Send a generated directory index (from diridx) as a 200 text/html
# response.  Last-Modified is taken from the most recent stat result.
sub handle_dir {
    my ($self) = @_;

    my $listing = $self->diridx;
    my %headers = (
        "Content-Type"   => "text/html",
        "Content-Length" => length($listing),
        "Last-Modified"  => time2str((stat _)[9]),
    );

    $self->response(200, "ok", \%headers, $listing);
}
466
# Send the file in $self->{path}, honouring a "Range: bytes=..." header.
#
# Sends the response headers (200, or 206 for a satisfiable range; 416 via
# err when no listed range is satisfiable) and, for GET requests, streams
# the selected bytes to the client after obtaining a slot in the transfer
# queue that matches the file size.
sub handle_file {
    my $self = shift;
    my $length = $self->{stat}[7];
    # Index 0 for files below $::TRANSFER_SMALL bytes, index 1 otherwise.
    my $queue = $::transfers[$length >= $::TRANSFER_SMALL];
    my $hdr = {
        "Last-Modified" => time2str ((stat _)[9]),
    };

    my @code = (200, "ok");
    my ($l, $h);    # first and last byte position to send

    if ($self->{h}{range} =~ /^bytes=(.*)$/) {
        # "satisfiable"   - a usable range was found: answer 206
        # "ignore"        - syntax not understood: send the whole file, 200
        # "unsatisfiable" - no listed range can be served: answer 416
        my $verdict = "unsatisfiable";

        for my $spec (split /,/, $1) {
            if ($spec =~ /^-(\d+)$/) {
                # Suffix range: the last N bytes.  A suffix longer than the
                # file selects the whole file.
                my $first = $length - $1;
                $first = 0 if $first < 0;
                ($l, $h) = ($first, $length - 1);
            } elsif ($spec =~ /^(\d+)-(\d*)$/) {
                # An absent end, or one at or beyond the end of the file,
                # means "up to the last byte".
                ($l, $h) = ($1, ($2 ne "" && $2 < $length) ? $2 : $length - 1);
            } else {
                ($l, $h) = (0, $length - 1);
                $verdict = "ignore";
                last;
            }

            if ($l >= 0 && $l < $length && $h >= 0 && $h >= $l) {
                $verdict = "satisfiable";
                last;
            }
        }

        if ($verdict eq "unsatisfiable") {
            $hdr->{"Content-Range"} = "bytes */$length";
            $hdr->{"Content-Length"} = $length;
            $self->err(416, "not satisfiable", $hdr, "");
        }

        if ($verdict eq "satisfiable") {
            # check for segmented downloads
            if ($l && $::NO_SEGMENTED) {
                my $delay = $::NOW + $::PER_TIMEOUT + 15;
                # keys() gives the number of registered requests for this
                # client and URI; a hash in numeric context does not on
                # older perls.
                while (scalar(keys %{ $uri{$self->{remote_id}}{$self->{uri}} || {} }) > 1) {
                    if ($delay <= $::NOW) {
                        $self->err_segmented_download;
                    } else {
                        $httpevent->wait;
                    }
                }
            }

            $hdr->{"Content-Range"} = "bytes $l-$h/$length";
            @code = (206, "partial content");
            $length = $h - $l + 1;
        }
    } else {
        ($l, $h) = (0, $length - 1);
    }

    # Look the extension up only when the file name really has one;
    # otherwise $1 would still hold the capture of an earlier match.
    my ($ext) = $self->{path} =~ m{\.([^./]+)$};
    $hdr->{"Content-Type"} = (defined $ext && $mimetype{lc $ext}) || "application/octet-stream";
    $hdr->{"Content-Length"} = $length;

    $self->response(@code, $hdr, "");

    if ($self->{method} eq "GET") {
        $self->{time} = $::NOW;

        # The queue's second element is scaled up while this request waits
        # for a slot and afterwards blended with the time actually waited,
        # weighted by $::wait_factor.
        my $fudge = $queue->[0]->waiters;
        $fudge = $fudge ? ($fudge+1)/$fudge : 1;

        $queue->[1] *= $fudge;
        my $transfer = $queue->[0]->guard;    # slot is held until this scope ends

        if ($fudge != 1) {
            $queue->[1] /= $fudge;
            $queue->[1] = $queue->[1] * $::wait_factor
                        + ($::NOW - $self->{time}) * (1 - $::wait_factor);
        }
        $self->{time} = $::NOW;

        $self->{fh}->writable or return;

        my ($fh, $buf, $r);
        my $current = $Coro::current;
        open $fh, "<", $self->{path}
            or die "$self->{path}: late open failure ($!)";

        # From here on $h is the number of bytes still to send and $l the
        # file offset of the next read.
        $h -= $l - 1;

        while ($h > 0) {
            # Asynchronous read: the callback stores the result and wakes
            # this coroutine again.
            aio_read($fh, $l, ($h > $::BUFSIZE ? $::BUFSIZE : $h),
                     $buf, 0, sub {
                         $r = $_[0];
                         Coro::ready($current);
                     });
            Coro::schedule();

            # Stop at end of file and on read errors (zero or negative).
            last unless $r > 0;

            my $w = syswrite $self->{fh}, $buf
                or last;
            $::written += $w;
            $self->{written} += $w;
            $l += $r;
            # Without this the loop would run to end of file even for a
            # partial range.
            $h -= $r;
        }

        close $fh;
    }
}
576
577 1;