ViewVC Help
View File | Revision Log | Show Annotations | Download File
/cvs/Coro/myhttpd/httpd.pl
Revision: 1.22
Committed: Fri Aug 17 04:10:38 2001 UTC (22 years, 10 months ago) by root
Content type: text/plain
Branch: MAIN
Changes since 1.21: +1 -1 lines
Log Message:
*** empty log message ***

File Contents

# Content
1 use Coro;
2 use Coro::Semaphore;
3 use Coro::Event;
4 use Coro::Socket;
5
6 no utf8;
7 use bytes;
8
9 # at least on my machine, this thingy serves files
10 # quite a bit faster than apache, ;)
11 # and quite a bit slower than thttpd :(
12
13 $SIG{PIPE} = 'IGNORE';
14
# Write one log line to STDOUT.
#
#   slog $level, $format, @args
#
# $format and @args are handed to printf; the line is prefixed with "---: "
# and terminated with a newline.  $level is accepted for the callers'
# benefit but is not used for filtering here.
sub slog {
    my ($level, $format, @args) = @_;

    printf "---: $format\n", @args;
}
20
# Counting semaphore initialised with $MAX_CONNECTS: the acceptor takes one
# unit per accepted connection and a worker returns it when it is done.
my $connections = Coro::Semaphore->new($MAX_CONNECTS);

my @newcons;    # accepted connections (array refs) waiting for a worker
my @pool;       # worker coroutines that are parked waiting for work
25
# one "execution thread"
#
# Body of a worker coroutine.  It repeatedly takes an accepted connection
# from @newcons and runs conn->new(...)->handle on it.  When there is no
# work it parks itself in @pool and yields; if the pool already holds
# $MAX_POOL idle workers the coroutine ends instead.
sub handler {
    while () {
        my $new = pop @newcons;
        if ($new) {
            eval {
                conn->new(@$new)->handle;
            };
            # conn::err dies with a blessed object after it has already sent
            # the error response, so only plain-string exceptions are logged.
            # The text goes through "%s" because it can contain request data
            # (e.g. a decoded path) and must not be interpreted as a printf
            # format.
            slog(1, "%s", "$@") if $@ && !ref $@;
            $connections->up;
        } else {
            last if @pool >= $MAX_POOL;
            push @pool, $Coro::current;
            schedule;
        }
    }
}
43
# The listening socket, bound to $SERVER_HOST:$SERVER_PORT.
my $http_port = Coro::Socket->new(
    LocalAddr => $SERVER_HOST,
    LocalPort => $SERVER_PORT,
    ReuseAddr => 1,
    Listen    => 50,
) or die "unable to start server";

push @listen_sockets, $http_port;
52
# the "main thread"
#
# Accept loop: take a unit from the connection semaphore, accept one
# connection, queue it on @newcons, refresh the cached clock in $::NOW and
# then either wake an idle worker from @pool or start a new one.
async {
    slog(1, "accepting connections");

    for (;;) {
        $connections->down;
        push @newcons, [$http_port->accept];
        #slog 3, "accepted @$connections ".scalar(@pool);
        $::NOW = time;

        if (!@pool) {
            # nobody is idle, start another worker
            async \&handler;
            next;
        }

        (pop @pool)->ready;
    }
};
69
70 package conn;
71
72 use Socket;
73 use HTTP::Date;
74 use Convert::Scalar 'weaken';
75 use Linux::AIO;
76
# Configure Linux::AIO with $::AIO_PARALLEL.
Linux::AIO::min_parallel($::AIO_PARALLEL);

# Run Linux::AIO::poll_cb whenever the AIO poll descriptor becomes readable.
Event->io(
    fd    => Linux::AIO::poll_fileno(),
    poll  => 'r',
    async => 1,
    cb    => \&Linux::AIO::poll_cb,
);

# Parked idle watcher whose callback is Coro::schedule; handle_file calls
# ->now on it from the aio_read completion callback.
my $scheduler = Event->idle(
    max    => 0,
    min    => 0,
    prio   => 4,
    parked => 1,
    cb     => \&Coro::schedule,
);

our %conn;      # $conn{ip}{numified connection ref} => connobj (weak)
our %blocked;   # $blocked{ip} => time until which the ip stays blocked
our %mimetype;  # lower-cased file extension => content type
89
# Fill %mimetype from the file "mime_types" in the current directory.
#
# Each usable line has the form "<extension><TAB(s)><content-type>"; lines
# starting with '#' and lines that do not match are skipped.  Extensions are
# stored lower-cased.  A missing or unreadable file only produces a message,
# the table is simply left as it is.
sub read_mimetypes {
    if (open my $fh, "<", "mime_types") {
        # a lexical line variable keeps the caller's $_ intact
        while (my $line = <$fh>) {
            # [^#\s]\S* also accepts one-character extensions such as "c"
            if ($line =~ /^([^#\s]\S*)\t+(\S+)$/) {
                $mimetype{lc $1} = $2;
            }
        }
        close $fh;
    } else {
        print "cannot open mime_types\n";
    }
}

read_mimetypes();
104
# Constructor: conn->new($peername, $fh)
#
# $peername is a packed sockaddr_in and $fh the client socket.  The object
# records the socket, the peer's dotted-quad address and the current value
# of $::NOW, enters a weak reference to itself into %conn and bumps the
# global connection counter $::conns.  If the peer name cannot be unpacked
# a 500 error is raised through err.
sub new {
    my ($class, $peername, $fh) = @_;
    my $self = bless { fh => $fh }, $class;

    my @sockaddr = unpack_sockaddr_in($peername)
        or $self->err(500, "unable to decode peername");
    my $iaddr = $sockaddr[1];

    $self->{remote_addr} = inet_ntoa($iaddr);
    $self->{time}        = $::NOW;

    # enter ourselves into various lists
    weaken ($conn{$self->{remote_addr}}{$self*1} = $self);

    $::conns++;

    return $self;
}
123
# Destructor: decrements $::conns, runs the end-of-connection cleanup and
# removes this object from %conn.
sub DESTROY {
    my $self = shift;

    $::conns--;

    $self->eoconn;

    # remote_addr is unset when construction failed before it was assigned;
    # testing the slot with && does not autovivify it.
    my $ip = $self->{remote_addr};
    return unless defined $ip && $conn{$ip};

    delete $conn{$ip}{$self*1};

    # drop the per-ip table once its last connection is gone, otherwise
    # %conn keeps one empty hash for every address ever seen
    delete $conn{$ip} unless keys %{$conn{$ip}};
}
132
# end of connection
#
# Remove this connection from the per-ip/per-uri table %uri that handle
# fills in for every request.  Empty sub-tables are removed as well so that
# %uri does not keep growing.  Calling it for a connection that has no entry
# (for instance before any request was parsed) is a no-op.
sub eoconn {
    my $self = shift;

    my $ip      = $self->{remote_addr};
    my $req_uri = $self->{uri};
    return unless defined $ip && defined $req_uri;

    my $by_uri = $uri{$ip}            or return;
    my $conns  = $by_uri->{$req_uri}  or return;

    delete $conns->{$self*1};
    delete $by_uri->{$req_uri} unless keys %$conns;
    delete $uri{$ip}           unless keys %$by_uri;

    return;
}
137
# Per-connection logging: $self->slog($level, $message)
#
# Prefixes $message with the client address and forwards it to main::slog.
# The message is passed as data for a "%s" format because it regularly
# contains client-supplied text (User-Agent, Range header, ...) that must
# not be interpreted as printf directives.
sub slog {
    my ($self, $level, $msg) = @_;

    main::slog($level, "%s", "$self->{remote_addr}> $msg");
}
142
# Send a response head (and optionally a body) to the client.
#
#   $self->response($code, $msg, \%headers, $content)
#
# Builds the status line, a Date header from $::NOW and one line per entry
# of %headers.  $content is appended unless it is undefined or the request
# method is HEAD.  One access-log line is printed to STDERR.  On a
# successful print the number of bytes sent is added to $self->{written}.
sub response {
    my ($self, $code, $msg, $hdr, $content) = @_;
    my $res = "HTTP/1.1 $code $msg\015\012";

    #$res .= "Connection: close\015\012";
    $res .= "Date: ".(time2str $::NOW)."\015\012"; # slow? nah. :(

    # keys (unlike each) always starts from the beginning of the hash
    for my $h (keys %$hdr) {
        $res .= "$h: $hdr->{$h}\015\012";
    }
    $res .= "\015\012";

    $res .= $content if defined $content and $self->{method} ne "HEAD";

    print STDERR "$self->{remote_addr} \"$self->{uri}\" $code ".$hdr->{"Content-Length"}." \"$self->{h}{referer}\"\n";#d#

    # print only reports success or failure, so count the bytes ourselves;
    # handle_file accumulates byte counts in the same field
    $self->{written} += length $res
        if print {$self->{fh}} $res;
}
162
# Send an error response and abort the current connection.
#
#   $self->err($code, $msg, \%headers, $content)
#
# Without $content a text/plain body "$code $msg" is generated together
# with matching Content-Type and Content-Length headers.  "Connection:
# close" is always added.  After the response has been sent the sub dies
# with an object blessed into package "err"; it never returns.
sub err {
    my ($self, $code, $msg, $hdr, $content) = @_;

    if (!defined $content) {
        $content = "$code $msg";
        @$hdr{"Content-Type", "Content-Length"} = ("text/plain", length $content);
    }
    $hdr->{"Connection"} = "close";

    $self->response($code, $msg, $hdr, $content);

    die bless({}, 'err');
}
178
# Block the client's address and tell it so.
#
# Sets $blocked{ip} to $::NOW + $::BLOCKTIME, waits for a random delay of
# up to 20 seconds and then sends a 401 response with an explanatory HTML
# page through err, which does not return.
sub err_blocked {
    my $self = shift;

    my $ip    = $self->{remote_addr};
    my $until = $blocked{$ip} = $::NOW + $::BLOCKTIME;
    my $time  = time2str($until);

    Coro::Event::do_timer(after => 20*rand);

    my %hdr = (
        "Content-Type"     => "text/html",
        "Retry-After"      => $::BLOCKTIME,
        "Warning"          => "Please do NOT retry, you have been blocked",
        "WWW-Authenticate" => "Basic realm=\"Please do NOT retry, you have been blocked\"",
    );

    my $page = <<EOF;
<html><p>
You have been blocked because you opened too many connections. You
may retry at</p>

<p><blockquote>$time.</blockquote></p>

<p>Until then, each new access will renew the block. You might want to have a
look at the <a href="http://www.goof.com/pcg/marc/animefaq.html">FAQ</a>.</p>
</html>
EOF

    $self->err(401, "too many connections", \%hdr, $page);
}
205
# Serve all requests arriving on this connection.
#
# For every request: read the request head, enforce the per-ip block list
# and connection limit, parse the request line and headers into
# $self->{method,uri,version,h}, register the request in %uri, then map
# the uri to a path and send the response.  The loop ends when the client
# closes a previously used connection, asks for "Connection: close" or
# speaks a protocol version below 1.1.  Errors are reported through err,
# which dies and thereby leaves this sub.
sub handle {
    my $self = shift;
    my $fh = $self->{fh};

    $fh->timeout($::REQ_TIMEOUT);
    while () {
        $self->{reqs}++;

        # read request and parse first line
        my $req = $fh->readline("\015\012\015\012");

        unless (defined $req) {
            if (exists $self->{version}) {
                # at least one request was served before: just finish
                last;
            } else {
                $self->err(408, "request timeout");
            }
        }

        $self->{h} = {};

        $fh->timeout($::RES_TIMEOUT);
        my $ip = $self->{remote_addr};

        if ($blocked{$ip}) {
            $self->err_blocked($blocked{$ip})
                if $blocked{$ip} > $::NOW;

            delete $blocked{$ip};
        }

        # count the keys explicitly; a hash in numeric context does not
        # yield the number of entries on every perl version
        if (scalar(keys %{$conn{$ip}}) > $::MAX_CONN_IP) {
            $self->slog(2, "blocked ip $ip");
            $self->err_blocked;
        }

        $req =~ /^(?:\015\012)?
                  (GET|HEAD) \040+
                  ([^\040]+) \040+
                  HTTP\/([0-9]+\.[0-9]+)
                  \015\012/gx
            or $self->err(405, "method not allowed", { Allow => "GET,HEAD" });

        $self->{method}  = $1;
        $self->{uri}     = $2;
        $self->{version} = $3;

        # 505 is "HTTP Version Not Supported"
        $self->{version} =~ /^1\./
            or $self->err(505, "http protocol version $self->{version} not supported");

        # parse headers
        {
            my (%hdr, $h, $v);

            # \G continues where the request-line match stopped.  Repeated
            # headers are joined with ",".  \011 (tab) and \040 (space) are
            # the whitespace allowed after the colon and at the start of a
            # continuation line.
            $hdr{lc $1} .= ",$2"
                while $req =~ /\G
                      ([^:\000-\040]+):
                      [\011\040]*
                      ((?: [^\015\012]+ | \015\012[\011\040] )*)
                      \015\012
                   /gxc;

            $req =~ /\G\015\012$/
                or $self->err(400, "bad request");

            # strip the leading "," added above
            $self->{h}{$h} = substr $v, 1
                while ($h, $v) = each %hdr;
        }

        $self->{server_port} = $self->{h}{host} =~ s/:([0-9]+)$// ? $1 : 80;

        weaken ($uri{$self->{remote_addr}}{$self->{uri}}{$self*1} = $self);

        $self->map_uri;
        $self->respond;

        $self->eoconn;

        # connection options are case-insensitive tokens
        last if $self->{h}{connection} =~ /close/i || $self->{version} lt "1.1";

        $self->slog(9, "persistent connection [".$self->{h}{"user-agent"}."][$self->{reqs}]");
        $fh->timeout($::PER_TIMEOUT);
    }
}
290
# uri => path mapping
#
# Translates the request uri into a file system path below
# "$::DOCROOT/<host>", where <host> is the Host header or "default".
# Stores the cleaned-up uri in $self->{name} and the path in $self->{path}
# and finally runs access_check.  Requests that could address something
# outside the host's directory are answered with 400 through err.
sub map_uri {
    my $self = shift;
    my $host = $self->{h}{host} || "default";
    my $uri = $self->{uri};

    # the Host header is client-supplied and becomes a directory name, so it
    # must be a single, ordinary path component
    ($host eq "." || $host eq ".." || $host =~ m%[/\000]%)
        and $self->err(400, "bad request");

    # some massaging, also makes it more secure
    $uri =~ s/%([0-9a-fA-F][0-9a-fA-F])/chr hex $1/ge;

    # a NUL byte would cut the path short in the system calls, and a uri
    # without leading slash would be glued onto the host directory's name
    ($uri =~ /\000/ || $uri !~ m%^/%)
        and $self->err(400, "bad request");

    $uri =~ s%//+%/%g;                          # collapse runs of slashes
    $uri =~ s%/\.(?=/|$)%%g;                    # drop "/." components
    1 while $uri =~ s%/[^/]+/\.\.(?=/|$)%%;     # resolve "/x/.."

    # whatever ".." is left at the front would climb out of the tree
    $uri =~ m%^/?\.\.(?=/|$)%
        and $self->err(400, "bad request");

    $self->{name} = $uri;

    # now do the path mapping
    $self->{path} = "$::DOCROOT/$host$uri";

    $self->access_check;
}
313
# Return (dotted-quad address, port) of the local end of the client socket.
# Raises a 500 error through err when the socket name cannot be unpacked.
sub server_address {
    my $self = shift;

    my @sockaddr = unpack_sockaddr_in($self->{fh}->getsockname)
        or $self->err(500, "unable to get socket name");
    my ($port, $iaddr) = @sockaddr;

    return (inet_ntoa($iaddr), $port);
}
320
# Host name of this server as seen by the client: the Host request header
# when one was sent, otherwise the local address of the socket.
sub server_host {
    my $self = shift;

    return $self->{h}{host}
        if exists $self->{h}{host};

    return (($self->server_address)[0]);
}
329
# "host" or "host:port" for building absolute URLs.  Host and port come from
# the Host request header (port as stored in $self->{server_port}) when the
# header exists, otherwise from the local socket address.  The default
# port 80 is left out.
sub server_hostport {
    my $self = shift;

    my ($host, $port) = exists $self->{h}{host}
        ? ($self->{h}{host}, $self->{server_port})
        : $self->server_address;

    return $port == 80 ? $host."" : $host.":$port";
}
341
# Run the program $path as a CGI-like child process.
#
#   $self->_cgi($path)
#
# The child gets the client socket as STDOUT, changes into $::DOCROOT, sets
# a few environment variables and executes $path.  The parent returns right
# after the fork and does not wait for the child.  A failed fork is reported
# to the client as a 500 error through err.
sub _cgi {
    my $self = shift;
    my $path = shift;

    # no two-way xxx supported
    my $pid = fork;

    # fork returns undef on failure, which must not be mistaken for the
    # child's return value 0
    defined $pid
        or $self->err(500, "unable to fork");

    if ($pid == 0) {
        open STDOUT, ">&".fileno($self->{fh})
            or Coro::State::_exit(0);
        if (chdir $::DOCROOT) {
            $ENV{SERVER_SOFTWARE} = "thttpd-myhttpd"; # we are thttpd-alike
            $ENV{HTTP_HOST} = $self->server_host;
            $ENV{HTTP_PORT} = $self->{server_port};
            $ENV{SCRIPT_NAME} = $self->{name};
            # the indirect-object form never hands $path to a shell
            exec { $path } $path;
        }
        # only reached when chdir or exec failed
        Coro::State::_exit(0);
    }

    return;
}
361
# Answer the current request for $self->{path}.
#
# Readable directories are redirected to their "/"-terminated form, or
# answered with index.html or a generated listing.  Readable plain files are
# sent by handle_file, unless they are executable, which yields 403.
# Everything else is a 404.  The stat result of the path is kept in
# $self->{stat}.
sub respond {
    my $self = shift;
    my $path = $self->{path};

    stat $path
        or $self->err(404, "not found");

    $self->{stat} = [stat _];

    # only the part of If-Modified-Since before the first ";" is a date
    # (presumably some clients append extra parameters there)
    my $ims = $self->{h}{"if-modified-since"} =~ /^([^;]+)/
        ? str2time $1 : 0;

    if (-d _ && -r _) {
        # directory
        if ($path !~ /\/$/) {
            # create a redirect to get the trailing "/"
            my $host = $self->server_hostport;
            $self->err(301, "moved permanently", { Location => "http://$host$self->{uri}/" });
        } else {
            $ims < $self->{stat}[9]
                or $self->err(304, "not modified");

            # HEAD is handled here as well: response and handle_file leave
            # the body out for it, and without any answer the client would
            # wait forever
            if (-r "$path/index.html") {
                $self->{path} .= "/index.html";
                $self->handle_file;
            } else {
                $self->handle_dir;
            }
        }
    } elsif (-f _ && -r _) {
        -x _ and $self->err(403, "forbidden");
        $self->handle_file;
    } else {
        $self->err(404, "not found");
    }
}
401
# Send the directory index produced by diridx as a text/html response.
sub handle_dir {
    my $self = shift;

    my $idx = $self->diridx;
    my %hdr = (
        "Content-Type"   => "text/html",
        "Content-Length" => length $idx,
    );

    $self->response(200, "ok", \%hdr, $idx);
}
413
# Send the file $self->{path}, honouring a "Range: bytes=..." header.
#
# Relies on the stat buffer "_" still describing the file (the caller has
# just stat'ed or -r tested it).  Of several requested ranges only the first
# satisfiable one is served (206).  A syntactically invalid range makes the
# header being ignored (200, whole file), and a header without any
# satisfiable range yields 416.  With $::NO_SEGMENTED set, a range request
# not starting at 0 is refused with 400 while another request from the same
# address for the same uri is registered in %uri.  The body is only sent
# for GET and is read with aio_read in chunks of at most $::BUFSIZE bytes.
sub handle_file {
    my $self = shift;
    my $length = -s _;
    my $hdr = {
        "Last-Modified" => time2str((stat _)[9]),
    };

    my @code = (200, "ok");
    my ($l, $h) = (0, $length - 1);     # first and last byte to send

    if ($self->{h}{range} =~ /^bytes=(.*)$/) {
        my ($range, $malformed);

        for my $spec (split /,/, $1) {
            my ($first, $last);

            if ($spec =~ /^-(\d+)$/) {
                # suffix range: the last N bytes, at most the whole file
                $first = $1 < $length ? $length - $1 : 0;
                $last  = $length - 1;
            } elsif ($spec =~ /^(\d+)-(\d*)$/) {
                # a missing end or one beyond the file means "up to the end"
                $first = $1;
                $last  = ($2 ne "" && $2 < $length) ? $2 : $length - 1;
            } else {
                $malformed = 1;
                last;
            }

            # $last == $first is a valid one-byte range
            if ($first >= 0 && $first < $length && $last >= $first) {
                $range = [$first, $last];
                last;
            }
        }

        if (!$malformed) {
            if (!$range) {
                $hdr->{"Content-Range"} = "bytes */$length";
                $self->slog(9, "not satisfiable($self->{h}{range}|".$self->{h}{"user-agent"}.")");
                $self->err(416, "not satisfiable", $hdr);
            }

            ($l, $h) = @$range;

            # check for segmented downloads
            if ($l && $::NO_SEGMENTED) {
                if (scalar(keys %{$uri{$self->{remote_addr}}{$self->{uri}}}) > 1) {
                    Coro::Event::do_timer(after => 15);

                    $self->err(400, "segmented downloads are not allowed");
                }
            }

            $hdr->{"Content-Range"} = "bytes $l-$h/$length";
            @code = (206, "partial content");
            $length = $h - $l + 1;
        }
    }

    # capture in list context so that a path without extension cannot pick
    # up a stale $1 from an earlier match
    my ($ext) = $self->{path} =~ /\.([^.\/]+)$/;
    $hdr->{"Content-Type"} = (defined $ext && $mimetype{lc $ext}) || "application/octet-stream";
    $hdr->{"Content-Length"} = $length;

    $self->response(@code, $hdr, "");

    if ($self->{method} eq "GET") {
        my ($fh, $buf, $r);
        my $current = $Coro::current;
        open $fh, "<", $self->{path}
            or die "$self->{path}: late open failure ($!)";

        my $left = $h - $l + 1;         # bytes that still have to be sent

        while ($left > 0) {
            # start the read, then sleep until the completion callback has
            # stored the result and made this coroutine ready again
            aio_read($fh, $l, ($left > $::BUFSIZE ? $::BUFSIZE : $left),
                     $buf, 0, sub {
                         $r = $_[0];
                         $current->ready;
                         $scheduler->now;
                     });
            Coro::schedule();

            # 0 is end of file, a negative value a read error
            last unless $r > 0;

            my $w = $self->{fh}->syswrite($buf)
                or last;
            $::written += $w;
            $self->{written} += $w;
            $l    += $r;
            $left -= $r;
        }

        close $fh;
    }
}
503
504 1;