1 |
use Coro; |
2 |
use Coro::Semaphore; |
3 |
use Coro::Event; |
4 |
use Coro::Socket; |
5 |
|
6 |
no utf8; |
7 |
use bytes; |
8 |
|
9 |
# at least on my machine, this thingy serves files |
10 |
# quite a bit faster than apache, ;) |
11 |
# and quite a bit slower than thttpd :( |
12 |
|
13 |
# Ignore SIGPIPE so that writing to a connection the peer has already
# closed reports an error instead of terminating the whole process.
$SIG{'PIPE'} = 'IGNORE';
14 |
|
15 |
# Write one log line to standard output.
#
#   $level  - verbosity level of the message (accepted, currently unused)
#   $format - printf-style format string
#   @args   - values substituted into $format
#
# The line is prefixed with "---: " and terminated with a newline.
sub slog {
    my ($level, $format, @args) = @_;
    printf "---: $format\n", @args;
}
20 |
|
21 |
# Semaphore created with $MAX_CONNECTS permits: the accept loop takes one
# permit per accepted connection and handler() returns it when done.
my $connections = Coro::Semaphore->new($MAX_CONNECTS);

# Accepted connections (argument lists for conn->new) not yet picked up
# by a handler coroutine.
my @newcons;

# Handler coroutines that found no work and parked themselves.
my @pool;
25 |
|
26 |
# one "execution thread"
#
# Body of a worker coroutine. It repeatedly takes a pending connection
# from @newcons, serves it through conn->new(...)->handle and releases the
# connection slot afterwards. When no connection is pending the coroutine
# parks itself in @pool and yields, unless the pool already holds
# $MAX_POOL idle workers, in which case it terminates.
sub handler {
    while () {
        my $new = pop @newcons;
        if ($new) {
            eval {
                conn->new(@$new)->handle;
            };
            # conn::err reports HTTP errors by dying with an object; those
            # were already answered. Only plain-string exceptions are
            # logged. The text is passed as an argument rather than as the
            # printf format because it may contain "%" characters.
            slog(1, "%s", "$@") if $@ && !ref $@;
            $connections->up;
        } else {
            last if @pool >= $MAX_POOL;
            push @pool, $Coro::current;
            schedule;
        }
    }
}
43 |
|
44 |
# Listening socket bound to $SERVER_HOST:$SERVER_PORT; startup is aborted
# when it cannot be created.
my $http_port = Coro::Socket->new(
    LocalAddr => $SERVER_HOST,
    LocalPort => $SERVER_PORT,
    ReuseAddr => 1,
    Listen    => 50,
) or die "unable to start server";

# remember it together with any other listening sockets
push @listen_sockets, $http_port;
52 |
|
53 |
# the "main thread"
#
# Accept loop: waits for a free connection slot, accepts a client, queues
# it in @newcons and hands it to an idle handler coroutine from @pool, or
# starts a new handler when none is idle.
async {
    slog(1, "accepting connections");

    for (;;) {
        # blocks until fewer than $MAX_CONNECTS connections are active
        $connections->down;

        my @accepted = $http_port->accept;
        push @newcons, \@accepted;
        #slog 3, "accepted @$connections ".scalar(@pool);

        # cached timestamp used by the connection objects
        $::NOW = time;

        unless (@pool) {
            async \&handler;
            next;
        }

        my $idle = pop @pool;
        $idle->ready;
    }
};
69 |
|
70 |
package conn; |
71 |
|
72 |
use Socket; |
73 |
use HTTP::Date; |
74 |
use Convert::Scalar 'weaken'; |
75 |
|
76 |
# Registries shared by all connection objects.
our %conn;     # $conn{ip}{id} => connobj (weak); id is the object's numeric address
our %uri;      # $uri{ip}{uri}{id} => connobj (weak); filled once a request was parsed
our %blocked;  # $blocked{ip} => time until which the address stays blocked
our %mimetype; # $mimetype{extension} => MIME type, see read_mimetypes
79 |
|
80 |
# Fill %mimetype from the file "mime_types" in the current directory.
#
# A usable line has the form "<extension><TAB(s)><type>". Lines whose
# first field starts with "#" or with whitespace are skipped. Extensions
# are stored lower-cased, and single-character extensions are accepted.
# When the file cannot be opened a notice is printed and %mimetype is
# left as it was.
sub read_mimetypes {
    if (open my $types, "<", "mime_types") {
        while (my $line = <$types>) {
            if ($line =~ /^([^#\s]\S*)\t+(\S+)$/) {
                $mimetype{lc $1} = $2;
            }
        }
        close $types;
    } else {
        print "cannot open mime_types\n";
    }
}
92 |
|
93 |
# load the MIME type table once, when this file is loaded
read_mimetypes();
94 |
|
95 |
# Create the connection object for a freshly accepted client.
#
#   $class    - class to bless the object into
#   $peername - packed sockaddr_in of the client
#   $fh       - socket handle of the client
#
# Stores the client's dotted-quad address and the current $::NOW in the
# object, registers a weak reference to it in %conn and increments
# $::conns. If the peer name cannot be decoded a 500 error is reported
# through err, which dies.
sub new {
    my ($class, $peername, $fh) = @_;
    my $self = bless { fh => $fh }, $class;

    my (undef, $iaddr) = unpack_sockaddr_in($peername)
        or $self->err(500, "unable to decode peername");

    $self->{remote_addr} = inet_ntoa($iaddr);
    $self->{time}        = $::NOW;

    # enter ourselves into various lists
    weaken($conn{ $self->{remote_addr} }{ $self * 1 } = $self);

    ++$::conns;

    return $self;
}
113 |
|
114 |
# Destructor: decrements $::conns and removes the object from the %conn
# and %uri registries.
#
# Per-address and per-URI hashes that become empty are removed as well,
# so the registries do not grow with every distinct client address.
# Nothing is looked up for fields the object never set (no remote address
# or no parsed URI), which avoids creating empty registry entries.
sub DESTROY {
    my $self = shift;
    my $id   = $self * 1;    # numeric address, the key used when registering

    $::conns--;

    my $addr = $self->{remote_addr};
    return unless defined $addr;

    if (my $peers = $conn{$addr}) {
        delete $peers->{$id};
        delete $conn{$addr} unless %$peers;
    }

    if (my $by_uri = $uri{$addr}) {
        my $request_uri = $self->{uri};
        if (defined $request_uri and my $same = $by_uri->{$request_uri}) {
            delete $same->{$id};
            delete $by_uri->{$request_uri} unless %$same;
        }
        delete $uri{$addr} unless %$by_uri;
    }
}
122 |
|
123 |
# Log a message on behalf of this connection.
#
#   $level   - verbosity level, passed through to main::slog
#   $message - plain message text
#
# The message is prefixed with the client's address. Address and message
# are handed over as printf arguments, not as part of the format string,
# so a "%" inside either is printed literally.
sub slog {
    my ($self, $level, $message) = @_;
    main::slog($level, "%s> %s", $self->{remote_addr}, $message);
}
127 |
|
128 |
# Send a complete HTTP/1.0 response head, optionally followed by a body.
#
#   $code, $msg - status code and reason phrase
#   $hdr        - hash reference with additional header fields (may be undef)
#   $content    - body text; omitted when undefined or for HEAD requests
#
# "Connection: close" and a "Date" header built from $::NOW are always
# added. One access-log line is printed to STDERR. $self->{written} is
# increased by the number of bytes handed to the socket, matching the
# byte counting done in handle_file. Returns the updated $self->{written}.
sub response {
    my ($self, $code, $msg, $hdr, $content) = @_;
    my $res = "HTTP/1.0 $code $msg\015\012";

    $res .= "Connection: close\015\012";
    $res .= "Date: ".(time2str($::NOW))."\015\012"; # slow? nah. :(

    while (my ($h, $v) = each %$hdr) {
        $res .= "$h: $v\015\012"
    }
    $res .= "\015\012";

    $res .= $content if defined $content and $self->{method} ne "HEAD";

    print STDERR "$self->{remote_addr} \"$self->{uri}\" $code ".$hdr->{"Content-Length"}." \"$self->{h}{referer}\"\n";#d#

    # print only reports success or failure, so count the bytes ourselves
    my $sent = print {$self->{fh}} $res;
    $self->{written} += $sent ? length $res : 0;
}
147 |
|
148 |
# Send an error response and abort processing of the current request.
#
#   $code, $msg - status code and reason phrase
#   $hdr        - optional hash reference with extra headers
#   $content    - optional body; when undefined the body is "$code $msg"
#                 and the Content-Type/Content-Length headers are set to
#                 describe that plain-text body
#
# Never returns: after the response was sent it dies with an object
# blessed into class "err".
sub err {
    my ($self, $code, $msg, $hdr, $content) = @_;

    if (!defined $content) {
        $content = "$code $msg";
        $hdr->{"Content-Type"}   = "text/plain";
        $hdr->{"Content-Length"} = length $content;
    }

    $self->response($code, $msg, $hdr, $content);

    die bless {}, 'err';
}
162 |
|
163 |
# Block the client's address and answer with the "blocked" error page.
#
# The address is (re)entered into %blocked with an expiry of
# $::NOW + $::BLOCKTIME, the coroutine waits on a 15 second timer and then
# sends a 401 response through err, which dies. Arguments other than the
# object itself are ignored.
sub err_blocked {
    my $self = shift;
    my $ip   = $self->{remote_addr};

    # every call renews the block
    my $until = $::NOW + $::BLOCKTIME;
    $blocked{$ip} = $until;
    my $time = time2str($until);

    # delay the answer
    Coro::Event::do_timer(after => 15);

    my %headers = (
        "Content-Type" => "text/html",
        "Retry-After"  => $::BLOCKTIME,
    );

    my $page = <<EOF;
<html><p>
You have been blocked because you opened too many connections. You
may retry at</p>

<p><blockquote>$time.</blockquote></p>

<p>Until then, each new access will renew the block. You might want to have a
look at the <a href="http://www.goof.com/pcg/marc/animefaq.html">FAQ</a>.</p>
</html>
EOF

    $self->err(401, "too many connections", \%headers, $page);
}
187 |
|
188 |
# Serve one request on this connection.
#
# Reads the request head (up to the empty line) under $::REQ_TIMEOUT,
# enforces the per-address block list and connection limit, parses the
# request line and the header fields into $self->{method}, $self->{uri}
# and $self->{h}{lower-cased-name}, derives $self->{server_port} from the
# Host header, registers the object in %uri and finally calls map_uri and
# respond. All failures are reported through err, which dies.
sub handle {
    my $self = shift;
    my $fh = $self->{fh};

    #while() {
    $self->{h} = {};

    # read request and parse first line
    $fh->timeout($::REQ_TIMEOUT);
    my $req = $fh->readline("\015\012\015\012");
    $fh->timeout($::RES_TIMEOUT);

    defined $req
        or $self->err(408, "request timeout");

    my $ip = $self->{remote_addr};

    # Refuse only addresses whose block has not expired yet; an expired
    # entry is dropped and the request is served normally.
    if ($blocked{$ip}) {
        $self->err_blocked($blocked{$ip})
            if $blocked{$ip} > $::NOW;

        delete $blocked{$ip};
    }

    # count the registered connections explicitly; a hash in numeric
    # context is not a key count on all perl versions
    if (scalar(keys %{ $conn{$ip} }) > $::MAX_CONN_IP) {
        $self->slog(2, "blocked ip $ip");
        $self->err_blocked;
    }

    $req =~ /^(?:\015\012)?
              (GET|HEAD) \040+
              ([^\040]+) \040+
              HTTP\/([0-9]+\.[0-9]+)
              \015\012/gx
        or $self->err(405, "method not allowed", { Allow => "GET,HEAD" });

    # save the captures before any other match can overwrite them
    my ($method, $request_uri, $version) = ($1, $2, $3);

    $self->{method} = $method;
    $self->{uri}    = $request_uri;

    # only HTTP/1.x requests are understood
    $version =~ /^1\./
        or $self->err(505, "http protocol version not supported");

    # parse headers
    {
        my (%hdr, $h, $v);

        # Continue right after the request line (\G). Repeated fields
        # are joined with ","; tab (\011) and space (\040) may follow
        # the colon and start a continuation line.
        $hdr{lc $1} .= ",$2"
            while $req =~ /\G
                ([^:\000-\040]+):
                [\011\040]*
                ((?: [^\015\012]+ | \015\012[\011\040] )*)
                \015\012
            /gxc;

        $req =~ /\G\015\012$/
            or $self->err(400, "bad request");

        # strip the leading "," added by the accumulation above
        $self->{h}{$h} = substr $v, 1
            while ($h, $v) = each %hdr;
    }

    # Split an optional ":port" off the Host header. The header is only
    # touched when it was sent, so a missing header stays missing.
    my $host = $self->{h}{host};
    if (defined $host) {
        $self->{server_port} = $host =~ s/:([0-9]+)$// ? $1 : 80;
        $self->{h}{host}     = $host;
    } else {
        $self->{server_port} = 80;
    }

    weaken ($uri{$self->{remote_addr}}{$self->{uri}}{$self*1} = $self);

    $self->map_uri;
    $self->respond;
    #}
}
258 |
|
259 |
# uri => path mapping
#
# Translates the request URI into a file system path below
# "$::DOCROOT/<host>", where <host> is the Host header or "default".
# Percent escapes are decoded, repeated slashes collapsed and "." / ".."
# segments resolved. The cleaned URI is stored in $self->{name}, the
# resulting path in $self->{path}, and access_check is called afterwards.
# A 400 error is reported (err dies) when the URI still climbs above the
# root, when it contains a NUL byte, or when the host name is not a
# single harmless path component.
sub map_uri {
    my $self = shift;
    my $host = $self->{h}{host} || "default";
    my $uri = $self->{uri};

    # The host name is supplied by the client and becomes a directory
    # name below: refuse path separators, NUL bytes and "." / "..".
    if ($host =~ m{[/\000]} || $host =~ m{^\.\.?\z}) {
        $self->err(400, "bad request");
    }

    # some massaging, also makes it more secure
    $uri =~ s/%([0-9a-fA-F][0-9a-fA-F])/chr hex $1/ge;
    $uri =~ s%//+%/%g;
    $uri =~ s%/\.(?=/|$)%%g;
    1 while $uri =~ s%/[^/]+/\.\.(?=/|$)%%;

    if ($uri =~ m%^/?\.\.(?=/|$)% || $uri =~ /\000/) {
        $self->err(400, "bad request");
    }

    $self->{name} = $uri;

    # now do the path mapping
    $self->{path} = "$::DOCROOT/$host$uri";

    $self->access_check;
}
281 |
|
282 |
# Return the local end of the connection as the list (address, port),
# with the address in dotted-quad notation. A 500 error is reported
# through err (which dies) when the socket name cannot be unpacked.
sub server_address {
    my $self = shift;

    my ($local_port, $local_addr) = unpack_sockaddr_in($self->{fh}->getsockname)
        or $self->err(500, "unable to get socket name");

    return (inet_ntoa($local_addr), $local_port);
}
288 |
|
289 |
# Return the host name this request was addressed to: the Host header
# when the client sent a non-empty one, otherwise the local address of
# the socket as reported by server_address.
sub server_host {
    my $self = shift;
    my $host = $self->{h}{host};

    # an undefined or empty header value is treated like a missing header
    return $host if defined $host && length $host;

    return ($self->server_address)[0];
}
297 |
|
298 |
# Return "host" or "host:port" for use in absolute URLs; the port is
# left out when it is 80. Host and port come from the Host header (and
# $self->{server_port}) when the client sent a non-empty one, otherwise
# from server_address.
sub server_hostport {
    my $self = shift;
    my ($host, $port);

    # an undefined or empty header value is treated like a missing header
    if (defined $self->{h}{host} && length $self->{h}{host}) {
        ($host, $port) = ($self->{h}{host}, $self->{server_port});
    } else {
        ($host, $port) = $self->server_address;
    }

    $port = $port == 80 ? "" : ":$port";
    return $host.$port;
}
309 |
|
310 |
# Run the program $path as a CGI-style child process whose standard
# output is the client connection.
#
#   $path - program to execute
#
# The child changes into $::DOCROOT, exports SERVER_SOFTWARE, HTTP_HOST,
# HTTP_PORT and SCRIPT_NAME and execs the program; if any preparation
# step or the exec fails the child exits at once. The parent returns
# immediately. A failed fork is reported as a 500 error through err
# (which dies) instead of being mistaken for the child.
sub _cgi {
    my $self = shift;
    my $path = shift;

    my $pid = fork;
    defined $pid
        or $self->err(500, "unable to fork");

    # no two-way xxx supported
    if ($pid == 0) {
        if (open(STDOUT, ">&".fileno($self->{fh})) and chdir $::DOCROOT) {
            $ENV{SERVER_SOFTWARE} = "thttpd-myhttpd"; # we are thttpd-alike
            $ENV{HTTP_HOST}       = $self->server_host;
            $ENV{HTTP_PORT}       = $self->{server_port};
            $ENV{SCRIPT_NAME}     = $self->{name};
            exec $path;
        }
        # only reached when the setup or the exec failed
        Coro::State::_exit(0);
    }
}
329 |
|
330 |
# Answer the request for $self->{path}.
#
# Readable regular files are sent with handle_file unless they are
# executable (403). Readable directories without a trailing slash get a
# 301 redirect to the slash-terminated URL; otherwise a GET is answered
# with the directory's index.html when that is readable, else with
# handle_dir. A directory not modified since the If-Modified-Since date
# yields 304. Everything else is 404. All errors go through err, which
# dies.
sub respond {
    my $self = shift;
    my $path = $self->{path};

    # this stat fills the "_" cache used by the file tests below
    stat $path
        or $self->err(404, "not found");

    $self->{stat} = [stat _];

    # idiotic netscape sends idiotic headers AGAIN
    my $ims = 0;
    if ($self->{h}{"if-modified-since"} =~ /^([^;]+)/) {
        $ims = str2time($1);
    }

    my $is_dir = -d _ && -r _;

    unless ($is_dir) {
        # plain file, or nothing we can serve
        -f _ && -r _
            or $self->err(404, "not found");
        -x _ and $self->err(403, "forbidden");
        return $self->handle_file;
    }

    # directory
    if ($path !~ /\/$/) {
        # create a redirect to get the trailing "/"
        my $host = $self->server_hostport;
        $self->err(301, "moved permanently", { Location => "http://$host$self->{uri}/" });
    }

    $ims < $self->{stat}[9]
        or $self->err(304, "not modified");

    return unless $self->{method} eq "GET";

    # note: this file test replaces the "_" cache with index.html's data
    if (-r "$path/index.html") {
        $self->{path} .= "/index.html";
        return $self->handle_file;
    }

    return $self->handle_dir;
}
369 |
|
370 |
# Send the directory index produced by diridx as a 200 text/html
# response.
sub handle_dir {
    my $self    = shift;
    my $listing = $self->diridx;

    my %headers = (
        "Content-Type"   => "text/html",
        "Content-Length" => length $listing,
    );

    $self->response(200, "ok", \%headers, $listing);
}
381 |
|
382 |
# Send the file $self->{path}, honouring a "Range: bytes=..." header.
#
# Size and modification time are taken from the "_" stat cache, so the
# caller must have stat'ed the file immediately before.
#
# Range handling: the first satisfiable range of the list is served as
# 206 with a Content-Range header. A syntactically invalid range makes
# the whole header be ignored (full 200 response). If no range is
# satisfiable a 416 error is sent. When $::NO_SEGMENTED is set, a range
# request not starting at byte 0 is refused with 400 (after a 15 second
# timer) if another connection from the same address is registered for
# the same URI.
#
# The Content-Type is looked up in %mimetype by the lower-cased file
# extension and defaults to "application/octet-stream". For GET requests
# the selected bytes are copied to the client in chunks of at most
# $::BUFSIZE, and $::written / $self->{written} are increased by the
# bytes written. Dies with a message when the file cannot be opened or
# positioned.
sub handle_file {
    my $self = shift;
    my $length = -s _;
    my $hdr = {
        "Last-Modified" => time2str((stat _)[9]),
    };

    my @code = (200, "ok");

    # first and last byte to send; the whole file unless a range applies
    my ($l, $h) = (0, $length - 1);

    if ($self->{h}{range} =~ /^bytes=(.*)$/) {
        my ($partial, $malformed);

        for (split /,/, $1) {
            my ($first, $last);

            if (/^-(\d+)$/) {
                # suffix range: the final N bytes, at most the whole file
                ($first, $last) = ($length - $1, $length - 1);
                $first = 0 if $first < 0;
            } elsif (/^(\d+)-(\d*)$/) {
                # an open or over-long end is clamped to the last byte
                ($first, $last) = ($1 + 0, ($2 ne "" && $2 < $length) ? $2 + 0 : $length - 1);
            } else {
                $malformed = 1;
                last;
            }

            # a single-byte range (first == last) is valid
            if ($first >= 0 && $first < $length && $last >= $first) {
                ($l, $h, $partial) = ($first, $last, 1);
                last;
            }
        }

        if ($malformed) {
            # ignore the Range header and send the complete file
        } elsif (!$partial) {
            $hdr->{"Content-Range"} = "bytes */$length";
            $self->err(416, "not satisfiable", $hdr);
        } else {
            # check for segmented downloads
            if ($l && $::NO_SEGMENTED) {
                if (scalar(keys %{ $uri{$self->{remote_addr}}{$self->{uri}} }) > 1) {
                    Coro::Event::do_timer(after => 15);

                    $self->err(400, "segmented downloads are not allowed");
                }
            }

            $hdr->{"Content-Range"} = "bytes $l-$h/$length";
            @code = (206, "partial content");
            $length = $h - $l + 1;
        }
    }

    # capture into a lexical: $1 would be stale when the path has no
    # extension; the extension must not span a directory separator
    my ($ext) = $self->{path} =~ /\.([^.\/]+)$/;
    $hdr->{"Content-Type"} = (defined $ext && $mimetype{lc $ext}) || "application/octet-stream";
    $hdr->{"Content-Length"} = $length;

    $self->response(@code, $hdr, "");

    if ($self->{method} eq "GET") {
        open my $fh, "<", $self->{path}
            or die "$self->{path}: late open failure ($!)";

        if ($l) {
            sysseek $fh, $l, 0
                or die "$self->{path}: cannot seek to $l ($!)";
        }

        my $remaining = $h - $l + 1;
        my $buf;

        while ($remaining > 0) {
            my $want = $remaining > $::BUFSIZE ? $::BUFSIZE : $remaining;

            # stop on end of file (the file shrank) or on a read error
            my $got = sysread $fh, $buf, $want
                or last;
            $remaining -= $got;

            my $w = $self->{fh}->syswrite($buf)
                or last;
            $::written += $w;
            $self->{written} += $w;
        }

        close $fh;
    }
}
455 |
|
456 |
1; |