1 | use Coro; |
1 | use Coro; |
2 | use Coro::Semaphore; |
2 | use Coro::Semaphore; |
3 | use Coro::Event; |
3 | use Coro::Event; |
4 | use Coro::Socket; |
4 | use Coro::Socket; |
|
|
5 | use Coro::Signal; |
|
|
6 | |
|
|
7 | use HTTP::Date; |
|
|
8 | use POSIX (); |
|
|
9 | |
|
|
10 | use Compress::Zlib (); |
5 | |
11 | |
6 | no utf8; |
12 | no utf8; |
7 | use bytes; |
13 | use bytes; |
8 | |
14 | |
9 | # at least on my machine, this thingy serves files |
15 | # at least on my machine, this thingy serves files |
… | |
… | |
11 | # and quite a bit slower than thttpd :( |
17 | # and quite a bit slower than thttpd :( |
12 | |
18 | |
13 | $SIG{PIPE} = 'IGNORE'; |
19 | $SIG{PIPE} = 'IGNORE'; |
14 | |
20 | |
15 | our $accesslog; |
21 | our $accesslog; |
|
|
22 | our $errorlog; |
|
|
23 | |
|
|
24 | our $NOW; |
|
|
25 | our $HTTP_NOW; |
|
|
26 | |
|
|
27 | Event->timer(interval => 1, hard => 1, cb => sub { |
|
|
28 | $NOW = time; |
|
|
29 | $HTTP_NOW = time2str $NOW; |
|
|
30 | })->now; |
|
|
31 | |
|
|
32 | if ($ERROR_LOG) { |
|
|
33 | use IO::Handle; |
|
|
34 | open $errorlog, ">>$ERROR_LOG" |
|
|
35 | or die "$ERROR_LOG: $!"; |
|
|
36 | $errorlog->autoflush(1); |
|
|
37 | } |
16 | |
38 | |
17 | if ($ACCESS_LOG) { |
39 | if ($ACCESS_LOG) { |
18 | use IO::Handle; |
40 | use IO::Handle; |
19 | open $accesslog, ">>$ACCESS_LOG" |
41 | open $accesslog, ">>$ACCESS_LOG" |
20 | or die "$ACCESS_LOG: $!"; |
42 | or die "$ACCESS_LOG: $!"; |
… | |
… | |
22 | } |
44 | } |
23 | |
45 | |
24 | sub slog { |
46 | sub slog { |
25 | my $level = shift; |
47 | my $level = shift; |
26 | my $format = shift; |
48 | my $format = shift; |
|
|
49 | my $NOW = (POSIX::strftime "%Y-%m-%d %H:%M:%S", gmtime $::NOW); |
27 | printf "---: $format\n", @_; |
50 | printf "$NOW: $format\n", @_; |
|
|
51 | printf $errorlog "$NOW: $format\n", @_ if $errorlog; |
28 | } |
52 | } |
29 | |
53 | |
30 | my $connections = new Coro::Semaphore $MAX_CONNECTS; |
54 | our $connections = new Coro::Semaphore $MAX_CONNECTS || 250; |
|
|
55 | our $httpevent = new Coro::Signal; |
|
|
56 | |
|
|
57 | our $queue_file = new transferqueue $MAX_TRANSFERS; |
|
|
58 | our $queue_index = new transferqueue 10; |
|
|
59 | |
|
|
60 | our $tbf_top = new tbf rate => $TBF_RATE || 100000; |
|
|
61 | |
|
|
62 | my $unused_bytes = 0; |
|
|
63 | my $unused_last = time; |
|
|
64 | |
|
|
65 | sub unused_bandwidth { |
|
|
66 | $unused_bytes += $_[0]; |
|
|
67 | if ($unused_last < $NOW - 30 && $unused_bytes / ($NOW - $unused_last) > 50000) { |
|
|
68 | $unused_last = $NOW; |
|
|
69 | $unused_bytes = 0; |
|
|
70 | $queue_file->force_wake_next; |
|
|
71 | slog 1, "forced filetransfer due to unused bandwidth"; |
|
|
72 | } |
|
|
73 | } |
31 | |
74 | |
32 | my @newcons; |
75 | my @newcons; |
33 | my @pool; |
76 | my @pool; |
34 | |
77 | |
35 | # one "execution thread" |
78 | # one "execution thread" |
36 | sub handler { |
79 | sub handler { |
37 | while () { |
80 | while () { |
38 | my $new = pop @newcons; |
|
|
39 | if ($new) { |
81 | if (@newcons) { |
40 | eval { |
82 | eval { |
41 | conn->new(@$new)->handle; |
83 | conn->new(@{pop @newcons})->handle; |
42 | }; |
84 | }; |
43 | slog 1, "$@" if $@ && !ref $@; |
85 | slog 1, "$@" if $@ && !ref $@; |
|
|
86 | |
|
|
87 | $httpevent->broadcast; # only for testing, but doesn't matter much |
|
|
88 | |
44 | $connections->up; |
89 | $connections->up; |
45 | } else { |
90 | } else { |
46 | last if @pool >= $MAX_POOL; |
91 | last if @pool >= $MAX_POOL; |
47 | push @pool, $Coro::current; |
92 | push @pool, $Coro::current; |
48 | schedule; |
93 | schedule; |
49 | } |
94 | } |
50 | } |
95 | } |
|
|
96 | } |
|
|
97 | |
|
|
98 | sub listen_on { |
|
|
99 | my $listen = $_[0]; |
|
|
100 | |
|
|
101 | push @listen_sockets, $listen; |
|
|
102 | |
|
|
103 | # the "main thread" |
|
|
104 | async { |
|
|
105 | slog 1, "accepting connections"; |
|
|
106 | while () { |
|
|
107 | $connections->down; |
|
|
108 | push @newcons, [$listen->accept]; |
|
|
109 | #slog 3, "accepted @$connections ".scalar(@pool); |
|
|
110 | if (@pool) { |
|
|
111 | (pop @pool)->ready; |
|
|
112 | } else { |
|
|
113 | async \&handler; |
|
|
114 | } |
|
|
115 | } |
|
|
116 | }; |
51 | } |
117 | } |
52 | |
118 | |
53 | my $http_port = new Coro::Socket |
119 | my $http_port = new Coro::Socket |
54 | LocalAddr => $SERVER_HOST, |
120 | LocalAddr => $SERVER_HOST, |
55 | LocalPort => $SERVER_PORT, |
121 | LocalPort => $SERVER_PORT, |
56 | ReuseAddr => 1, |
122 | ReuseAddr => 1, |
57 | Listen => 50, |
123 | Listen => 50, |
58 | or die "unable to start server"; |
124 | or die "unable to start server"; |
59 | |
125 | |
60 | push @listen_sockets, $http_port; |
126 | listen_on $http_port; |
61 | |
127 | |
62 | # the "main thread" |
128 | if ($SERVER_PORT2) { |
63 | async { |
129 | my $http_port = new Coro::Socket |
64 | slog 1, "accepting connections"; |
130 | LocalAddr => $SERVER_HOST, |
65 | while () { |
131 | LocalPort => $SERVER_PORT2, |
66 | $connections->down; |
132 | ReuseAddr => 1, |
67 | push @newcons, [$http_port->accept]; |
133 | Listen => 50, |
68 | #slog 3, "accepted @$connections ".scalar(@pool); |
134 | or die "unable to start server"; |
69 | $::NOW = time; |
|
|
70 | if (@pool) { |
|
|
71 | (pop @pool)->ready; |
|
|
72 | } else { |
|
|
73 | async \&handler; |
|
|
74 | } |
|
|
75 | |
135 | |
76 | } |
136 | listen_on $http_port; |
77 | }; |
137 | } |
78 | |
138 | |
79 | package conn; |
139 | package conn; |
80 | |
140 | |
81 | use Socket; |
141 | use Socket; |
82 | use HTTP::Date; |
142 | use HTTP::Date; |
83 | use Convert::Scalar 'weaken'; |
143 | use Convert::Scalar 'weaken'; |
84 | use Linux::AIO; |
144 | use IO::AIO; |
85 | |
145 | |
86 | Linux::AIO::min_parallel $::AIO_PARALLEL; |
146 | IO::AIO::min_parallel $::AIO_PARALLEL; |
87 | |
147 | |
88 | Event->io(fd => Linux::AIO::poll_fileno, |
148 | Event->io(fd => IO::AIO::poll_fileno, |
89 | poll => 'r', async => 1, |
149 | poll => 'r', async => 1, |
90 | cb => \&Linux::AIO::poll_cb); |
150 | cb => \&IO::AIO::poll_cb); |
91 | |
151 | |
92 | our %conn; # $conn{ip}{self} => connobj |
152 | our %conn; # $conn{ip}{self} => connobj |
93 | our %uri; # $uri{ip}{uri}{self} |
153 | our %uri; # $uri{ip}{uri}{self} |
94 | our %blocked; |
154 | our %blocked; |
95 | our %mimetype; |
155 | our %mimetype; |
… | |
… | |
109 | |
169 | |
110 | read_mimetypes; |
170 | read_mimetypes; |
111 | |
171 | |
112 | sub new { |
172 | sub new { |
113 | my $class = shift; |
173 | my $class = shift; |
|
|
174 | my $fh = shift; |
114 | my $peername = shift; |
175 | my $peername = shift; |
115 | my $fh = shift; |
|
|
116 | my $self = bless { fh => $fh }, $class; |
176 | my $self = bless { fh => $fh }, $class; |
117 | my (undef, $iaddr) = unpack_sockaddr_in $peername |
177 | my (undef, $iaddr) = unpack_sockaddr_in $peername |
118 | or $self->err(500, "unable to decode peername"); |
178 | or $self->err(500, "unable to decode peername"); |
119 | |
179 | |
|
|
180 | $self->{remote_addr} = |
120 | $self->{remote_addr} = inet_ntoa $iaddr; |
181 | $self->{remote_id} = inet_ntoa $iaddr; |
|
|
182 | |
121 | $self->{time} = $::NOW; |
183 | $self->{time} = $::NOW; |
122 | |
184 | |
123 | # enter ourselves into various lists |
185 | weaken ($Coro::current->{conn} = $self); |
124 | weaken ($conn{$self->{remote_addr}}{$self*1} = $self); |
|
|
125 | |
186 | |
126 | $::conns++; |
187 | $::conns++; |
|
|
188 | $::maxconns = $::conns if $::conns > $::maxconns; |
127 | |
189 | |
128 | $self; |
190 | $self; |
129 | } |
191 | } |
130 | |
192 | |
131 | sub DESTROY { |
193 | sub DESTROY { |
132 | my $self = shift; |
194 | #my $self = shift; |
133 | |
|
|
134 | $::conns--; |
195 | $::conns--; |
135 | |
|
|
136 | $self->eoconn; |
|
|
137 | delete $conn{$self->{remote_addr}}{$self*1}; |
|
|
138 | } |
196 | } |
139 | |
197 | |
140 | # end of connection |
198 | sub prune_cache { |
141 | sub eoconn { |
199 | my $hash = $_[0]; |
142 | my $self = shift; |
200 | |
143 | delete $uri{$self->{remote_addr}}{$self->{uri}}{$self*1}; |
201 | for (keys %$hash) { |
|
|
202 | if (ref $hash->{$_} eq HASH::) { |
|
|
203 | prune_cache($hash->{$_}); |
|
|
204 | unless (scalar keys %{$hash->{$_}}) { |
|
|
205 | delete $hash->{$_}; |
|
|
206 | $d2++; |
|
|
207 | } |
|
|
208 | } |
|
|
209 | } |
144 | } |
210 | } |
|
|
211 | |
|
|
212 | sub prune_caches { |
|
|
213 | prune_cache \%conn; |
|
|
214 | prune_cache \%uri; |
|
|
215 | |
|
|
216 | for (keys %blocked) { |
|
|
217 | delete $blocked{$_} unless $blocked{$_}[0] > $::NOW; |
|
|
218 | } |
|
|
219 | } |
|
|
220 | |
|
|
221 | Event->timer(interval => 60, cb => \&prune_caches); |
145 | |
222 | |
146 | sub slog { |
223 | sub slog { |
147 | my $self = shift; |
224 | my $self = shift; |
148 | main::slog($_[0], "$self->{remote_addr}> $_[1]"); |
225 | main::slog($_[0], "$self->{remote_id}> $_[1]"); |
149 | } |
226 | } |
150 | |
227 | |
151 | sub response { |
228 | sub response { |
152 | my ($self, $code, $msg, $hdr, $content) = @_; |
229 | my ($self, $code, $msg, $hdr, $content) = @_; |
153 | my $res = "HTTP/1.1 $code $msg\015\012"; |
230 | my $res = "HTTP/1.1 $code $msg\015\012"; |
|
|
231 | my $GZ = ""; |
154 | |
232 | |
155 | $self->{h}{connection} ||= $hdr->{Connection}; |
233 | if (exists $hdr->{Connection}) { |
|
|
234 | if ($hdr->{Connection} =~ /close/) { |
|
|
235 | $self->{h}{connection} = "close" |
|
|
236 | } |
|
|
237 | } else { |
|
|
238 | if ($self->{version} < 1.1) { |
|
|
239 | if ($self->{h}{connection} =~ /keep-alive/i) { |
|
|
240 | $hdr->{Connection} = "Keep-Alive"; |
|
|
241 | } else { |
|
|
242 | $self->{h}{connection} = "close" |
|
|
243 | } |
|
|
244 | } |
|
|
245 | } |
156 | |
246 | |
157 | $res .= "Date: ".(time2str $::NOW)."\015\012"; # slow? nah. :( |
247 | if ($self->{method} ne "HEAD" |
|
|
248 | && $self->{h}{"accept-encoding"} =~ /\bgzip\b/ |
|
|
249 | && 400 < length $content |
|
|
250 | && $hdr->{"Content-Length"} == length $content |
|
|
251 | && !exists $hdr->{"Content-Encoding"} |
|
|
252 | ) { |
|
|
253 | my $orig = length $content; |
|
|
254 | $hdr->{"Content-Encoding"} = "gzip"; |
|
|
255 | $content = Compress::Zlib::memGzip(\$content); |
|
|
256 | $hdr->{"Content-Length"} = length $content; |
|
|
257 | $GZ = sprintf "GZ%02d", 100 - 100*((length $content) / $orig); |
|
|
258 | } |
|
|
259 | |
|
|
260 | $res .= "Date: $HTTP_NOW\015\012"; |
|
|
261 | $res .= "Server: $::NAME\015\012"; |
158 | |
262 | |
159 | while (my ($h, $v) = each %$hdr) { |
263 | while (my ($h, $v) = each %$hdr) { |
160 | $res .= "$h: $v\015\012" |
264 | $res .= "$h: $v\015\012" |
161 | } |
265 | } |
162 | $res .= "\015\012"; |
266 | $res .= "\015\012"; |
163 | |
267 | |
164 | $res .= $content if defined $content and $self->{method} ne "HEAD"; |
268 | $res .= $content if defined $content and $self->{method} ne "HEAD"; |
165 | |
269 | |
166 | my $log = "$self->{remote_addr} \"$self->{uri}\" $code ".$hdr->{"Content-Length"}." \"$self->{h}{referer}\"\n"; |
270 | my $log = (POSIX::strftime "%Y-%m-%d %H:%M:%S", gmtime $::NOW). |
|
|
271 | " $self->{remote_id} \"$self->{uri}\" $code ".$hdr->{"Content-Length"}.$GZ. |
|
|
272 | " \"$self->{h}{referer}\"\n"; |
167 | |
273 | |
168 | print $accesslog $log if $accesslog; |
274 | print $::accesslog $log if $::accesslog; |
169 | print STDERR $log; |
275 | print STDERR $log; |
170 | |
276 | |
171 | $self->{written} += |
277 | $tbf_top->request(length $res, 1e6); |
172 | print {$self->{fh}} $res; |
278 | $self->{written} += print {$self->{fh}} $res; |
173 | } |
279 | } |
174 | |
280 | |
175 | sub err { |
281 | sub err { |
176 | my $self = shift; |
282 | my $self = shift; |
177 | my ($code, $msg, $hdr, $content) = @_; |
283 | my ($code, $msg, $hdr, $content) = @_; |
178 | |
284 | |
179 | unless (defined $content) { |
285 | unless (defined $content) { |
180 | $content = "$code $msg"; |
286 | $content = "$code $msg\n"; |
181 | $hdr->{"Content-Type"} = "text/plain"; |
287 | $hdr->{"Content-Type"} = "text/plain"; |
182 | $hdr->{"Content-Length"} = length $content; |
288 | $hdr->{"Content-Length"} = length $content; |
183 | } |
289 | } |
184 | $hdr->{"Connection"} = "close"; |
290 | $hdr->{"Connection"} = "close"; |
185 | |
291 | |
186 | $self->response($code, $msg, $hdr, $content); |
292 | $self->response($code, $msg, $hdr, $content); |
187 | |
293 | |
188 | die bless {}, err::; |
294 | die bless {}, err::; |
189 | } |
295 | } |
190 | |
296 | |
191 | sub err_blocked { |
|
|
192 | my $self = shift; |
|
|
193 | my $ip = $self->{remote_addr}; |
|
|
194 | my $time = time2str $blocked{$ip} = $::NOW + $::BLOCKTIME; |
|
|
195 | |
|
|
196 | Coro::Event::do_timer(after => 20*rand); |
|
|
197 | |
|
|
198 | $self->err(401, "too many connections", |
|
|
199 | { |
|
|
200 | "Content-Type" => "text/html", |
|
|
201 | "Retry-After" => $::BLOCKTIME, |
|
|
202 | "Warning" => "Please do NOT retry, you have been blocked", |
|
|
203 | "WWW-Authenticate" => "Basic realm=\"Please do NOT retry, you have been blocked\"", |
|
|
204 | "Connection" => "close", |
|
|
205 | }, |
|
|
206 | <<EOF); |
|
|
207 | <html> |
|
|
208 | <head> |
|
|
209 | <title>Too many connections</title> |
|
|
210 | </head> |
|
|
211 | <body bgcolor="#ffffff" text="#000000" link="#0000ff" vlink="#000080" alink="#ff0000"> |
|
|
212 | |
|
|
213 | <p>You have been blocked because you opened too many connections. You |
|
|
214 | may retry at</p> |
|
|
215 | |
|
|
216 | <p><blockquote>$time.</blockquote></p> |
|
|
217 | |
|
|
218 | <p>Until then, each new access will renew the block. You might want to have a |
|
|
219 | look at the <a href="http://www.goof.com/pcg/marc/animefaq.html#connectionlimit">FAQ</a>.</p> |
|
|
220 | |
|
|
221 | </body></html> |
|
|
222 | EOF |
|
|
223 | } |
|
|
224 | |
|
|
225 | sub handle { |
297 | sub handle { |
226 | my $self = shift; |
298 | my $self = shift; |
227 | my $fh = $self->{fh}; |
299 | my $fh = $self->{fh}; |
|
|
300 | |
|
|
301 | my $host; |
228 | |
302 | |
229 | $fh->timeout($::REQ_TIMEOUT); |
303 | $fh->timeout($::REQ_TIMEOUT); |
230 | while() { |
304 | while() { |
231 | $self->{reqs}++; |
305 | $self->{reqs}++; |
232 | |
306 | |
… | |
… | |
242 | } |
316 | } |
243 | |
317 | |
244 | $self->{h} = {}; |
318 | $self->{h} = {}; |
245 | |
319 | |
246 | $fh->timeout($::RES_TIMEOUT); |
320 | $fh->timeout($::RES_TIMEOUT); |
247 | my $ip = $self->{remote_addr}; |
|
|
248 | |
|
|
249 | if ($blocked{$ip}) { |
|
|
250 | $self->err_blocked($blocked{$ip}) |
|
|
251 | if $blocked{$ip} > $::NOW; |
|
|
252 | |
|
|
253 | delete $blocked{$ip}; |
|
|
254 | } |
|
|
255 | |
|
|
256 | if (%{$conn{$ip}} > $::MAX_CONN_IP) { |
|
|
257 | $self->slog(2, "blocked ip $ip"); |
|
|
258 | $self->err_blocked; |
|
|
259 | } |
|
|
260 | |
321 | |
261 | $req =~ /^(?:\015\012)? |
322 | $req =~ /^(?:\015\012)? |
262 | (GET|HEAD) \040+ |
323 | (GET|HEAD) \040+ |
263 | ([^\040]+) \040+ |
324 | ([^\040]+) \040+ |
264 | HTTP\/([0-9]+\.[0-9]+) |
325 | HTTP\/([0-9]+\.[0-9]+) |
… | |
… | |
277 | my (%hdr, $h, $v); |
338 | my (%hdr, $h, $v); |
278 | |
339 | |
279 | $hdr{lc $1} .= ",$2" |
340 | $hdr{lc $1} .= ",$2" |
280 | while $req =~ /\G |
341 | while $req =~ /\G |
281 | ([^:\000-\040]+): |
342 | ([^:\000-\040]+): |
282 | [\008\040]* |
343 | [\011\040]* |
283 | ((?: [^\015\012]+ | \015\012[\008\040] )*) |
344 | ((?: [^\015\012]+ | \015\012[\011\040] )*) |
284 | \015\012 |
345 | \015\012 |
285 | /gxc; |
346 | /gxc; |
286 | |
347 | |
287 | $req =~ /\G\015\012$/ |
348 | $req =~ /\G\015\012$/ |
288 | or $self->err(400, "bad request"); |
349 | or $self->err(400, "bad request"); |
289 | |
350 | |
290 | $self->{h}{$h} = substr $v, 1 |
351 | $self->{h}{$h} = substr $v, 1 |
291 | while ($h, $v) = each %hdr; |
352 | while ($h, $v) = each %hdr; |
292 | } |
353 | } |
293 | |
354 | |
|
|
355 | # remote id should be unique per user |
|
|
356 | my $id = $self->{remote_addr}; |
|
|
357 | |
|
|
358 | if (exists $self->{h}{"client-ip"}) { |
|
|
359 | $id .= "[".$self->{h}{"client-ip"}."]"; |
|
|
360 | } elsif (exists $self->{h}{"x-forwarded-for"}) { |
|
|
361 | $id .= "[".$self->{h}{"x-forwarded-for"}."]"; |
|
|
362 | } |
|
|
363 | |
|
|
364 | $self->{remote_id} = $id; |
|
|
365 | |
|
|
366 | weaken (local $conn{$id}{$self*1} = $self); |
|
|
367 | |
|
|
368 | if ($blocked{$id}) { |
|
|
369 | $self->err_blocked |
|
|
370 | if $blocked{$id}[0] > $::NOW; |
|
|
371 | |
|
|
372 | delete $blocked{$id}; |
|
|
373 | } |
|
|
374 | |
|
|
375 | # find out server name and port |
|
|
376 | if ($self->{uri} =~ s/^http:\/\/([^\/?#]*)//i) { |
|
|
377 | $host = $1; |
|
|
378 | } else { |
|
|
379 | $host = $self->{h}{host}; |
|
|
380 | } |
|
|
381 | |
|
|
382 | if (defined $host) { |
294 | $self->{server_port} = $self->{h}{host} =~ s/:([0-9]+)$// ? $1 : 80; |
383 | $self->{server_port} = $host =~ s/:([0-9]+)$// ? $1 : 80; |
|
|
384 | } else { |
|
|
385 | ($self->{server_port}, $host) |
|
|
386 | = unpack_sockaddr_in $self->{fh}->sockname |
|
|
387 | or $self->err(500, "unable to get socket name"); |
|
|
388 | $host = inet_ntoa $host; |
|
|
389 | } |
295 | |
390 | |
|
|
391 | $self->{server_name} = $host; |
|
|
392 | |
296 | weaken ($uri{$self->{remote_addr}}{$self->{uri}}{$self*1} = $self); |
393 | weaken (local $uri{$id}{$self->{uri}}{$self*1} = $self); |
297 | |
394 | |
298 | eval { |
395 | eval { |
299 | $self->map_uri; |
396 | $self->map_uri; |
300 | $self->respond; |
397 | $self->respond; |
301 | }; |
398 | }; |
302 | |
399 | |
303 | $self->eoconn; |
|
|
304 | |
|
|
305 | die if $@ && !ref $@; |
400 | die if $@ && !ref $@; |
306 | |
401 | |
307 | last if $self->{h}{connection} =~ /close/ || $self->{version} lt "1.1"; |
402 | last if $self->{h}{connection} =~ /close/i; |
308 | |
403 | |
309 | $self->slog(9, "persistent connection [".$self->{h}{"user-agent"}."][$self->{reqs}]"); |
404 | $httpevent->broadcast; |
|
|
405 | |
310 | $fh->timeout($::PER_TIMEOUT); |
406 | $fh->timeout($::PER_TIMEOUT); |
311 | } |
407 | } |
|
|
408 | } |
|
|
409 | |
|
|
410 | sub block { |
|
|
411 | my $self = shift; |
|
|
412 | |
|
|
413 | $blocked{$self->{remote_id}} = [$::NOW + $_[0], $_[1]]; |
|
|
414 | $self->slog(2, "blocked ip $self->{remote_id}"); |
|
|
415 | $self->err_blocked; |
312 | } |
416 | } |
313 | |
417 | |
314 | # uri => path mapping |
418 | # uri => path mapping |
315 | sub map_uri { |
419 | sub map_uri { |
316 | my $self = shift; |
420 | my $self = shift; |
317 | my $host = $self->{h}{host} || "default"; |
421 | my $host = $self->{server_name}; |
318 | my $uri = $self->{uri}; |
422 | my $uri = $self->{uri}; |
319 | |
423 | |
320 | # some massaging, also makes it more secure |
424 | # some massaging, also makes it more secure |
321 | $uri =~ s/%([0-9a-fA-F][0-9a-fA-F])/chr hex $1/ge; |
425 | $uri =~ s/%([0-9a-fA-F][0-9a-fA-F])/chr hex $1/ge; |
322 | $uri =~ s%//+%/%g; |
426 | $uri =~ s%//+%/%g; |
… | |
… | |
332 | $self->{path} = "$::DOCROOT/$host$uri"; |
436 | $self->{path} = "$::DOCROOT/$host$uri"; |
333 | |
437 | |
334 | $self->access_check; |
438 | $self->access_check; |
335 | } |
439 | } |
336 | |
440 | |
337 | sub server_address { |
|
|
338 | my $self = shift; |
|
|
339 | my ($port, $iaddr) = unpack_sockaddr_in $self->{fh}->getsockname |
|
|
340 | or $self->err(500, "unable to get socket name"); |
|
|
341 | ((inet_ntoa $iaddr), $port); |
|
|
342 | } |
|
|
343 | |
|
|
344 | sub server_host { |
|
|
345 | my $self = shift; |
|
|
346 | if (exists $self->{h}{host}) { |
|
|
347 | return $self->{h}{host}; |
|
|
348 | } else { |
|
|
349 | return (($self->server_address)[0]); |
|
|
350 | } |
|
|
351 | } |
|
|
352 | |
|
|
353 | sub server_hostport { |
|
|
354 | my $self = shift; |
|
|
355 | my ($host, $port); |
|
|
356 | if (exists $self->{h}{host}) { |
|
|
357 | ($host, $port) = ($self->{h}{host}, $self->{server_port}); |
|
|
358 | } else { |
|
|
359 | ($host, $port) = $self->server_address; |
|
|
360 | } |
|
|
361 | $port = $port == 80 ? "" : ":$port"; |
|
|
362 | $host.$port; |
|
|
363 | } |
|
|
364 | |
|
|
365 | sub _cgi { |
441 | sub _cgi { |
366 | my $self = shift; |
442 | my $self = shift; |
367 | my $path = shift; |
443 | my $path = shift; |
368 | my $fh; |
444 | my $fh; |
369 | |
445 | |
370 | # no two-way xxx supported |
446 | # no two-way xxx supported |
371 | if (0 == fork) { |
447 | if (0 == fork) { |
372 | open STDOUT, ">&".fileno($self->{fh}); |
448 | open STDOUT, ">&".fileno($self->{fh}); |
373 | if (chdir $::DOCROOT) { |
449 | if (chdir $::DOCROOT) { |
374 | $ENV{SERVER_SOFTWARE} = "thttpd-myhttpd"; # we are thttpd-alike |
450 | $ENV{SERVER_SOFTWARE} = "thttpd-myhttpd"; # we are thttpd-alike |
375 | $ENV{HTTP_HOST} = $self->server_host; |
451 | $ENV{HTTP_HOST} = $self->{server_name}; |
376 | $ENV{HTTP_PORT} = $self->{server_host}; |
452 | $ENV{HTTP_PORT} = $self->{server_port}; |
377 | $ENV{SCRIPT_NAME} = $self->{name}; |
453 | $ENV{SCRIPT_NAME} = $self->{name}; |
378 | exec $path; |
454 | exec $path; |
379 | } |
455 | } |
380 | Coro::State::_exit(0); |
456 | Coro::State::_exit(0); |
381 | } else { |
457 | } else { |
|
|
458 | die; |
382 | } |
459 | } |
|
|
460 | } |
|
|
461 | |
|
|
462 | sub server_hostport { |
|
|
463 | $_[0]{server_port} == 80 |
|
|
464 | ? $_[0]{server_name} |
|
|
465 | : "$_[0]{server_name}:$_[0]{server_port}"; |
383 | } |
466 | } |
384 | |
467 | |
385 | sub respond { |
468 | sub respond { |
386 | my $self = shift; |
469 | my $self = shift; |
387 | my $path = $self->{path}; |
470 | my $path = $self->{path}; |
388 | |
471 | |
389 | stat $path |
472 | if ($self->{name} =~ s%^/internal/([^/]+)%%) { |
390 | or $self->err(404, "not found"); |
473 | if ($::internal{$1}) { |
391 | |
474 | $::internal{$1}->($self); |
392 | $self->{stat} = [stat _]; |
|
|
393 | |
|
|
394 | # idiotic netscape sends idiotic headers AGAIN |
|
|
395 | my $ims = $self->{h}{"if-modified-since"} =~ /^([^;]+)/ |
|
|
396 | ? str2time $1 : 0; |
|
|
397 | |
|
|
398 | if (-d _ && -r _) { |
|
|
399 | # directory |
|
|
400 | if ($path !~ /\/$/) { |
|
|
401 | # create a redirect to get the trailing "/" |
|
|
402 | my $host = $self->server_hostport; |
|
|
403 | $self->err(301, "moved permanently", { Location => "http://$host$self->{uri}/" }); |
|
|
404 | } else { |
475 | } else { |
405 | $ims < $self->{stat}[9] |
476 | $self->err(404, "not found"); |
|
|
477 | } |
|
|
478 | } else { |
|
|
479 | |
|
|
480 | stat $path |
406 | or $self->err(304, "not modified"); |
481 | or $self->err(404, "not found"); |
407 | |
482 | |
408 | if (-r "$path/index.html") { |
483 | $self->{stat} = [stat _]; |
409 | $self->{path} .= "/index.html"; |
484 | |
410 | $self->handle_file; |
485 | # idiotic netscape sends idiotic headers AGAIN |
|
|
486 | my $ims = $self->{h}{"if-modified-since"} =~ /^([^;]+)/ |
|
|
487 | ? str2time $1 : 0; |
|
|
488 | |
|
|
489 | if (-d _ && -r _) { |
|
|
490 | # directory |
|
|
491 | if ($path !~ /\/$/) { |
|
|
492 | # create a redirect to get the trailing "/" |
|
|
493 | # we don't try to avoid the :80 |
|
|
494 | $self->err(301, "moved permanently", { Location => "http://".$self->server_hostport."$self->{uri}/" }); |
411 | } else { |
495 | } else { |
|
|
496 | $ims < $self->{stat}[9] |
|
|
497 | or $self->err(304, "not modified"); |
|
|
498 | |
|
|
499 | if (-r "$path/index.html") { |
|
|
500 | # replace directory "size" by index.html filesize |
|
|
501 | $self->{stat} = [stat ($self->{path} .= "/index.html")]; |
|
|
502 | $self->handle_file($queue_index, $tbf_top); |
|
|
503 | } else { |
412 | $self->handle_dir; |
504 | $self->handle_dir; |
413 | } |
505 | } |
414 | } |
506 | } |
415 | } elsif (-f _ && -r _) { |
507 | } elsif (-f _ && -r _) { |
416 | -x _ and $self->err(403, "forbidden"); |
508 | -x _ and $self->err(403, "forbidden"); |
417 | $self->handle_file; |
509 | |
|
|
510 | if (keys %{$conn{$self->{remote_id}}} > $::MAX_TRANSFERS_IP) { |
|
|
511 | my $timeout = $::NOW + 10; |
|
|
512 | while (keys %{$conn{$self->{remote_id}}} > $::MAX_TRANSFERS_IP) { |
|
|
513 | if ($timeout < $::NOW) { |
|
|
514 | $self->block($::BLOCKTIME, "too many connections"); |
|
|
515 | } else { |
|
|
516 | $httpevent->wait; |
|
|
517 | } |
|
|
518 | } |
|
|
519 | } |
|
|
520 | |
|
|
521 | $self->handle_file($queue_file, $tbf_top); |
418 | } else { |
522 | } else { |
419 | $self->err(404, "not found"); |
523 | $self->err(404, "not found"); |
|
|
524 | } |
420 | } |
525 | } |
421 | } |
526 | } |
422 | |
527 | |
423 | sub handle_dir { |
528 | sub handle_dir { |
424 | my $self = shift; |
529 | my $self = shift; |
425 | my $idx = $self->diridx; |
530 | my $idx = $self->diridx; |
426 | |
531 | |
427 | $self->response(200, "ok", |
532 | $self->response(200, "ok", |
428 | { |
533 | { |
429 | "Content-Type" => "text/html", |
534 | "Content-Type" => "text/html; charset=utf-8", |
430 | "Content-Length" => length $idx, |
535 | "Content-Length" => length $idx, |
|
|
536 | "Last-Modified" => time2str ($self->{stat}[9]), |
431 | }, |
537 | }, |
432 | $idx); |
538 | $idx); |
433 | } |
539 | } |
434 | |
540 | |
435 | sub handle_file { |
541 | sub handle_file { |
436 | my $self = shift; |
542 | my ($self, $queue, $tbf) = @_; |
437 | my $length = -s _; |
543 | my $length = $self->{stat}[7]; |
438 | my $hdr = { |
544 | my $hdr = { |
439 | "Last-Modified" => time2str ((stat _)[9]), |
545 | "Last-Modified" => time2str ((stat _)[9]), |
|
|
546 | "Accept-Ranges" => "bytes", |
440 | }; |
547 | }; |
441 | |
548 | |
442 | my @code = (200, "ok"); |
549 | my @code = (200, "ok"); |
443 | my ($l, $h); |
550 | my ($l, $h); |
444 | |
551 | |
… | |
… | |
454 | } |
561 | } |
455 | goto satisfiable if $l >= 0 && $l < $length && $h >= 0 && $h >= $l; |
562 | goto satisfiable if $l >= 0 && $l < $length && $h >= 0 && $h >= $l; |
456 | } |
563 | } |
457 | $hdr->{"Content-Range"} = "bytes */$length"; |
564 | $hdr->{"Content-Range"} = "bytes */$length"; |
458 | $hdr->{"Content-Length"} = $length; |
565 | $hdr->{"Content-Length"} = $length; |
459 | $self->slog(9, "not satisfiable($self->{h}{range}|".$self->{h}{"user-agent"}.")"); |
|
|
460 | $self->err(416, "not satisfiable", $hdr, ""); |
566 | $self->err(416, "not satisfiable", $hdr, ""); |
461 | |
567 | |
462 | satisfiable: |
568 | satisfiable: |
463 | # check for segmented downloads |
569 | # check for segmented downloads |
464 | if ($l && $::NO_SEGMENTED) { |
570 | if ($l && $::NO_SEGMENTED) { |
|
|
571 | my $timeout = $::NOW + 15; |
465 | if (%{$uri{$self->{remote_addr}}{$self->{uri}}} > 1) { |
572 | while (keys %{$uri{$self->{remote_id}}{$self->{uri}}} > 1) { |
466 | $self->err(400, "segmented downloads are not allowed", |
573 | if ($timeout <= $::NOW) { |
467 | { "Content-Type" => "text/html", Connection => "close" }, <<EOF); |
574 | $self->block($::BLOCKTIME, "segmented downloads are forbidden"); |
468 | <html> |
575 | #$self->err_segmented_download; |
469 | <head> |
576 | } else { |
470 | <title>Segmented downloads are not allowed</title> |
577 | $httpevent->wait; |
471 | </head> |
578 | } |
472 | <body bgcolor="#ffffff" text="#000000" link="#0000ff" vlink="#000080" alink="#ff0000"> |
|
|
473 | |
|
|
474 | <p>Segmented downloads are not allowed on this server. Please refer to the |
|
|
475 | <a href="http://www.goof.com/pcg/marc/animefaq.html#segmented_downloads">FAQ</a>.</p> |
|
|
476 | |
|
|
477 | </body></html> |
|
|
478 | EOF |
|
|
479 | EOF |
|
|
480 | } |
579 | } |
481 | } |
580 | } |
482 | |
581 | |
483 | $hdr->{"Content-Range"} = "bytes $l-$h/$length"; |
582 | $hdr->{"Content-Range"} = "bytes $l-$h/$length"; |
484 | @code = (206, "partial content"); |
583 | @code = (206, "partial content"); |
… | |
… | |
494 | $hdr->{"Content-Length"} = $length; |
593 | $hdr->{"Content-Length"} = $length; |
495 | |
594 | |
496 | $self->response(@code, $hdr, ""); |
595 | $self->response(@code, $hdr, ""); |
497 | |
596 | |
498 | if ($self->{method} eq "GET") { |
597 | if ($self->{method} eq "GET") { |
|
|
598 | $self->{time} = $::NOW; |
|
|
599 | $self->{written} = 0; |
|
|
600 | |
|
|
601 | my $current = $Coro::current; |
|
|
602 | |
499 | my ($fh, $buf, $r); |
603 | my ($fh, $buf, $r); |
500 | my $current = $Coro::current; |
604 | |
501 | open $fh, "<", $self->{path} |
605 | open $fh, "<", $self->{path} |
502 | or die "$self->{path}: late open failure ($!)"; |
606 | or die "$self->{path}: late open failure ($!)"; |
503 | |
607 | |
504 | $h -= $l - 1; |
608 | $h -= $l - 1; |
505 | |
609 | |
506 | if (0) { |
610 | if (0) { # !AIO |
507 | if ($l) { |
611 | if ($l) { |
508 | sysseek $fh, $l, 0; |
612 | sysseek $fh, $l, 0; |
509 | } |
613 | } |
510 | } |
614 | } |
|
|
615 | |
|
|
616 | my $transfer = $queue->start_transfer($h); |
|
|
617 | my $locked; |
|
|
618 | my $bufsize = $::WAIT_BUFSIZE; # initial buffer size |
511 | |
619 | |
512 | while ($h > 0) { |
620 | while ($h > 0) { |
|
|
621 | unless ($locked) { |
|
|
622 | if ($locked ||= $transfer->try($::WAIT_INTERVAL)) { |
|
|
623 | $bufsize = $::BUFSIZE; |
|
|
624 | $self->{time} = $::NOW; |
|
|
625 | $self->{written} = 0; |
|
|
626 | } |
|
|
627 | } |
|
|
628 | |
|
|
629 | if ($blocked{$self->{remote_id}}) { |
|
|
630 | $self->{h}{connection} = "close"; |
|
|
631 | die bless {}, err::; |
|
|
632 | } |
|
|
633 | |
513 | if (0) { |
634 | if (0) { # !AIO |
514 | sysread $fh, $buf, $h > $::BUFSIZE ? $::BUFSIZE : $h |
635 | sysread $fh, $buf, $h > $bufsize ? $bufsize : $h |
515 | or last; |
636 | or last; |
516 | } else { |
637 | } else { |
517 | aio_read($fh, $l, ($h > $::BUFSIZE ? $::BUFSIZE : $h), |
638 | aio_read($fh, $l, ($h > $bufsize ? $bufsize : $h), |
518 | $buf, 0, sub { |
639 | $buf, 0, sub { |
519 | $r = $_[0]; |
640 | $r = $_[0]; |
520 | $current->ready; |
641 | Coro::ready($current); |
521 | }); |
642 | }); |
522 | &Coro::schedule; |
643 | &Coro::schedule; |
523 | last unless $r; |
644 | last unless $r; |
524 | } |
645 | } |
525 | my $w = $self->{fh}->syswrite($buf) |
646 | |
|
|
647 | $tbf->request(length $buf); |
|
|
648 | my $w = syswrite $self->{fh}, $buf |
526 | or last; |
649 | or last; |
527 | $::written += $w; |
650 | $::written += $w; |
528 | $self->{written} += $w; |
651 | $self->{written} += $w; |
529 | $l += $r; |
652 | $l += $r; |
530 | } |
653 | } |
531 | } |
|
|
532 | |
654 | |
533 | close $fh; |
655 | close $fh; |
|
|
656 | } |
534 | } |
657 | } |
535 | |
658 | |
536 | 1; |
659 | 1; |