1 |
#!/usr/bin/perl |
2 |
|
3 |
# APNIC refer: KRNIC (for 211.104.0.0) |
4 |
|
5 |
use Socket; |
6 |
use Fcntl; |
7 |
|
8 |
use Coro; |
9 |
use Coro::Event; |
10 |
use Coro::Semaphore; |
11 |
use Coro::SemaphoreSet; |
12 |
use Coro::Socket; |
13 |
use Coro::Timer; |
14 |
|
15 |
use BerkeleyDB; |
16 |
|
17 |
$Event::DIED = sub { |
18 |
Event::verbose_exception_handler(@_); |
19 |
#Event::unloop_all(); |
20 |
}; |
21 |
|
22 |
tie %netgeo::whois, BerkeleyDB::Btree, |
23 |
-Env => $db_env, |
24 |
-Filename => "whois", |
25 |
-Flags => DB_CREATE, |
26 |
or die "unable to create/open whois table"; |
27 |
$netgeo::iprange = new BerkeleyDB::Btree |
28 |
-Env => $db_env, |
29 |
-Filename => "iprange", |
30 |
-Flags => DB_CREATE, |
31 |
or die "unable to create/open iprange table"; |
32 |
|
33 |
package Whois; |
34 |
|
35 |
use Coro::Event; |
36 |
|
37 |
sub new { |
38 |
my $class = shift; |
39 |
my $name = shift; |
40 |
my $ip = shift; |
41 |
my $self = bless { name => $name, ip => $ip, @_ }, $class; |
42 |
$self->{maxjobs} = new Coro::Semaphore $self->{maxjobs} || 1; |
43 |
$self; |
44 |
} |
45 |
|
46 |
sub ip { |
47 |
$_[0]{ip}; |
48 |
} |
49 |
|
50 |
sub sanitize { |
51 |
$_[1]; |
52 |
} |
53 |
|
54 |
sub whois_request { |
55 |
my ($self, $query) = @_; |
56 |
|
57 |
my $id = "$self->{name}\x0$query"; |
58 |
my $whois = $netgeo::whois{$id}; |
59 |
|
60 |
unless (defined $whois) { |
61 |
print "WHOIS($self->{name},$query)\n"; |
62 |
|
63 |
my $guard = $self->{maxjobs}->guard; |
64 |
my $timeout = 5; |
65 |
|
66 |
while () { |
67 |
my $fh = new Coro::Socket |
68 |
PeerAddr => $self->ip, |
69 |
PeerPort => $self->{port} || "whois", |
70 |
Timeout => 30; |
71 |
if ($fh) { |
72 |
print $fh "$query\n"; |
73 |
$fh->read($whois, 16*1024); # max 16k. whois stored |
74 |
close $fh; |
75 |
$whois =~ s/\015?\012/\n/g; |
76 |
$whois = $self->sanitize($whois); |
77 |
if ($whois eq "" |
78 |
or ($whois =~ /query limit/i && $whois =~ /exceeded/i) # ARIN |
79 |
or ($whois =~ /wait a while and try again/i) # ARIN |
80 |
or ($whois =~ /^%ERROR:202:/) # RIPE/APNIC |
81 |
) { |
82 |
print "retrying in $timeout seconds\n";#d# |
83 |
do_timer(desc => "timer2", after => $timeout); |
84 |
$timeout *= 2; |
85 |
$timeout = 1 if $timeout > 600; |
86 |
} else { |
87 |
last; |
88 |
} |
89 |
} else { |
90 |
# only retry once a minute |
91 |
print STDERR "unable to connect to $self->{ip} ($self->{name}), retrying...\n"; |
92 |
Coro::Timer::sleep 300; |
93 |
} |
94 |
} |
95 |
|
96 |
$netgeo::whois{$id} = $whois; |
97 |
} |
98 |
|
99 |
$whois; |
100 |
} |
101 |
|
102 |
package Whois::ARIN; |
103 |
|
104 |
use Date::Parse; |
105 |
|
106 |
use base Whois; |
107 |
|
108 |
sub sanitize { |
109 |
local $_ = $_[1]; |
110 |
s/\n[\t ]{6,}([0-9.]+ - [0-9.]+)/ $1/g; |
111 |
$_; |
112 |
} |
113 |
|
114 |
# there are only two problems with arin's whois database: |
115 |
# a) the data cannot be trusted and often is old or even wrong |
116 |
# b) the database format is nonparsable |
117 |
# (no spaces between netname/ip and netnames can end in digits ;) |
118 |
# of course, the only source to find out about global |
119 |
# address distribution is... arin. |
120 |
sub ip_request { |
121 |
my ($self, $ip) = @_; |
122 |
|
123 |
my $whois = $self->whois_request($ip); |
124 |
|
125 |
return () if $whois =~ /^No match/; |
126 |
|
127 |
if ($whois =~ /^To single out one record/m) { |
128 |
my $handle; |
129 |
while ($whois =~ /\G\S.*\(([A-Z0-9\-]+)\).*\n/mg) { |
130 |
$handle = $1; |
131 |
#return if $handle =~ /-(RIPE|APNIC)/; # heuristic, bbut bad because ripe might not have better info |
132 |
} |
133 |
$handle or die "$whois ($ip): unparseable multimatch\n"; |
134 |
$whois = $self->whois_request("!$handle"); |
135 |
} |
136 |
|
137 |
my ($address, $info, $coordinator, undef) = split /\n\n/, $whois; |
138 |
|
139 |
$info =~ /^\s+Netname: (\S+)$/mi |
140 |
or die "$whois($ip): no netname\n"; |
141 |
my $netname = $1; |
142 |
|
143 |
$info =~ /^\s+Netblock: ([0-9.]+\s+-\s+[0-9.]+)\s*$/mi |
144 |
or die "$whois($ip): no netblock\n"; |
145 |
my $netblock = $1; |
146 |
|
147 |
my $maintainer; |
148 |
|
149 |
if ($info =~ /^\s+Maintainer: (\S+)\s*$/mi) { |
150 |
$maintainer = "*ma: $1\n"; |
151 |
return if $1 =~ /^(?:AP|RIPE)$/; |
152 |
} |
153 |
|
154 |
$coordinator =~ s/^\s+Coordinator:\s*//si |
155 |
or $coordinator = ""; |
156 |
|
157 |
$address =~ s/\n\s*(\S+)$// |
158 |
or die "$whois($ip): no parseable country ($address)\n"; |
159 |
my $country = $1; |
160 |
|
161 |
$address =~ s/^\s*/*de: /mg; |
162 |
$coordinator =~ s/^\s*/*ad: /mg; |
163 |
|
164 |
$whois = <<EOF; |
165 |
*in: $netblock |
166 |
*na: $netname |
167 |
*cy: $country |
168 |
$maintainer$address |
169 |
$coordinator |
170 |
EOF |
171 |
$whois =~ s/\n+$//; |
172 |
$whois; |
173 |
} |
174 |
|
175 |
package Whois::RIPE; |
176 |
|
177 |
use Socket; |
178 |
use base Whois; |
179 |
|
180 |
sub sanitize { |
181 |
local $_ = $_[1]; |
182 |
|
183 |
s/^%.*\n//gm; |
184 |
s/^\n+//; |
185 |
s/\n*$/\n/; |
186 |
|
187 |
s/^inetnum:\s+/*in: /gm; |
188 |
s/^admin-c:\s+/*ac: /gm; |
189 |
s/^tech-c:\s+/*tc: /gm; |
190 |
s/^owner-c:\s+/*oc: /gm; |
191 |
s/^country:\s+/*cy: /gm; |
192 |
s/^phone:\s+/*ph: /gm; |
193 |
s/^remarks:\s+/*rm: /gm; |
194 |
s/^changed:\s+/*ch: /gm; |
195 |
s/^created:\s+/*cr: /gm; |
196 |
s/^address:\s+/*ad: /gm; |
197 |
s/^status:\s+/*st: /gm; |
198 |
s/^inetrev:\s+/*ir: /gm; |
199 |
s/^nserver:\s+/*ns: /gm; |
200 |
|
201 |
$_; |
202 |
} |
203 |
|
204 |
sub ip_request { |
205 |
my ($self, $ip) = @_; |
206 |
|
207 |
my $whois = $self->whois_request("$self->{rflags}$ip"); |
208 |
|
209 |
$whois =~ s{ |
210 |
(2[0-5][0-9]|1[0-9][0-9]|[1-9][0-9]|[0-9]) |
211 |
(?:\. |
212 |
(2[0-5][0-9]|1[0-9][0-9]|[1-9][0-9]|[0-9]) |
213 |
(?:\. |
214 |
(2[0-5][0-9]|1[0-9][0-9]|[1-9][0-9]|[0-9]) |
215 |
(?:\. |
216 |
(2[0-5][0-9]|1[0-9][0-9]|[1-9][0-9]|[0-9]) |
217 |
)? |
218 |
)? |
219 |
)? |
220 |
/ |
221 |
([0-9]+) |
222 |
}{ |
223 |
my $ip = inet_aton sprintf "%d.%d.%d.%d", $1, $2, $3, $4; |
224 |
my $net = 1 << (31 - $5); |
225 |
my $mask = inet_aton 2 ** 32 - $net; |
226 |
|
227 |
my $ip1 = $ip & $mask; |
228 |
my $ip2 = $ip1 | inet_aton $net * 2 - 1; |
229 |
(inet_ntoa $ip1) . " - " . (inet_ntoa $ip2); |
230 |
}gex; |
231 |
|
232 |
$whois =~ /^\*in: 0\.0\.0\.0 - 255\.255\.255\.255/ |
233 |
and return; |
234 |
|
235 |
$whois =~ /^\*ac: XXX0/m # 192.0.0.0 |
236 |
and return; |
237 |
|
238 |
$whois =~ /^\*st: (?:ALLOCATED )?UNSPECIFIED/m |
239 |
and return; |
240 |
|
241 |
$whois =~ /^%ERROR:/m |
242 |
and return; |
243 |
|
244 |
#while ($whois =~ s/^\*(?:ac|tc):\s+(\S+)\n//m) { |
245 |
# $whois .= $self->whois_request("-FSTpn $1"); |
246 |
#} |
247 |
|
248 |
#$whois =~ s/^\*(?:pn|nh|mb|ch|so|rz|ny|st|rm):.*\n//mg; |
249 |
|
250 |
$whois =~ s/\n+$//; |
251 |
|
252 |
$whois; |
253 |
} |
254 |
|
255 |
package Whois::RWHOIS; |
256 |
|
257 |
use base Whois; |
258 |
|
259 |
sub sanitize { |
260 |
local $_ = $_[1]; |
261 |
s/^%referral\s+/referral:/gm; |
262 |
s/^network://gm; |
263 |
s/^%.*\n//gm; |
264 |
s/^\n+//m; |
265 |
s/\n*$/\n/m; |
266 |
|
267 |
s/^(\S+):\s*/\L$1: /gm; |
268 |
s/^ip-network-block:/*in:/gm; |
269 |
s/^country-code:/*cy:/gm; |
270 |
s/^tech-contact;i:/*tc:/gm; |
271 |
s/^updated:/*ch:/gm; |
272 |
s/^street-address:/*ad:/gm; |
273 |
s/^org-name:/*rm:/gm; |
274 |
s/^created:/*cr:/gm; |
275 |
|
276 |
$_; |
277 |
} |
278 |
|
279 |
sub ip_request { |
280 |
my ($self, $ip) = @_; |
281 |
|
282 |
my $whois = $self->whois_request("$ip"); |
283 |
|
284 |
$whois =~ /^\*in: 0\.0\.0\.0 - 255\.255\.255\.255/ |
285 |
and return; |
286 |
|
287 |
$whois =~ /^\*ac: XXX0/m # 192.0.0.0 |
288 |
and return; |
289 |
|
290 |
$whois =~ /^%ERROR:/m |
291 |
and return; |
292 |
|
293 |
#while ($whois =~ s/^\*(?:ac|tc):\s+(\S+)\n//m) { |
294 |
# $whois .= $self->whois_request("-FSTpn $1"); |
295 |
#} |
296 |
|
297 |
$whois =~ s/^\*(?:pn|nh|mb|ch|so|rz|ny|st|rm):.*\n//mg; |
298 |
|
299 |
$whois =~ s/\n+$//; |
300 |
|
301 |
$whois; |
302 |
} |
303 |
|
304 |
package netgeo; |
305 |
|
306 |
use Socket; |
307 |
use BerkeleyDB; |
308 |
|
309 |
sub ip2int($) { |
310 |
unpack "N", inet_aton $_[0]; |
311 |
} |
312 |
|
313 |
sub int2ip($) { |
314 |
inet_ntoa pack "N", $_[0]; |
315 |
} |
316 |
|
317 |
our %WHOIS; |
318 |
|
319 |
#$WHOIS{ARIN} = new Whois::ARIN ARIN => "whois.arin.net", port => 43, maxjobs => 12; |
320 |
$WHOIS{ARIN} = new Whois::RWHOIS ARIN => "rwhois.arin.net", port => 4321, maxjobs => 12; |
321 |
$WHOIS{RIPE} = new Whois::RIPE RIPE => "whois.ripe.net", port => 43, rflags => "-FTin ", maxjobs => 20; |
322 |
$WHOIS{APNIC} = new Whois::RIPE APNIC => "whois.apnic.net", port => 43, rflags => "-FTin ", maxjobs => 20; |
323 |
$WHOIS{LACNIC} = new Whois::RIPE LACNIC => "whois.lacnic.net", port => 43, maxjobs => 20; |
324 |
|
325 |
$whoislock = new Coro::SemaphoreSet; |
326 |
|
327 |
sub ip_request { |
328 |
my $ip = $_[0]; |
329 |
|
330 |
my $guard = $whoislock->guard($ip); |
331 |
|
332 |
my $c = $iprange->db_cursor; |
333 |
my $v; |
334 |
|
335 |
if (!$c->c_get((inet_aton $ip), $v, DB_SET_RANGE)) { |
336 |
my ($ip0, $ip1, $whois) = split /\x0/, $v; |
337 |
my $_ip = ip2int $ip; |
338 |
if ($ip0 <= $_ip && $_ip <= $ip1) { |
339 |
return $whois; |
340 |
} |
341 |
} |
342 |
|
343 |
my ($arin, $ripe, $apnic); |
344 |
|
345 |
$whois = $WHOIS{RIPE}->ip_request($ip) |
346 |
|| $WHOIS{APNIC} ->ip_request($ip) |
347 |
|| $WHOIS{ARIN} ->ip_request($ip) |
348 |
# || $WHOIS{LACNIC}->ip_request($ip) |
349 |
; |
350 |
|
351 |
$whois =~ /^\*in: ([0-9.]+)\s+-\s+([0-9.]+)\s*$/mi |
352 |
or do { warn "$whois($ip): no addresses found\n", last }; |
353 |
|
354 |
my ($ip0, $ip1) = ($1, $2); |
355 |
|
356 |
my $_ip = ip2int($ip); |
357 |
my $_ip0 = ip2int($ip0); |
358 |
my $_ip1 = ip2int($ip1); |
359 |
|
360 |
if ($_ip0 + 256 < $_ip1) { |
361 |
$_ip = $_ip & 0xffffff00; |
362 |
$_ip0 = $_ip if $_ip0 < $_ip; |
363 |
$_ip1 = $_ip + 255 if $_ip1 > $_ip + 255; |
364 |
} |
365 |
|
366 |
$iprange->db_put((pack "N", $_ip1), (join "\x0", $_ip0, $_ip1, $whois)); |
367 |
(tied %whois)->db_sync; |
368 |
$iprange->db_sync; |
369 |
|
370 |
$whois; |
371 |
} |
372 |
|
373 |
if (0) { |
374 |
#print ip_request "68.52.164.8"; # goof |
375 |
#print "\n\n"; |
376 |
#print ip_request "200.202.220.222"; # lacnic |
377 |
#print "\n\n"; |
378 |
#print ip_request "62.116.167.250"; |
379 |
#print "\n\n"; |
380 |
#print ip_request "133.11.128.254"; # jp |
381 |
#print "\n\n"; |
382 |
print ip_request "80.131.153.93"; |
383 |
print "\n\n"; |
384 |
} |
385 |
|
386 |
1; |
387 |
|
388 |
|