ViewVC Help
View File | Revision Log | Show Annotations | Download File
/cvs/Coro/myhttpd/netgeo.pl
Revision: 1.19
Committed: Sat Jan 23 21:27:51 2010 UTC (14 years, 6 months ago) by root
Content type: text/plain
Branch: MAIN
Changes since 1.18: +9 -1 lines
Log Message:
*** empty log message ***

File Contents

# Content
1 #!/usr/bin/perl
2
3 # APNIC refer: KRNIC (for 211.104.0.0)
4
5 use Socket;
6 use Fcntl;
7
8 use Coro;
9 use Coro::EV;
10 use Coro::Semaphore;
11 use Coro::SemaphoreSet;
12 use Coro::Socket;
13 use Coro::Timer;
14
15 use BerkeleyDB;
16
17 tie %netgeo::whois, BerkeleyDB::Btree,
18 -Env => $db_env,
19 -Filename => "whois",
20 -Flags => DB_CREATE,
21 or die "unable to create/open whois table";
22 $netgeo::iprange = new BerkeleyDB::Btree
23 -Env => $db_env,
24 -Filename => "iprange",
25 -Flags => DB_CREATE,
26 or die "unable to create/open iprange table";
27
28 sub clear_cache() {
29 %netgeo::whois = ();
30 $netgeo::iprange->truncate (my $dummy);
31 }
32
33 package Whois;
34
35 use Coro::EV;
36
37 sub new {
38 my $class = shift;
39 my $name = shift;
40 my $ip = shift;
41 my $self = bless { name => $name, ip => $ip, @_ }, $class;
42 $self->{maxjobs} = new Coro::Semaphore $self->{maxjobs} || 1;
43 $self;
44 }
45
46 sub ip {
47 $_[0]{ip};
48 }
49
50 sub sanitize {
51 $_[1];
52 }
53
54 sub whois_request {
55 my ($self, $query) = @_;
56
57 my $id = "$self->{name}\x0$query";
58 my $whois = $netgeo::whois{$id};
59
60 unless (defined $whois) {
61 print "WHOIS($self->{name},$query)\n";
62
63 my $guard = $self->{maxjobs}->guard;
64 my $timeout = 5;
65
66 while () {
67 my $fh = new Coro::Socket
68 PeerAddr => $self->ip,
69 PeerPort => $self->{port} || "whois",
70 Timeout => 30;
71 if ($fh) {
72 print $fh "$query\n";
73 $fh->read($whois, 16*1024); # max 16k. whois stored
74 close $fh;
75 $whois =~ s/\015?\012/\n/g;
76 $whois = $self->sanitize($whois);
77 if ($whois eq ""
78 or ($whois =~ /query limit/i && $whois =~ /exceeded/i) # ARIN
79 or ($whois =~ /wait a while and try again/i) # ARIN
80 or ($whois =~ /^%ERROR:202:/) # RIPE/APNIC
81 ) {
82 print "retrying in $timeout seconds\n";#d#
83 do_timer(desc => "timer2", after => $timeout);
84 $timeout *= 2;
85 $timeout = 1 if $timeout > 600;
86 } else {
87 last;
88 }
89 } else {
90 # only retry once a minute
91 print STDERR "unable to connect to $self->{ip} ($self->{name}), retrying...\n";
92 Coro::Timer::sleep 300;
93 }
94 }
95
96 $netgeo::whois{$id} = $whois;
97 }
98
99 $whois;
100 }
101
102 package Whois::ARIN;
103
104 use Date::Parse;
105
106 use base Whois;
107
108 sub sanitize {
109 local $_ = $_[1];
110 s/\n[\t ]{6,}([0-9.]+ - [0-9.]+)/ $1/g;
111 $_;
112 }
113
114 # there are only two problems with arin's whois database:
115 # a) the data cannot be trusted and often is old or even wrong
116 # b) the database format is nonparsable
117 # (no spaces between netname/ip and netnames can end in digits ;)
118 # of course, the only source to find out about global
119 # address distribution is... arin.
120 sub ip_request {
121 my ($self, $ip) = @_;
122
123 my $whois = $self->whois_request($ip);
124
125 return if $whois =~ /^No match/;
126
127 if ($whois =~ /^To single out one record/m) {
128 my $handle;
129 while ($whois =~ /\G\S.*\(([A-Z0-9\-]+)\).*\n/mg) {
130 $handle = $1;
131 #return if $handle =~ /-(RIPE|APNIC)/; # heuristic, but bad because ripe might not have better info
132 }
133 $handle or die "$whois ($ip): unparseable multimatch\n";
134 $whois = $self->whois_request("!$handle");
135 }
136
137 my ($address, $info, $coordinator, undef) = split /\n\n/, $whois;
138
139 $info =~ /^\s+Netname: (\S+)$/mi
140 or die "$whois($ip): no netname\n";
141 my $netname = $1;
142
143 $info =~ /^\s+Netblock: ([0-9.]+\s+-\s+[0-9.]+)\s*$/mi
144 or die "$whois($ip): no netblock\n";
145 my $netblock = $1;
146
147 my $maintainer;
148
149 if ($info =~ /^\s+Maintainer: (\S+)\s*$/mi) {
150 $maintainer = "*ma: $1\n";
151 return if $1 =~ /^(?:AP|RIPE)$/;
152 }
153
154 $coordinator =~ s/^\s+Coordinator:\s*//si
155 or $coordinator = "";
156
157 $address =~ s/\n\s*(\S+)$//
158 or die "$whois($ip): no parseable country ($address)\n";
159 my $country = $1;
160
161 $address =~ s/^\s*/*de: /mg;
162 $coordinator =~ s/^\s*/*ad: /mg;
163
164 $whois = <<EOF;
165 *in: $netblock
166 *na: $netname
167 *cy: $country
168 $maintainer$address
169 $coordinator
170 EOF
171 $whois =~ s/\n+$//;
172 $whois;
173 }
174
175 package Whois::RIPE;
176
177 use Socket;
178 use base Whois;
179
180 sub sanitize {
181 local $_ = $_[1];
182
183 s/^%.*\n//gm;
184 s/^\n+//;
185 s/\n*$/\n/;
186
187 s/^inetnum:\s+/*in: /gm;
188 s/^admin-c:\s+/*ac: /gm;
189 s/^tech-c:\s+/*tc: /gm;
190 s/^owner-c:\s+/*oc: /gm;
191 s/^country:\s+/*cy: /gm;
192 s/^phone:\s+/*ph: /gm;
193 s/^remarks:\s+/*rm: /gm;
194 s/^changed:\s+/*ch: /gm;
195 s/^created:\s+/*cr: /gm;
196 s/^address:\s+/*ad: /gm;
197 s/^status:\s+/*st: /gm;
198 s/^inetrev:\s+/*ir: /gm;
199 s/^nserver:\s+/*ns: /gm;
200
201 $_;
202 }
203
204 sub ip_request {
205 my ($self, $ip) = @_;
206
207 my $whois = $self->whois_request("$self->{rflags}$ip");
208
209 $whois =~ s{
210 (2[0-5][0-9]|1[0-9][0-9]|[1-9][0-9]|[0-9])
211 (?:\.
212 (2[0-5][0-9]|1[0-9][0-9]|[1-9][0-9]|[0-9])
213 (?:\.
214 (2[0-5][0-9]|1[0-9][0-9]|[1-9][0-9]|[0-9])
215 (?:\.
216 (2[0-5][0-9]|1[0-9][0-9]|[1-9][0-9]|[0-9])
217 )?
218 )?
219 )?
220 /
221 ([0-9]+)
222 }{
223 my $ip = inet_aton sprintf "%d.%d.%d.%d", $1, $2, $3, $4;
224 my $net = 1 << (31 - $5);
225 my $mask = inet_aton 2 ** 32 - $net;
226
227 my $ip1 = $ip & $mask;
228 my $ip2 = $ip1 | inet_aton $net * 2 - 1;
229 (inet_ntoa $ip1) . " - " . (inet_ntoa $ip2);
230 }gex;
231
232 $whois =~ /^\*in: 0\.0\.0\.0 - 255\.255\.255\.255/
233 and return;
234
235 $whois =~ /^\*de: This network range is not allocated to /m # APINIC e.g. 24.0.0.0
236 and return;
237
238 $whois =~ /^\*de: Not allocated by APNIC/m # APINIC e.g. 189.47.24.97
239 and return;
240
241 $whois =~ /^\*ac: XXX0/m # 192.0.0.0
242 and return;
243
244 $whois =~ /^\*st: (?:ALLOCATED )?UNSPECIFIED/m
245 and return;
246
247 $whois =~ /^%ERROR:/m
248 and return;
249
250 #while ($whois =~ s/^\*(?:ac|tc):\s+(\S+)\n//m) {
251 # $whois .= $self->whois_request("-FSTpn $1");
252 #}
253
254 #$whois =~ s/^\*(?:pn|nh|mb|ch|so|rz|ny|st|rm):.*\n//mg;
255
256 $whois =~ s/\n+$//;
257
258 $whois;
259 }
260
261 package Whois::RWHOIS;
262
263 use base Whois;
264
265 sub sanitize {
266 local $_ = $_[1];
267 s/^%referral\s+/referral:/gm;
268 s/^network://gm;
269 s/^%.*\n//gm;
270 s/^\n+//m;
271 s/\n*$/\n/m;
272
273 s/^(\S+):\s*/\L$1: /gm;
274 s/^ip-network-block:/*in:/gm;
275 s/^country-code:/*cy:/gm;
276 s/^tech-contact;i:/*tc:/gm;
277 s/^updated:/*ch:/gm;
278 s/^street-address:/*ad:/gm;
279 s/^org-name:/*rm:/gm;
280 s/^created:/*cr:/gm;
281
282 $_;
283 }
284
285 sub ip_request {
286 my ($self, $ip) = @_;
287
288 my $whois = $self->whois_request("$ip");
289
290 $whois =~ /^\*in: 0\.0\.0\.0 - 255\.255\.255\.255/
291 and return;
292
293 $whois =~ /^\*ac: XXX0/m # 192.0.0.0
294 and return;
295
296 $whois =~ /^%ERROR:/m
297 and return;
298
299 #while ($whois =~ s/^\*(?:ac|tc):\s+(\S+)\n//m) {
300 # $whois .= $self->whois_request("-FSTpn $1");
301 #}
302
303 $whois =~ s/^\*(?:pn|nh|mb|ch|so|rz|ny|st|rm):.*\n//mg;
304
305 $whois =~ s/\n+$//;
306
307 $whois;
308 }
309
310 package netgeo;
311
312 use Socket;
313 use BerkeleyDB;
314
315 sub ip2int($) {
316 unpack "N", inet_aton $_[0];
317 }
318
319 sub int2ip($) {
320 inet_ntoa pack "N", $_[0];
321 }
322
323 our %WHOIS;
324
325 #$WHOIS{ARIN} = new Whois::ARIN ARIN => "whois.arin.net", port => 43, maxjobs => 12;
326 $WHOIS{ARIN} = new Whois::RWHOIS ARIN => "rwhois.arin.net", port => 4321, maxjobs => 12;
327 $WHOIS{RIPE} = new Whois::RIPE RIPE => "whois.ripe.net", port => 43, rflags => "-FTin ", maxjobs => 20;
328 $WHOIS{APNIC} = new Whois::RIPE APNIC => "whois.apnic.net", port => 43, rflags => "-FTin ", maxjobs => 20;
329 $WHOIS{LACNIC} = new Whois::RIPE LACNIC => "whois.lacnic.net", port => 43, maxjobs => 20;
330
331 $whoislock = new Coro::SemaphoreSet;
332
333 sub ip_request {
334 my $ip = $_[0];
335
336 my $guard = $whoislock->guard($ip);
337
338 my $c = $iprange->db_cursor;
339 my $v;
340
341 if (!$c->c_get((inet_aton $ip), $v, DB_SET_RANGE)) {
342 my ($ip0, $ip1, $whois) = split /\x0/, $v;
343 my $_ip = ip2int $ip;
344 if ($ip0 <= $_ip && $_ip <= $ip1) {
345 return $whois;
346 }
347 }
348
349 my ($arin, $ripe, $apnic);
350
351 $whois = $WHOIS{RIPE}->ip_request($ip)
352 || $WHOIS{APNIC} ->ip_request($ip)
353 || $WHOIS{ARIN} ->ip_request($ip)
354 || $WHOIS{LACNIC}->ip_request($ip)
355 ;
356
357 $whois =~ /^\*in: ([0-9.]+)\s+-\s+([0-9.]+)\s*$/mi
358 or do { warn "$whois($ip): no addresses found\n", last };
359
360 my ($ip0, $ip1) = ($1, $2);
361
362 my $_ip = ip2int($ip);
363 my $_ip0 = ip2int($ip0);
364 my $_ip1 = ip2int($ip1);
365
366 if ($_ip0 + 256 < $_ip1) {
367 $_ip = $_ip & 0xffffff00;
368 $_ip0 = $_ip if $_ip0 < $_ip;
369 $_ip1 = $_ip + 255 if $_ip1 > $_ip + 255;
370 }
371
372 $iprange->db_put((pack "N", $_ip1), (join "\x0", $_ip0, $_ip1, $whois));
373 (tied %whois)->db_sync;
374 $iprange->db_sync;
375
376 $whois;
377 }
378
379 if (0) {
380 #print ip_request "68.52.164.8"; # goof
381 #print "\n\n";
382 #print ip_request "200.202.220.222"; # lacnic
383 #print "\n\n";
384 #print ip_request "62.116.167.250";
385 #print "\n\n";
386 #print ip_request "133.11.128.254"; # jp
387 #print "\n\n";
388 print ip_request "80.131.153.93";
389 print "\n\n";
390 }
391
392 1;
393
394