ViewVC Help
View File | Revision Log | Show Annotations | Download File
/cvs/Coro/myhttpd/netgeo.pl
Revision: 1.16
Committed: Sat Sep 17 20:21:11 2005 UTC (18 years, 10 months ago) by root
Content type: text/plain
Branch: MAIN
Changes since 1.15: +3 -2 lines
Log Message:
*** empty log message ***

File Contents

# User Rev Content
1 root 1.1 #!/usr/bin/perl
2    
3     # APNIC refer: KRNIC (for 211.104.0.0)
4    
5     use Socket;
6     use Fcntl;
7    
8     use Coro;
9     use Coro::Event;
10     use Coro::Semaphore;
11 root 1.6 use Coro::SemaphoreSet;
12 root 1.1 use Coro::Socket;
13 root 1.13 use Coro::Timer;
14 root 1.1
15 root 1.7 use BerkeleyDB;
16    
# Exceptions escaping an Event callback are reported verbosely; the event
# loop itself is left running (the unloop call stays disabled).
$Event::DIED = sub {
    Event::verbose_exception_handler(@_);
    #Event::unloop_all();
};

# Cache of raw whois replies, used by Whois::whois_request
# (keyed by "<server name>\0<query>").
tie %netgeo::whois, "BerkeleyDB::Btree",
    -Env      => $db_env,
    -Filename => "whois",
    -Flags    => DB_CREATE
    or die "unable to create/open whois table";

# Address-range table used by netgeo::ip_request
# (keyed by the packed end address of each range).
$netgeo::iprange = BerkeleyDB::Btree->new(
    -Env      => $db_env,
    -Filename => "iprange",
    -Flags    => DB_CREATE,
) or die "unable to create/open iprange table";
32    
33 root 1.1 package Whois;
34    
35     use Coro::Event;
36    
# Constructor: CLASS->new($name, $ip, key => value, ...)
#
# $name labels the server (it is used in cache keys and log output by
# whois_request), $ip is what whois_request connects to.  Any further
# key/value pairs are stored in the object as-is, except that "maxjobs"
# is replaced by a Coro::Semaphore created with that count (1 when the
# option is missing or false).
sub new {
    my ($class, $name, $ip, @options) = @_;

    my $self = bless { name => $name, ip => $ip, @options }, $class;
    $self->{maxjobs} = Coro::Semaphore->new($self->{maxjobs} || 1);

    return $self;
}
45    
# Accessor for the address given to the constructor.
sub ip {
    my ($self) = @_;
    return $self->{ip};
}
49    
# Default reply filter: hands the reply text back untouched.
# Subclasses override this to normalise their server's output.
sub sanitize {
    my (undef, $text) = @_;
    return $text;
}
53    
# Send $query to this whois server and return the sanitized reply.
#
# Replies are cached in %netgeo::whois under "<name>\0<query>"; a cached
# reply is returned without any network traffic.  Otherwise the query is
# repeated until the server delivers a usable answer:
#   - empty or rate-limited/error replies are retried after a delay that
#     starts at 5 seconds, doubles each time and drops back to 1 once it
#     exceeds 600;
#   - a failed connect is retried after sleeping 300 seconds.
# The maxjobs semaphore guard is held for the whole fetch.
sub whois_request {
    my ($self, $query) = @_;

    my $id = "$self->{name}\x0$query";
    my $whois = $netgeo::whois{$id};

    return $whois if defined $whois;

    print "WHOIS($self->{name},$query)\n";

    my $guard = $self->{maxjobs}->guard;
    my $timeout = 5;

    ATTEMPT: while (1) {
        my $fh = Coro::Socket->new(
            PeerAddr => $self->ip,
            PeerPort => $self->{port} || "whois",
            Timeout  => 30,
        );

        unless ($fh) {
            # connect failed: back off for 300 seconds before trying again
            print STDERR "unable to connect to $self->{ip} ($self->{name}), retrying...\n";
            Coro::Timer::sleep(300);
            next ATTEMPT;
        }

        print $fh "$query\n";
        $fh->read($whois, 16*1024); # at most 16k of whois data is kept
        close $fh;

        $whois =~ s/\015?\012/\n/g; # normalise line endings
        $whois = $self->sanitize($whois);

        my $must_retry = $whois eq ""
            || ($whois =~ /query limit/i && $whois =~ /exceeded/i) # ARIN
            || $whois =~ /wait a while and try again/i             # ARIN
            || $whois =~ /^%ERROR:202:/;                           # RIPE/APNIC

        last ATTEMPT unless $must_retry;

        print "retrying in $timeout seconds\n";#d#
        do_timer(desc => "timer2", after => $timeout);
        $timeout *= 2;
        $timeout = 1 if $timeout > 600;
    }

    $netgeo::whois{$id} = $whois;

    return $whois;
}
101    
102     package Whois::ARIN;
103    
104     use Date::Parse;
105    
106     use base Whois;
107    
# Join an address range that was wrapped onto its own, deeply indented
# (six or more blanks/tabs) continuation line back onto the previous line.
sub sanitize {
    my (undef, $text) = @_;
    $text =~ s/\n[\t ]{6,}([0-9.]+ - [0-9.]+)/ $1/g;
    return $text;
}
113    
114     # there are only two problems with arin's whois database:
115     # a) the data cannot be trusted and often is old or even wrong
116     # b) the database format is nonparsable
117     # (no spaces between netname/ip and netnames can end in digits ;)
118     # of course, the only source to find out about global
119     # address distribution is... arin.
# Look up $ip on this (classic ARIN format) server and return the record
# rewritten into "*xx: value" lines (*in, *na, *cy, optional *ma, *de, *ad).
#
# Returns nothing when the server has no match, reports the range as not
# allocated, or names AP or RIPE as maintainer.  Dies when the reply cannot
# be parsed (no handle in a multi-match list, no netname, netblock or
# country).
sub ip_request {
    my ($self, $ip) = @_;

    my $whois = $self->whois_request($ip);

    return if $whois =~ /^No match/;
    return if $whois =~ /^\*de: This network range is not allocated to /; # APNIC e.g. 24.0.0.0

    if ($whois =~ /^To single out one record/m) {
        # several records matched: walk the leading list of "... (HANDLE) ..."
        # lines and query again for the last handle listed
        my $handle;
        $handle = $1 while $whois =~ /\G\S.*\(([A-Z0-9\-]+)\).*\n/mg;
        #return if $handle =~ /-(RIPE|APNIC)/; # heuristic, but bad because ripe might not have better info
        die "$whois ($ip): unparseable multimatch\n" unless $handle;
        $whois = $self->whois_request("!$handle");
    }

    # the first three blank-line separated paragraphs of the reply
    my ($address, $info, $coordinator, undef) = split /\n\n/, $whois;

    $info =~ /^\s+Netname: (\S+)$/mi
        or die "$whois($ip): no netname\n";
    my $netname = $1;

    $info =~ /^\s+Netblock: ([0-9.]+\s+-\s+[0-9.]+)\s*$/mi
        or die "$whois($ip): no netblock\n";
    my $netblock = $1;

    my $maintainer;

    if ($info =~ /^\s+Maintainer: (\S+)\s*$/mi) {
        my $who = $1;
        $maintainer = "*ma: $who\n";
        return if $who =~ /^(?:AP|RIPE)$/;
    }

    $coordinator =~ s/^\s+Coordinator:\s*//si
        or $coordinator = "";

    # the last line of the address paragraph is taken as the country
    $address =~ s/\n\s*(\S+)$//
        or die "$whois($ip): no parseable country ($address)\n";
    my $country = $1;

    $address     =~ s/^\s*/*de: /mg;
    $coordinator =~ s/^\s*/*ad: /mg;

    $whois = <<EOF;
*in: $netblock
*na: $netname
*cy: $country
$maintainer$address
$coordinator
EOF
    $whois =~ s/\n+$//;

    return $whois;
}
175    
176     package Whois::RIPE;
177    
178 root 1.10 use Socket;
179 root 1.1 use base Whois;
180    
# Normalise a RIPE-style reply: drop "%" comment lines and leading blank
# lines, end the text with exactly one newline, and abbreviate the known
# attribute names to the two-letter "*xx: " form.
sub sanitize {
    my (undef, $text) = @_;

    $text =~ s/^%.*\n//gm;
    $text =~ s/^\n+//;
    $text =~ s/\n*$/\n/;

    # long attribute name => short tag
    my @tags = (
        "inetnum" => "in",
        "admin-c" => "ac",
        "tech-c"  => "tc",
        "owner-c" => "oc",
        "country" => "cy",
        "phone"   => "ph",
        "remarks" => "rm",
        "changed" => "ch",
        "created" => "cr",
        "address" => "ad",
        "status"  => "st",
        "inetrev" => "ir",
        "nserver" => "ns",
    );

    while (my ($long, $short) = splice @tags, 0, 2) {
        $text =~ s/^\Q$long\E:\s+/*${short}: /gm;
    }

    return $text;
}
204    
# Turn one "a[.b[.c[.d]]]/len" match into "first - last" dotted quads.
# $text is the matched text, $len the prefix length, @octets the up to
# four captured octets (missing trailing ones are undef and count as 0).
# Text that cannot be an IPv4 prefix (length above 32 or an octet above
# 255) is returned unchanged.
sub _cidr_to_range {
    my ($text, $len, @octets) = @_;

    my @quad = map { defined $_ ? $_ : 0 } @octets;

    return $text if $len > 32 or grep { $_ > 255 } @quad;

    my $addr     = unpack "N", pack "C4", @quad;
    my $hostmask = 2 ** (32 - $len) - 1;   # all host bits set
    my $first    = $addr & ~$hostmask;     # clear the host bits
    my $last     = $first | $hostmask;

    return inet_ntoa(pack "N", $first) . " - " . inet_ntoa(pack "N", $last);
}

# Look up $ip on this (RIPE format) server, using the "rflags" option as
# query prefix, and return the sanitized record without trailing newlines.
#
# Networks written in CIDR form (including shortened forms such as
# "200.202/16") are rewritten as "first - last" ranges.  The start address
# is always the real network address, even when the written address has
# host bits set, and slash-separated numbers that are no valid prefix are
# left alone instead of aborting the lookup.
#
# Returns nothing for the catch-all 0.0.0.0 - 255.255.255.255 record,
# "XXX0" admin contacts, UNSPECIFIED status and error replies.
sub ip_request {
    my ($self, $ip) = @_;

    my $whois = $self->whois_request("$self->{rflags}$ip");

    my $octet = qr/2[0-5][0-9]|1[0-9][0-9]|[1-9][0-9]|[0-9]/;

    $whois =~ s{
        (                           # group 1: the entire match
            ($octet)
            (?: \. ($octet)
                (?: \. ($octet)
                    (?: \. ($octet) )?
                )?
            )?
            /
            ([0-9]+)                # group 6: prefix length
        )
    }{ _cidr_to_range($1, $6, $2, $3, $4, $5) }gex;

    $whois =~ /^\*in: 0\.0\.0\.0 - 255\.255\.255\.255/
        and return;

    $whois =~ /^\*ac: XXX0/m # 192.0.0.0
        and return;

    $whois =~ /^\*st: (?:ALLOCATED )?UNSPECIFIED/m
        and return;

    $whois =~ /^%ERROR:/m
        and return;

    #while ($whois =~ s/^\*(?:ac|tc):\s+(\S+)\n//m) {
    #   $whois .= $self->whois_request("-FSTpn $1");
    #}

    #$whois =~ s/^\*(?:pn|nh|mb|ch|so|rz|ny|st|rm):.*\n//mg;

    $whois =~ s/\n+$//;

    return $whois;
}
255    
256     package Whois::RWHOIS;
257    
258     use base Whois;
259    
# Normalise an rwhois reply into the "*xx: value" form used by the other
# whois classes:
#   - "%referral" lines become "referral:" attributes, the "network:"
#     prefix and all remaining "%" lines are dropped;
#   - leading blank lines are removed and the text ends in one newline
#     (same trimming as Whois::RIPE::sanitize; blank lines inside the
#     reply are kept);
#   - attribute names are lowercased, followed by exactly one blank, and
#     the known ones are abbreviated to their two-letter tags.
sub sanitize {
    my (undef, $text) = @_;

    $text =~ s/^%referral\s+/referral:/gm;
    $text =~ s/^network://gm;
    $text =~ s/^%.*\n//gm;

    # anchored at the start/end of the whole text, not at every line
    $text =~ s/^\n+//;
    $text =~ s/\n*$/\n/;

    $text =~ s/^(\S+):\s*/\L$1: /gm;
    $text =~ s/^ip-network-block:/*in:/gm;
    $text =~ s/^country-code:/*cy:/gm;
    $text =~ s/^tech-contact;i:/*tc:/gm;
    $text =~ s/^updated:/*ch:/gm;
    $text =~ s/^street-address:/*ad:/gm;
    $text =~ s/^org-name:/*rm:/gm;
    $text =~ s/^created:/*cr:/gm;

    return $text;
}
279    
# Look up $ip on this rwhois server and return the sanitized record with
# the *pn, *nh, *mb, *ch, *so, *rz, *ny, *st and *rm lines and any trailing
# newlines removed.
#
# Returns nothing for the catch-all 0.0.0.0 - 255.255.255.255 record,
# "XXX0" admin contacts and error replies.
sub ip_request {
    my ($self, $ip) = @_;

    my $whois = $self->whois_request("$ip");

    my @reject = (
        qr/^\*in: 0\.0\.0\.0 - 255\.255\.255\.255/,
        qr/^\*ac: XXX0/m, # 192.0.0.0
        qr/^%ERROR:/m,
    );
    for my $pattern (@reject) {
        return if $whois =~ $pattern;
    }

    #while ($whois =~ s/^\*(?:ac|tc):\s+(\S+)\n//m) {
    #   $whois .= $self->whois_request("-FSTpn $1");
    #}

    $whois =~ s/^\*(?:pn|nh|mb|ch|so|rz|ny|st|rm):.*\n//mg;
    $whois =~ s/\n+$//;

    return $whois;
}
304    
305 root 1.4 package netgeo;
306    
307     use Socket;
308 root 1.8 use BerkeleyDB;
309 root 1.1
# Dotted-quad address (anything inet_aton accepts) => unsigned 32-bit integer.
sub ip2int($) {
    my ($address) = @_;
    return unpack "N", inet_aton $address;
}
313    
# Unsigned 32-bit integer => dotted-quad address string.
sub int2ip($) {
    my ($number) = @_;
    return inet_ntoa pack "N", $number;
}
317    
# Whois clients, one per registry; netgeo::ip_request consults them by name.
our %WHOIS;

#$WHOIS{ARIN} = new Whois::ARIN ARIN => "whois.arin.net", port => 43, maxjobs => 12;
$WHOIS{ARIN}   = Whois::RWHOIS->new(ARIN   => "rwhois.arin.net",  port => 4321, maxjobs => 12);
$WHOIS{RIPE}   = Whois::RIPE->new(  RIPE   => "whois.ripe.net",   port => 43, rflags => "-FTin ", maxjobs => 20);
$WHOIS{APNIC}  = Whois::RIPE->new(  APNIC  => "whois.apnic.net",  port => 43, rflags => "-FTin ", maxjobs => 20);
$WHOIS{LACNIC} = Whois::RIPE->new(  LACNIC => "whois.lacnic.net", port => 43, maxjobs => 20);

# Semaphore set from which netgeo::ip_request takes a guard per address.
$whoislock = Coro::SemaphoreSet->new;
327    
# Return the whois record covering $ip.
#
# The iprange table is consulted first: entries are keyed by the packed
# end address of a range and hold "start\0end\0whois", so the first key at
# or after $ip is the only candidate.  On a miss RIPE, APNIC and ARIN are
# asked in that order, and the first non-empty answer is stored and
# returned.  Ranges spanning more than 256 addresses are stored only for
# the /24 around $ip.
#
# When no registry delivers a record with a parseable "*in:" range, a
# warning is printed and whatever text was obtained (possibly nothing) is
# returned without being stored in the range table.
sub ip_request {
    my $ip = $_[0];

    # held until this sub returns; presumably serialises lookups of the
    # same address -- see Coro::SemaphoreSet
    my $guard = $whoislock->guard($ip);

    my $c = $iprange->db_cursor;
    my $v;

    if (!$c->c_get((inet_aton $ip), $v, DB_SET_RANGE)) {
        my ($ip0, $ip1, $whois) = split /\x0/, $v;
        my $_ip = ip2int $ip;
        if ($ip0 <= $_ip && $_ip <= $ip1) {
            return $whois;
        }
    }

    # lexical, so the result is not kept in a package global shared by
    # every coroutine
    my $whois = $WHOIS{RIPE}  ->ip_request($ip)
             || $WHOIS{APNIC} ->ip_request($ip)
             || $WHOIS{ARIN}  ->ip_request($ip)
#            || $WHOIS{LACNIC}->ip_request($ip)
             ;

    unless ($whois =~ /^\*in: ([0-9.]+)\s+-\s+([0-9.]+)\s*$/mi) {
        warn "$whois($ip): no addresses found\n";
        return $whois;
    }

    my ($ip0, $ip1) = ($1, $2);

    my $_ip  = ip2int($ip);
    my $_ip0 = ip2int($ip0);
    my $_ip1 = ip2int($ip1);

    if ($_ip0 + 256 < $_ip1) {
        # large range: clamp it to the /24 containing $ip
        $_ip  = $_ip & 0xffffff00;
        $_ip0 = $_ip       if $_ip0 < $_ip;
        $_ip1 = $_ip + 255 if $_ip1 > $_ip + 255;
    }

    $iprange->db_put((pack "N", $_ip1), (join "\x0", $_ip0, $_ip1, $whois));
    (tied %whois)->db_sync;
    $iprange->db_sync;

    return $whois;
}
373    
# Manual smoke test, disabled; change the condition to run one lookup
# when this file is loaded.
if (0) {
    #print ip_request "68.52.164.8"; # goof
    #print "\n\n";
    #print ip_request "200.202.220.222"; # lacnic
    #print "\n\n";
    #print ip_request "62.116.167.250";
    #print "\n\n";
    #print ip_request "133.11.128.254"; # jp
    #print "\n\n";
    print ip_request("80.131.153.93");
    print "\n\n";
}

# true value for the file that loads this one
1;
388 root 1.1
389