ViewVC Help
View File | Revision Log | Show Annotations | Download File
/cvs/Coro/myhttpd/netgeo.pl
(Generate patch)

Comparing Coro/myhttpd/netgeo.pl (file contents):
Revision 1.4 by root, Tue Aug 28 02:30:49 2001 UTC vs.
Revision 1.16 by root, Sat Sep 17 20:21:11 2005 UTC

6use Fcntl; 6use Fcntl;
7 7
8use Coro; 8use Coro;
9use Coro::Event; 9use Coro::Event;
10use Coro::Semaphore; 10use Coro::Semaphore;
11use Coro::SemaphoreSet;
11use Coro::Socket; 12use Coro::Socket;
13use Coro::Timer;
14
15use BerkeleyDB;
12 16
13$Event::DIED = sub { 17$Event::DIED = sub {
14 Event::verbose_exception_handler(@_); 18 Event::verbose_exception_handler(@_);
15 #Event::unloop_all(); 19 #Event::unloop_all();
16}; 20};
60 my $timeout = 5; 64 my $timeout = 5;
61 65
62 while () { 66 while () {
63 my $fh = new Coro::Socket 67 my $fh = new Coro::Socket
64 PeerAddr => $self->ip, 68 PeerAddr => $self->ip,
65 PeerPort => 'whois', 69 PeerPort => $self->{port} || "whois",
66 Timeout => 30; 70 Timeout => 30;
67 if ($fh) { 71 if ($fh) {
68 print $fh "$query\n"; 72 print $fh "$query\n";
69 $fh->read($whois, 16*1024); # max 16k. whois stored 73 $fh->read($whois, 16*1024); # max 16k. whois stored
70 close $fh; 74 close $fh;
80 $timeout *= 2; 84 $timeout *= 2;
81 $timeout = 1 if $timeout > 600; 85 $timeout = 1 if $timeout > 600;
82 } else { 86 } else {
83 last; 87 last;
84 } 88 }
89 } else {
90 # only retry once a minute
91 print STDERR "unable to connect to $self->{ip} ($self->{name}), retrying...\n";
92 Coro::Timer::sleep 300;
85 } 93 }
86 } 94 }
87 95
88 $netgeo::whois{$id} = $whois; 96 $netgeo::whois{$id} = $whois;
89 } 97 }
112sub ip_request { 120sub ip_request {
113 my ($self, $ip) = @_; 121 my ($self, $ip) = @_;
114 122
115 my $whois = $self->whois_request($ip); 123 my $whois = $self->whois_request($ip);
116 124
117 return () if $whois =~ /^No match/; 125 return if $whois =~ /^No match/;
126 return if $whois =~ /^\*de: This network range is not allocated to /; # APINIC e.g. 24.0.0.0
118 127
119 if ($whois =~ /^To single out one record/m) { 128 if ($whois =~ /^To single out one record/m) {
120 my $handle; 129 my $handle;
121 while ($whois =~ /\G\S.*\(([A-Z0-9\-]+)\).*\n/mg) { 130 while ($whois =~ /\G\S.*\(([A-Z0-9\-]+)\).*\n/mg) {
122 $handle = $1; 131 $handle = $1;
123 #return if $handle =~ /-(RIPE|APNIC)/; # heuristic, bbut bad because ripe might not have better info 132 #return if $handle =~ /-(RIPE|APNIC)/; # heuristic, but bad because ripe might not have better info
124 } 133 }
125 $handle or die "$whois ($ip): unparseable multimatch\n"; 134 $handle or die "$whois ($ip): unparseable multimatch\n";
126 $whois = $self->whois_request("!$handle"); 135 $whois = $self->whois_request("!$handle");
127 } 136 }
128 137
164 $whois; 173 $whois;
165} 174}
166 175
167package Whois::RIPE; 176package Whois::RIPE;
168 177
178use Socket;
169use base Whois; 179use base Whois;
170 180
171sub sanitize { 181sub sanitize {
172 local $_ = $_[1]; 182 local $_ = $_[1];
183
173 s/^%.*\n//gm; 184 s/^%.*\n//gm;
174 s/^\n+//; 185 s/^\n+//;
175 s/\n*$/\n/; 186 s/\n*$/\n/;
187
188 s/^inetnum:\s+/*in: /gm;
189 s/^admin-c:\s+/*ac: /gm;
190 s/^tech-c:\s+/*tc: /gm;
191 s/^owner-c:\s+/*oc: /gm;
192 s/^country:\s+/*cy: /gm;
193 s/^phone:\s+/*ph: /gm;
194 s/^remarks:\s+/*rm: /gm;
195 s/^changed:\s+/*ch: /gm;
196 s/^created:\s+/*cr: /gm;
197 s/^address:\s+/*ad: /gm;
198 s/^status:\s+/*st: /gm;
199 s/^inetrev:\s+/*ir: /gm;
200 s/^nserver:\s+/*ns: /gm;
201
176 $_; 202 $_;
177} 203}
178 204
179sub ip_request { 205sub ip_request {
180 my ($self, $ip) = @_; 206 my ($self, $ip) = @_;
181 207
182 my $whois = $self->whois_request("-FSTin $ip"); 208 my $whois = $self->whois_request("$self->{rflags}$ip");
209
210 $whois =~ s{
211 (2[0-5][0-9]|1[0-9][0-9]|[1-9][0-9]|[0-9])
212 (?:\.
213 (2[0-5][0-9]|1[0-9][0-9]|[1-9][0-9]|[0-9])
214 (?:\.
215 (2[0-5][0-9]|1[0-9][0-9]|[1-9][0-9]|[0-9])
216 (?:\.
217 (2[0-5][0-9]|1[0-9][0-9]|[1-9][0-9]|[0-9])
218 )?
219 )?
220 )?
221 /
222 ([0-9]+)
223 }{
224 my $ip = inet_aton sprintf "%d.%d.%d.%d", $1, $2, $3, $4;
225 my $net = 1 << (31 - $5);
226 my $mask = inet_aton 2 ** 32 - $net;
227
228 my $ip1 = $ip & $mask;
229 my $ip2 = $ip1 | inet_aton $net * 2 - 1;
230 (inet_ntoa $ip1) . " - " . (inet_ntoa $ip2);
231 }gex;
183 232
184 $whois =~ /^\*in: 0\.0\.0\.0 - 255\.255\.255\.255/ 233 $whois =~ /^\*in: 0\.0\.0\.0 - 255\.255\.255\.255/
185 and return; 234 and return;
186 235
187 $whois =~ /^\*ac: XXX0/m # 192.0.0.0 236 $whois =~ /^\*ac: XXX0/m # 192.0.0.0
237 and return;
238
239 $whois =~ /^\*st: (?:ALLOCATED )?UNSPECIFIED/m
188 and return; 240 and return;
189 241
190 $whois =~ /^%ERROR:/m 242 $whois =~ /^%ERROR:/m
191 and return; 243 and return;
192 244
193 #while ($whois =~ s/^\*(?:ac|tc):\s+(\S+)\n//m) { 245 #while ($whois =~ s/^\*(?:ac|tc):\s+(\S+)\n//m) {
194 # $whois .= $self->whois_request("-FSTpn $1"); 246 # $whois .= $self->whois_request("-FSTpn $1");
195 #} 247 #}
196 248
249 #$whois =~ s/^\*(?:pn|nh|mb|ch|so|rz|ny|st|rm):.*\n//mg;
250
251 $whois =~ s/\n+$//;
252
253 $whois;
254}
255
256package Whois::RWHOIS;
257
258use base Whois;
259
260sub sanitize {
261 local $_ = $_[1];
262 s/^%referral\s+/referral:/gm;
263 s/^network://gm;
264 s/^%.*\n//gm;
265 s/^\n+//m;
266 s/\n*$/\n/m;
267
268 s/^(\S+):\s*/\L$1: /gm;
269 s/^ip-network-block:/*in:/gm;
270 s/^country-code:/*cy:/gm;
271 s/^tech-contact;i:/*tc:/gm;
272 s/^updated:/*ch:/gm;
273 s/^street-address:/*ad:/gm;
274 s/^org-name:/*rm:/gm;
275 s/^created:/*cr:/gm;
276
277 $_;
278}
279
280sub ip_request {
281 my ($self, $ip) = @_;
282
283 my $whois = $self->whois_request("$ip");
284
285 $whois =~ /^\*in: 0\.0\.0\.0 - 255\.255\.255\.255/
286 and return;
287
288 $whois =~ /^\*ac: XXX0/m # 192.0.0.0
289 and return;
290
291 $whois =~ /^%ERROR:/m
292 and return;
293
294 #while ($whois =~ s/^\*(?:ac|tc):\s+(\S+)\n//m) {
295 # $whois .= $self->whois_request("-FSTpn $1");
296 #}
297
197 $whois =~ s/^\*(?:pn|nh|mb|ch|so|rz|ny|st|rm):.*\n//mg; 298 $whois =~ s/^\*(?:pn|nh|mb|ch|so|rz|ny|st|rm):.*\n//mg;
198 299
199 $whois =~ s/\n+$//; 300 $whois =~ s/\n+$//;
200 301
201 $whois; 302 $whois;
202} 303}
203 304
204package netgeo; 305package netgeo;
205 306
307use Socket;
206use BerkeleyDB; 308use BerkeleyDB;
207use Socket;
208 309
209sub ip2int($) { 310sub ip2int($) {
210 unpack "N", inet_aton $_[0]; 311 unpack "N", inet_aton $_[0];
211} 312}
212 313
214 inet_ntoa pack "N", $_[0]; 315 inet_ntoa pack "N", $_[0];
215} 316}
216 317
217our %WHOIS; 318our %WHOIS;
218 319
219$WHOIS{ARIN} = new Whois::ARIN ARIN => "whois.arin.net", maxjobs => 12; 320#$WHOIS{ARIN} = new Whois::ARIN ARIN => "whois.arin.net", port => 43, maxjobs => 12;
321$WHOIS{ARIN} = new Whois::RWHOIS ARIN => "rwhois.arin.net", port => 4321, maxjobs => 12;
220$WHOIS{RIPE} = new Whois::RIPE RIPE => "whois.ripe.net", maxjobs => 20; 322$WHOIS{RIPE} = new Whois::RIPE RIPE => "whois.ripe.net", port => 43, rflags => "-FTin ", maxjobs => 20;
323$WHOIS{APNIC} = new Whois::RIPE APNIC => "whois.apnic.net", port => 43, rflags => "-FTin ", maxjobs => 20;
221$WHOIS{APNIC} = new Whois::RIPE APNIC => "whois.apnic.net", maxjobs => 20; 324$WHOIS{LACNIC} = new Whois::RIPE LACNIC => "whois.lacnic.net", port => 43, maxjobs => 20;
325
326$whoislock = new Coro::SemaphoreSet;
222 327
223sub ip_request { 328sub ip_request {
224 my $ip = $_[0]; 329 my $ip = $_[0];
330
331 my $guard = $whoislock->guard($ip);
225 332
226 my $c = $iprange->db_cursor; 333 my $c = $iprange->db_cursor;
227 my $v; 334 my $v;
228 335
229 if (!$c->c_get((inet_aton $ip), $v, DB_SET_RANGE)) { 336 if (!$c->c_get((inet_aton $ip), $v, DB_SET_RANGE)) {
230 my ($ip0, $ip1, $whois) = split /\x0/, $v; 337 my ($ip0, $ip1, $whois) = split /\x0/, $v;
231 my $_ip = ip2int $ip; 338 my $_ip = ip2int $ip;
232 print "looked for $_ip, found $ip0, $ip1 ", length($v),"\n";
233 if ($ip0 <= $_ip && $_ip <= $ip1) { 339 if ($ip0 <= $_ip && $_ip <= $ip1) {
234 return $whois; 340 return $whois;
235 } 341 }
236 } 342 }
237 343
238 print "looked for $ip, ONLY found $v->[0], $v->[1]\n";
239
240 my ($arin, $ripe, $apnic); 344 my ($arin, $ripe, $apnic);
241 345
242 $whois = $WHOIS{APNIC}->ip_request($ip) 346 $whois = $WHOIS{RIPE}->ip_request($ip)
243 || $WHOIS{RIPE} ->ip_request($ip) 347 || $WHOIS{APNIC} ->ip_request($ip)
244 || $WHOIS{ARIN} ->ip_request($ip); 348 || $WHOIS{ARIN} ->ip_request($ip)
349# || $WHOIS{LACNIC}->ip_request($ip)
350 ;
245 351
246 $whois =~ /^\*in: ([0-9.]+)\s+-\s+([0-9.]+)\s*$/mi 352 $whois =~ /^\*in: ([0-9.]+)\s+-\s+([0-9.]+)\s*$/mi
247 or do { warn "$whois($ip): no addresses found\n", last }; 353 or do { warn "$whois($ip): no addresses found\n", last };
248 354
249 my ($ip0, $ip1) = ($1, $2); 355 my ($ip0, $ip1) = ($1, $2);
256 $_ip = $_ip & 0xffffff00; 362 $_ip = $_ip & 0xffffff00;
257 $_ip0 = $_ip if $_ip0 < $_ip; 363 $_ip0 = $_ip if $_ip0 < $_ip;
258 $_ip1 = $_ip + 255 if $_ip1 > $_ip + 255; 364 $_ip1 = $_ip + 255 if $_ip1 > $_ip + 255;
259 } 365 }
260 366
261 print "setting entry ($_ip0, $_ip, $_ip1)\n";
262 $iprange->db_put((pack "N", $_ip1), (join "\x0", $_ip0, $_ip1, $whois)); 367 $iprange->db_put((pack "N", $_ip1), (join "\x0", $_ip0, $_ip1, $whois));
263 (tied %whois)->db_sync; 368 (tied %whois)->db_sync;
264 $iprange->db_sync; 369 $iprange->db_sync;
265 370
266 $whois; 371 $whois;
267} 372}
268 373
374if (0) {
375 #print ip_request "68.52.164.8"; # goof
376 #print "\n\n";
377 #print ip_request "200.202.220.222"; # lacnic
378 #print "\n\n";
379 #print ip_request "62.116.167.250";
380 #print "\n\n";
381 #print ip_request "133.11.128.254"; # jp
382 #print "\n\n";
383 print ip_request "80.131.153.93";
384 print "\n\n";
385}
269 386
3871;
270 388
389

Diff Legend

Removed lines
+ Added lines
< Changed lines
> Changed lines