NAME
Simple::IPInfo - Get IP/IPList Info (location, as number, etc)
给定IP列表,查对应的区域信息,或AS号
SYNOPSIS
use Simple::IPInfo;
use Data::Dumper;
use utf8;
my $rr_loc = get_ip_loc([ [ '202.38.64.10'], ['202.96.196.33'] ]);
my $inet_rr_loc = get_ip_loc([ ['3395339297'], ['3391504394'] ]);
print Dumper($rr_loc, $inet_rr_loc);
my $rr_asn = get_ip_as([ [ '202.38.64.10'], ['202.96.196.33'] ], reserve_inet=>1);
print Dumper($rr_asn);
my $arr = [ [qw/202.38.64.10 xxx/], [qw/8.8.8.8 yyy/], ];
my $r = get_ipinfo(
$arr,
i => 0,
write_file => '02.ip_loc.csv',
sep => ',',
charset => 'utf8',
return_arrayref => 1,
ipinfo_names => [qw/country area isp country_code area_code isp_code/],
write_head => [qw/ip some country area isp country_code area_code isp_code/ ],
);
print Dumper($r);
DESCRIPTION
default ip as data: ftp://routeviews.org/dnszones/originas.bz2
default ip location data: http://ip.taobao.com
use iso 3166 country_code, subdivision_1 code, isp shortcut name
METHOD
get_ip_loc
get ip location, with country, area, isp, country_code, area_code, isp_code
返回IP区域信息,包括国家、省份、运营商,及其英文iso3166编号
get_ip_as
get ip as number
返回IP的AS号
get_ipinfo
get ip info, with specified ipinfo_file
iterate_ipinfo
add ipinfo to inet-sorted arrayref, for large file
Note that, lines are inet-sorted
use Simple::IPInfo;
use Data::Dumper;
my $arr = [ [qw/8.8.8.8 yyy/], [qw/202.38.64.10 xxx/], ];
my $r = iterate_ipinfo(
$arr, # or some big inet-sorted file : $big_inet_sorted_csv,
i => 0,
write_file => '02.ip_loc.csv',
sep => ',',
charset => 'utf8',
return_arrayref => 1,
ipinfo_names => [qw/country area isp country_code area_code isp_code/],
write_head => [qw/ip some country area isp country_code area_code isp_code/ ],
);
print Dumper($r);
my $inet_arr = [['3391504394' , 'ceshi'], [ '3395339297', 'test'], ];
my $r = iterate_ipinfo(
$inet_arr,
i=>0,
write_file => '02.inet_loc.csv',
sep => ',',
charset => 'utf8',
return_arrayref => 1,
ipinfo_names => [qw/country area isp country_code area_code isp_code/],
write_head => [qw/inet some country area isp country_code area_code isp_code/ ],
);
print Dumper($r);
ATTR
DEBUG
set $Simple::IPInfo::DEBUG = 1 for more details
BIN
csv is in xt/ directory
add_inet.pl
$ add_inet.pl -f 02.ip_raw.csv -i 0 -d 02.ip_inet.csv
$ sort -t, -k3 -n 02.ip_inet.csv > 02.ip_inet.sort.csv
add_ip_info.pl
$ add_ip_info.pl -f 02.ip_inet.sort.csv -d 02.add_ip_info.csv -i 0 -t loc
-f : source file 源文件, inet-sorted
-d : dest file 目标文件
-i : ip is in cloumn x, ip在第x列
-H : skip head or not,default is 0 (not skip) 默认不跳过首行
-t : loc or as, default is loc;添加信息类型,默认是加loc信息,也可指定为as
-s : sep character, default is ',' 默认分隔符为逗号
make_inet_from_cidr.pl
make_inet_from_cidr.pl [src_file] [dst_file]
$ pip install csvkit
$ cd xt/data/
$ csvcut -c network,isp,autonomous_system_number isp_cidr.csv > isp_cidr.csv.cut
$ make_inet_from_cidr.pl isp_cidr.csv.cut isp_inet.csv
$ csvcut -c network,geoname_id city_blocks_ipv4.csv > city_blocks_ipv4.csv.cut
$ csvcut -c geoname_id,country_iso_code,subdivision_1_iso_code,country_name,subdivision_1_name city_locations_zh-CN.csv > city_locations_zh-CN.csv.cut
$ csvjoin -c geoname_id city_blocks_ipv4.csv.cut city_locations_zh-CN.csv.cut |csvcut -C geoname_id > city_cidr.csv
$ make_inet_from_cidr.pl city_cidr.csv city_inet.csv
refine_inet.pl
refine_inet.pl [src_file] [dst_file]
src_file's inet is sorted by csvsort
$ csvsort isp_inet.csv > isp_inet.csv.sort
$ refine_inet.pl isp_inet.csv.sort isp_inet.csv.sort.refine
$ csvsort city_inet.csv > city_inet.csv.sort
$ refine_inet.pl city_inet.csv.sort city_inet.csv.sort.refine
merge_inet.pl
merge_inet.pl [src_inet_file1] [src_inet_file2] [dst_merge_file]
$ merge_inet.pl city_inet.csv.sort.refine isp_inet.csv.sort.refine merge_city_isp_inet.csv
XBIN
install: curl bunzip2 tar
get ip as data from routeviews.org
$ perl gen_inet_as.pl inet_as.csv
get ip loc from taobao
1) init data dir, and send ip query to taobao
ask_ip_loc_init.pl
ask_ip_loc.pl
2) merge data/*.csv to ip_loc_taobao.csv , tidy it, update old ip_loc.csv
$ perl ip_loc_taobao.pl
$ perl ip_loc_tidy.pl ip_loc_taobao.csv ip_loc_taobao.tidy.csv
$ perl ip_loc_update.pl ip_loc.csv ip_loc_taobao.tidy.csv ip_loc_update.csv
3) guess loc from as, update , write new ip_loc.csv
$ perl ip_loc_from_as.pl ip_loc_update.csv ip_loc_from_as.csv
$ perl ip_loc_update.pl ip_loc_update.csv ip_loc_from_as.csv ip_loc.csv
4) map into inet file, and refine inet_loc_src.csv
$ make_inet_from_cidr.pl ip_loc.csv inet_loc_raw.csv 'ip,country,area,isp'
$ refine_inet.pl inet_loc_raw.csv inet_loc_src.csv
5) add iso_3166 code for inet_loc_src.csv, use merge_file.pl from SimpleR::Reshape
inet_loc_src.csv : s, e , country, area, isp
inet_loc.csv : s, e , country, area, isp , country_code, area_code, isp_code
$ merge_file.pl -f country.csv -k 1 -v 0 -F inet_loc_src.csv -K 2 -o inet_loc.csv.c
$ merge_file.pl -f country_area.csv -k 0,3 -v 1 -F inet_loc.csv.c -K 5,3 -o inet_loc.csv.p
$ merge_file.pl -f country_isp.csv -k 0,3 -v 1 -F inet_loc.csv.p -K 5,4 -o inet_loc.csv
AUTHOR
Abby Pan <abbypan@gmail.com>
Thanks to Gabor Szabo <szabgab@gmail.com>, Neil Bowers <neil@bowers.com>