纯真IP地址数据库qqwry.dat解析
IP地址數據庫在現今的互聯網時代非常有用。比如大型網站的用戶安全保護系統,常常會根據IP反查得到的信息,甄別賬號的一些不安全登錄行為,比如跨區域登錄等。IP其實關聯了一些有用的信息,比如所在區域、所屬運營商;一些收錄較全的數據庫甚至包括具體經緯度,像百度的IP定位API就比較全。下面來介紹一下“純真IP地址數據庫qqwry”的格式以及解析方法。
以下是“ 純真IP地址數據庫qqwry”官網對其的介紹。
純真版IP地址數據庫是當前網絡上最權威、地址最精確、IP記錄以及網吧數據最多的IP地址數據庫。收集了包括中國電信、中國移動、中國聯通、鐵通、長城寬帶等各 ISP 的最新準確 IP 地址數據。通過大家的共同努力打造一個沒有未知數據,沒有錯誤數據的QQ IP。IP數據庫每5天更新一次,請大家定期更新最新的IP數據庫!
格式
+----------+
| 文件頭 | (8字節)
+----------+
| 記錄區 | (不定長)
+----------+
| 索引區 | (大小由文件頭決定)
+----------+
使用java語言解析的兩種思路:
-
使用內存映射文件方式讀取,使用java的MappedByteBuffer 將原數據文件映射到MappedByteBuffer對象中,然后通過MappedByteBuffer 提供的字節讀取方式實現ip的查找。搜索是在索引區使用二分法
-
使用byte數組讀取,即將二進制的數據庫信息全部按順序讀入到一個數組中。由于數據是有格式的,我們便可根據文件頭計算出索引區和記錄區在數組中的位置。當查詢ip時,先在數組中的索引區通過二分查找方式找到該IP地址對應的國家和區域記錄的位置,然后從數組中取出地區信息。
熱升級思路:
使用一個可調度的單線程線程池,線程定時檢測qqwry.dat文件是否被修改,若已修改則將數據重新載入。載入過程可使用可重入鎖ReentrantLock來鎖住資源,避免在更新的過程中出現臟查詢。
兩種解析方式的實現源碼如下:
方式一(MappedByteBuffer ):
方式二(數組方式):
package com.difeng.qqwry2;

import java.io.ByteArrayOutputStream;
import java.io.File;
import java.io.FileInputStream;
import java.io.IOException;
import java.io.UnsupportedEncodingException;
import java.util.concurrent.Executors;
import java.util.concurrent.ThreadFactory;
import java.util.concurrent.TimeUnit;
import java.util.concurrent.locks.ReentrantLock;

/**
 * IP location lookup that reads the whole qqwry.dat file into a byte array.
 *
 * <p>The file starts with an 8-byte header holding the little-endian offsets of the first and
 * the last index record. Each index record is {@link #IP_RECORD_LENGTH} bytes: a 4-byte start IP
 * followed by a 3-byte offset of the matching record. Lookups binary-search the index area and
 * then decode the country/area strings (GBK encoded, zero terminated) from the record area.
 *
 * <p>When {@link #enableFileWatch} is true at construction time, a background task polls the
 * file's modification time and reloads the data when it changes. Lookups and the swap of the
 * reloaded data are serialized with a per-instance lock.
 *
 * @author difeng
 */
public class IPLocation {

    private static final byte REDIRECT_MODE_1 = 0x01;
    private static final byte REDIRECT_MODE_2 = 0x02;

    /** Size in bytes of one index record: 4-byte start IP + 3-byte record offset. */
    static final long IP_RECORD_LENGTH = 7;

    /** Size in bytes of the file header (two 4-byte index offsets). */
    private static final int HEADER_LENGTH = 8;

    /** Set to true before constructing an instance to enable automatic reloading. */
    public static boolean enableFileWatch = false;

    // Per-instance: the lock guards this instance's data/offset fields only.
    private final ReentrantLock lock = new ReentrantLock();
    private final File qqwryFile;

    // Written by both the constructing thread and the watcher thread.
    private volatile long lastModifyTime = 0L;

    private byte[] data;
    private long firstIndexOffset;
    private long lastIndexOffset;
    private long totalIndexCount;

    /**
     * Loads the database file and, if {@link #enableFileWatch} is set, starts watching it.
     *
     * @param filePath path of the qqwry.dat file
     * @throws Exception if the file cannot be read or its header is inconsistent
     */
    public IPLocation(String filePath) throws Exception {
        this.qqwryFile = new File(filePath);
        load();
        if (enableFileWatch) {
            watch();
        }
    }

    /**
     * Schedules a task (first run after 1s, then every 5s) that reloads the file whenever its
     * modification time is newer than the last one seen.
     */
    private void watch() {
        // Daemon thread: the watcher is never shut down, so it must not keep the JVM alive.
        final ThreadFactory daemonFactory = new ThreadFactory() {
            @Override
            public Thread newThread(Runnable r) {
                final Thread t = new Thread(r, "qqwry-file-watcher");
                t.setDaemon(true);
                return t;
            }
        };
        Executors.newScheduledThreadPool(1, daemonFactory).scheduleAtFixedRate(new Runnable() {
            @Override
            public void run() {
                long time = qqwryFile.lastModified();
                if (time > lastModifyTime) {
                    lastModifyTime = time;
                    try {
                        load();
                        System.out.println("reload");
                    } catch (Exception e) {
                        // Keep serving the previously loaded data; an escaping exception
                        // would cancel all future runs of this scheduled task.
                        e.printStackTrace();
                    }
                }
            }
        }, 1000L, 5000L, TimeUnit.MILLISECONDS);
    }

    /**
     * Reads the file into memory, validates the header and publishes the new data.
     *
     * <p>The file is read and validated before the lock is taken, so lookups are blocked only
     * for the field swap and a failed load leaves the previous data untouched.
     *
     * @throws Exception if the file cannot be read or its header is inconsistent
     */
    private void load() throws Exception {
        lastModifyTime = qqwryFile.lastModified();

        final byte[] fresh = readFully(qqwryFile);
        if (fresh.length < HEADER_LENGTH) {
            throw new IOException("qqwry file too short: " + fresh.length + " bytes");
        }
        final long first = readLittleEndian(fresh, 0, 4);
        final long last = readLittleEndian(fresh, 4, 4);
        if (first < HEADER_LENGTH || last < first || last + IP_RECORD_LENGTH > fresh.length) {
            throw new IOException("corrupt qqwry header: firstIndex=" + first
                    + ", lastIndex=" + last + ", fileLength=" + fresh.length);
        }

        lock.lock();
        try {
            data = fresh;
            firstIndexOffset = first;
            lastIndexOffset = last;
            totalIndexCount = (last - first) / IP_RECORD_LENGTH + 1;
        } finally {
            lock.unlock();
        }
    }

    /** Reads the complete content of {@code file} into a new byte array. */
    private static byte[] readFully(File file) throws IOException {
        final FileInputStream in = new FileInputStream(file);
        try {
            final ByteArrayOutputStream out = new ByteArrayOutputStream();
            final byte[] chunk = new byte[8192];
            int n;
            while ((n = in.read(chunk)) != -1) {
                // Only the first n bytes of the chunk are valid for this read.
                out.write(chunk, 0, n);
            }
            return out.toByteArray();
        } finally {
            try {
                in.close();
            } catch (IOException ignored) {
                // Nothing useful to do; a read failure (if any) is already propagating.
            }
        }
    }

    /** Decodes {@code count} bytes starting at {@code offset} as an unsigned little-endian value. */
    private static long readLittleEndian(byte[] buf, int offset, int count) {
        long val = 0;
        for (int i = 0; i < count; i++) {
            val |= (buf[offset + i] & 0xFFL) << (8 * i);
        }
        return val;
    }

    /** Reads an unsigned 4-byte little-endian value from the loaded data. */
    private long read4ByteAsLong(final int offset) {
        return readLittleEndian(data, offset, 4);
    }

    /** Reads an unsigned 3-byte little-endian value from the loaded data. */
    private long read3ByteAsLong(final int offset) {
        return readLittleEndian(data, offset, 3);
    }

    /**
     * Binary-searches the index area for the last index record whose start IP is
     * less than or equal to {@code ip}.
     *
     * @param ip IPv4 address as an unsigned 32-bit value
     * @return the record offset stored in the matching index record, or -1 if no index
     *         record starts at or below {@code ip}
     */
    private long search(long ip) {
        long low = 0;
        long high = totalIndexCount - 1;
        long found = -1;
        while (low <= high) {
            final long mid = (low + high) >>> 1;
            final long startIp = read4ByteAsLong((int) (firstIndexOffset + mid * IP_RECORD_LENGTH));
            if (startIp <= ip) {
                found = mid;      // candidate; a later record may still start <= ip
                low = mid + 1;
            } else {
                high = mid - 1;
            }
        }
        if (found < 0) {
            return -1;
        }
        return read3ByteAsLong((int) (firstIndexOffset + found * IP_RECORD_LENGTH + 4));
    }

    /**
     * Looks up the location of a dotted-decimal IPv4 address.
     *
     * @param ip address such as {@code "182.92.240.50"}
     * @return the decoded location, or {@code null} if no record matches or the record
     *         cannot be decoded
     * @throws NullPointerException if {@code ip} is null
     * @throws IllegalArgumentException if {@code ip} is not a valid dotted-decimal IPv4 address
     */
    public Location fetchIPLocation(String ip) {
        final long numericIp = inet_pton(ip);
        lock.lock();
        try {
            // search() runs inside the try so the lock is released even if it throws.
            final long offset = search(numericIp);
            if (offset != -1) {
                return readIPLocation((int) offset);
            }
            return null;
        } finally {
            lock.unlock();
        }
    }

    /**
     * Decodes the country and area of the record at {@code offset}.
     *
     * <p>The first 4 bytes of a record are skipped; the byte after them is either a redirect
     * mode flag or the first byte of the country string.
     *
     * @return the location, or {@code null} if decoding runs outside the loaded data
     */
    private Location readIPLocation(final int offset) {
        final Location loc = new Location();
        try {
            byte redirectMode = data[offset + 4];
            if (redirectMode == REDIRECT_MODE_1) {
                // Mode 1: both country and area live at the redirected offset.
                long countryOffset = read3ByteAsLong(offset + 5);
                redirectMode = data[(int) countryOffset];
                if (redirectMode == REDIRECT_MODE_2) {
                    // Country is redirected once more; area follows the 4-byte redirect.
                    final QQwryString country = readString((int) read3ByteAsLong((int) countryOffset + 1));
                    loc.country = country.string;
                    countryOffset = countryOffset + 4;
                } else {
                    final QQwryString country = readString((int) countryOffset);
                    loc.country = country.string;
                    countryOffset += country.byteCountWithEnd;
                }
                loc.area = readArea((int) countryOffset);
            } else if (redirectMode == REDIRECT_MODE_2) {
                // Mode 2: only the country is redirected; area follows the 4-byte redirect.
                loc.country = readString((int) read3ByteAsLong(offset + 5)).string;
                loc.area = readArea(offset + 8);
            } else {
                // No redirect: country string is stored inline, area right after it.
                final QQwryString country = readString(offset + 4);
                loc.country = country.string;
                loc.area = readArea(offset + 4 + country.byteCountWithEnd);
            }
            return loc;
        } catch (RuntimeException e) {
            // Best effort: a malformed record yields "not found" instead of failing the lookup.
            return null;
        }
    }

    /**
     * Decodes the area string at {@code offset}, following a redirect if one is present.
     *
     * @return the area string, or an empty string when the redirect offset is 0
     */
    private String readArea(final int offset) {
        final byte redirectMode = data[offset];
        if (redirectMode == REDIRECT_MODE_1 || redirectMode == REDIRECT_MODE_2) {
            final long areaOffset = read3ByteAsLong(offset + 1);
            if (areaOffset == 0) {
                return "";
            }
            return readString((int) areaOffset).string;
        }
        return readString(offset).string;
    }

    /**
     * Reads the zero-terminated GBK string starting at {@code offset}.
     *
     * @return the decoded string together with its encoded length including the terminator
     * @throws IndexOutOfBoundsException if no terminator is found before the end of the data
     */
    private QQwryString readString(int offset) {
        int end = offset;
        while (end < data.length && data[end] != 0) {
            end++;
        }
        if (end >= data.length) {
            throw new IndexOutOfBoundsException("unterminated string at offset " + offset);
        }
        final int length = end - offset;
        try {
            return new QQwryString(new String(data, offset, length, "GBK"), length + 1);
        } catch (UnsupportedEncodingException e) {
            return new QQwryString("", 0);
        }
    }

    /**
     * Converts a dotted-decimal IPv4 string to its unsigned 32-bit numeric value.
     *
     * @param ipStr address such as {@code "1.2.3.4"}
     * @return the address as a long in the range 0..0xFFFFFFFF
     * @throws NullPointerException if {@code ipStr} is null
     * @throws IllegalArgumentException if {@code ipStr} does not consist of exactly four
     *         decimal octets in the range 0..255
     */
    private static long inet_pton(String ipStr) {
        if (ipStr == null) {
            throw new NullPointerException("ip不能為空");
        }
        // Limit -1 keeps trailing empty parts so "1.2.3.4." is rejected.
        final String[] parts = ipStr.split("\\.", -1);
        if (parts.length != 4) {
            throw new IllegalArgumentException("invalid IPv4 address: " + ipStr);
        }
        long ip = 0;
        for (int i = 0; i < parts.length; i++) {
            final long octet = Long.parseLong(parts[i]);
            if (octet < 0 || octet > 255) {
                throw new IllegalArgumentException("invalid IPv4 address: " + ipStr);
            }
            ip = (ip << 8) | octet;
        }
        return ip;
    }

    /** A decoded string plus the number of bytes it occupied in the file, terminator included. */
    private static final class QQwryString {
        public final String string;
        public final int byteCountWithEnd;

        public QQwryString(final String string, final int byteCountWithEnd) {
            this.string = string;
            this.byteCountWithEnd = byteCountWithEnd;
        }

        @Override
        public String toString() {
            return string;
        }
    }
}
以上為主要代碼,獲取全部代碼請點擊全部代碼
使用
// Load the database once, then look up an address; fetchIPLocation returns null when nothing matches.
final IPLocation ipLocation = new IPLocation(filePath);
Location loc = ipLocation.fetchIPLocation("182.92.240.50");
if (loc != null) {
    System.out.printf("%s %s", loc.country, loc.area);
}
格式改進
由于原格式中讀取地區記錄時采用重定向,有些繁瑣。去掉之后格式更簡單,國家和地區單獨存放,索引里分別記錄的國家和地區的地址。
新格式如下:
+----------+
| 文件頭 | (8字節)
+----------+
| 記錄區 | (不定長)
+----------+
| 索引區 | (大小由文件頭決定)
+----------+
文件頭:
+------------------------------+-----------------------------+
| first index position(4 bytes)|last index position(4 bytes) |
+------------------------------+-----------------------------+
記錄區:
+------------------+----------+------------------+----------+-----
| country1(n bytes)|\0(1 byte)| country2(n bytes)|\0(1 byte)|...
+------------------+----------+------------------+----------+-----
+------------------+----------+------------------+----------+-----
| area1(n bytes) |\0(1 byte)| area2(n bytes) |\0(1 byte)|...
+------------------+----------+------------------+----------+-----
索引區:
+------------+-------------------------+------------------------+
|ip1(4 bytes)|country position(3 bytes)| area position(3 bytes) |...
+------------+-------------------------+------------------------+
轉換方法:
相關鏈接:
qqwry下載: qqwry
全球ip地址庫(收費):IPLocation
原文來源:https://www.jianshu.com/p/01d3c19738c2
總結
以上是生活随笔為你收集整理的纯真IP地址数据库qqwry.dat解析的全部內容,希望文章能夠幫你解決所遇到的問題。
- 上一篇: 人脸识别有哪些利与弊
- 下一篇: AI监测分析课堂背后的旷视科技:清华学霸