访问量分类统计(QQ,微信,微博,网页,网站APP,其他)
刚准备敲键盘,突然想起今天已经星期五了,有点小兴奋,一周又这么愉快的结束,又可以休息了,等等。。我好像是来写Java博客的,怎么变成了写日记,好吧,言归正传。
不知道大家有没有遇到过这样的需求:统计一遍文章的浏览量并且分析出详情,即QQ,微信,微博,网页,网站APP,其他的访问比率,我们公司前一段时间遇到了这样的需求,那么我接下来讲解一下它的具体实现。
首先需要统计一篇文章的访问量,这里的访问量是精确访问量(登陆的用户多次访问,记多次算一人,游客根据ip统计,同一ip算一人),下面是获取ip的代码实现:
public static String getIpAddr(Request request) { /* String ip = request.getHeader( " x-forwarded-for " ); if (ip == null || ip.length() == 0 || " unknown " .equalsIgnoreCase(ip)) { ip = request.getHeader( " Proxy-Client-IP " ); } if (ip == null || ip.length() == 0 || " unknown " .equalsIgnoreCase(ip)) { ip = request.getHeader( " WL-Proxy-Client-IP " ); } if (ip == null || ip.length() == 0 || " unknown " .equalsIgnoreCase(ip)) { ip = request.getRemoteAddr(); } if(ip.contains(",")){ ip = ip.substring(0, ip.indexOf(",")); } return ip; */ String ipAddress = null; //ipAddress = this.getRequest().getRemoteAddr(); ipAddress = request.getHeader("x-forwarded-for"); if (ipAddress == null || ipAddress.length() == 0 || "unknown".equalsIgnoreCase(ipAddress)) { ipAddress = request.getHeader("Proxy-Client-IP"); } if (ipAddress == null || ipAddress.length() == 0 || "unknown".equalsIgnoreCase(ipAddress)) { ipAddress = request.getHeader("WL-Proxy-Client-IP"); } if (ipAddress == null || ipAddress.length() == 0 || "unknown".equalsIgnoreCase(ipAddress)) { ipAddress = request.remoteAddress(); if (ipAddress.equals("127.0.0.1")) { //根据网卡取本机配置的IP InetAddress inet = null; try { inet = InetAddress.getLocalHost(); } catch (Exception e) { e.printStackTrace(); } ipAddress = inet.getHostAddress(); } } //对于通过多个代理的情况,第一个IP为客户端真实IP,多个IP按照','分割 if (ipAddress != null && ipAddress.length() > 15) { //"***.***.***.***".length() = 15 if (ipAddress.indexOf(",") > 0) { ipAddress = ipAddress.substring(0, ipAddress.indexOf(",")); } } return ipAddress; }
第二步,是在保存每条访问记录时进行访问来源的插入,比如是qq还是微信等等,如下是获取它的访问来源的具体代码实现:
/** * 获取浏览端的类型,0-网页,1;//微博 2;//qq 5;//微信 6;//APP 7;//其他 *@author LongJin * @return */ public static int getFromPc(String client) { Http.Context context = ctx(); Http.Request request = context.request(); String head = request.getHeader("user-agent").toLowerCase(); play.Logger.info("head = " + request.getHeader("user-agent")); int from = 0;//pc端 boolean isPc = HttpRequestDeviceUtils.isPcDevice(request);//判断是否来源于pc端 if (!isPc) { if (head.contains("weibo")) { from = 1;//微博 } else if (getQq(head)) {//qq单独写了个判断方法 from = 2;//qq } else if (head.contains("micromessenger")) { from = 5;//微信 } else if (StringUtils.isNotBlank(client)) { from = 6;//APP } else { from = 7;//其他 } } return from; }
判断是否是来源于QQ:
/** * 获取QQ * * @param str * @return */ public static boolean getQqCount(String str) { Pattern p = Pattern.compile("\\bqq\\b", Pattern.CASE_INSENSITIVE); Matcher m = p.matcher(str); boolean isQq= false; while (m.find()) { isQq = true; } return isQq; }
其中的HttpRequestDeviceUtils.isPcDevice(request)判断是否来源pc端实现如下:
/**Wap网关Via头信息中特有的描述信息*/ private static String mobileGateWayHeaders[]=new String[]{ "ZXWAP",//中兴提供的wap网关的via信息,例如:Via=ZXWAP GateWayZTE Technologies, "chinamobile.com",//中国移动的诺基亚wap网关,例如:Via=WTP/1.1 GDSZ-PB-GW003-WAP07.gd.chinamobile.com (Nokia WAP Gateway 4.1 CD1/ECD13_D/4.1.04) "monternet.com",//移动梦网的网关,例如:Via=WTP/1.1 BJBJ-PS-WAP1-GW08.bj1.monternet.com. (Nokia WAP Gateway 4.1 CD1/ECD13_E/4.1.05) "infoX",//华为提供的wap网关,例如:Via=HTTP/1.1 GDGZ-PS-GW011-WAP2 (infoX-WISG Huawei Technologies),或Via=infoX WAP Gateway V300R001 Huawei Technologies "XMS 724Solutions HTG",//国外电信运营商的wap网关,不知道是哪一家 "wap.lizongbo.com",//自己测试时模拟的头信息 "Bytemobile",//貌似是一个给移动互联网提供解决方案提高网络运行效率的,例如:Via=1.1 Bytemobile OSN WebProxy/5.1 }; /**电脑上的IE或Firefox浏览器等的User-Agent关键词*/ private static String[] pcHeaders=new String[]{ "Windows 98", "Windows ME", "Windows 2000", "Windows XP", "Windows NT", "Ubuntu", "Macintosh", "Linux" }; /**手机浏览器的User-Agent里的关键词*/ private static String[] mobileUserAgents=new String[]{ "Nokia",//诺基亚,有山寨机也写这个的,总还算是手机,Mozilla/5.0 (Nokia5800 XpressMusic)UC AppleWebkit(like Gecko) Safari/530 "SAMSUNG",//三星手机 SAMSUNG-GT-B7722/1.0+SHP/VPP/R5+Dolfin/1.5+Nextreaming+SMM-MMS/1.2.0+profile/MIDP-2.1+configuration/CLDC-1.1 "MIDP-2",//j2me2.0,Mozilla/5.0 (SymbianOS/9.3; U; Series60/3.2 NokiaE75-1 /110.48.125 Profile/MIDP-2.1 Configuration/CLDC-1.1 ) AppleWebKit/413 (KHTML like Gecko) Safari/413 "CLDC1.1",//M600/MIDP2.0/CLDC1.1/Screen-240X320 "SymbianOS",//塞班系统的, "MAUI",//MTK山寨机默认ua "UNTRUSTED/1.0",//疑似山寨机的ua,基本可以确定还是手机 "Windows CE",//Windows CE,Mozilla/4.0 (compatible; MSIE 6.0; Windows CE; IEMobile 7.11) "iPhone",//iPhone是否也转wap?不管它,先区分出来再说。Mozilla/5.0 (iPhone; U; CPU iPhone OS 4_1 like Mac OS X; zh-cn) AppleWebKit/532.9 (KHTML like Gecko) Mobile/8B117 "iPad",//iPad的ua,Mozilla/5.0 (iPad; U; CPU OS 3_2 like Mac OS X; zh-cn) AppleWebKit/531.21.10 (KHTML like Gecko) Version/4.0.4 Mobile/7B367 Safari/531.21.10 "Android",//Android是否也转wap?Mozilla/5.0 (Linux; U; Android 2.1-update1; zh-cn; XT800 Build/TITA_M2_16.22.7) AppleWebKit/530.17 (KHTML like Gecko) Version/4.0 Mobile Safari/530.17 "BlackBerry",//BlackBerry8310/2.7.0.106-4.5.0.182 "UCWEB",//ucweb是否只给wap页面? Nokia5800 XpressMusic/UCWEB7.5.0.66/50/999 "ucweb",//小写的ucweb貌似是uc的代理服务器Mozilla/6.0 (compatible; MSIE 6.0;) Opera ucweb-squid "BREW",//很奇怪的ua,例如:REW-Applet/0x20068888 (BREW/3.1.5.20; DeviceId: 40105; Lang: zhcn) ucweb-squid "J2ME",//很奇怪的ua,只有J2ME四个字母 "YULONG",//宇龙手机,YULONG-CoolpadN68/10.14 IPANEL/2.0 CTC/1.0 "YuLong",//还是宇龙 "COOLPAD",//宇龙酷派YL-COOLPADS100/08.10.S100 POLARIS/2.9 CTC/1.0 "TIANYU",//天语手机TIANYU-KTOUCH/V209/MIDP2.0/CLDC1.1/Screen-240X320 "TY-",//天语,TY-F6229/701116_6215_V0230 JUPITOR/2.2 CTC/1.0 "K-Touch",//还是天语K-Touch_N2200_CMCC/TBG110022_1223_V0801 MTK/6223 Release/30.07.2008 Browser/WAP2.0 "Haier",//海尔手机,Haier-HG-M217_CMCC/3.0 Release/12.1.2007 Browser/WAP2.0 "DOPOD",//多普达手机 "Lenovo",// 联想手机,Lenovo-P650WG/S100 LMP/LML Release/2010.02.22 Profile/MIDP2.0 Configuration/CLDC1.1 "LENOVO",// 联想手机,比如:LENOVO-P780/176A "HUAQIN",//华勤手机 "AIGO-",//爱国者居然也出过手机,AIGO-800C/2.04 TMSS-BROWSER/1.0.0 CTC/1.0 "CTC/1.0",//含义不明 "CTC/2.0",//含义不明 "CMCC",//移动定制手机,K-Touch_N2200_CMCC/TBG110022_1223_V0801 MTK/6223 Release/30.07.2008 Browser/WAP2.0 "DAXIAN",//大显手机DAXIAN X180 UP.Browser/6.2.3.2(GUI) MMP/2.0 "MOT-",//摩托罗拉,MOT-MOTOROKRE6/1.0 LinuxOS/2.4.20 Release/8.4.2006 Browser/Opera8.00 Profile/MIDP2.0 Configuration/CLDC1.1 Software/R533_G_11.10.54R "SonyEricsson",// 索爱手机,SonyEricssonP990i/R100 Mozilla/4.0 (compatible; MSIE 6.0; Symbian OS; 405) Opera 8.65 [zh-CN] "GIONEE",//金立手机 "HTC",//HTC手机 "ZTE",//中兴手机,ZTE-A211/P109A2V1.0.0/WAP2.0 Profile "HUAWEI",//华为手机, "webOS",//palm手机,Mozilla/5.0 (webOS/1.4.5; U; zh-CN) AppleWebKit/532.2 (KHTML like Gecko) Version/1.0 Safari/532.2 Pre/1.0 "GoBrowser",//3g GoBrowser.User-Agent=Nokia5230/GoBrowser/2.0.290 Safari "IEMobile",//Windows CE手机自带浏览器, "WAP2.0"//支持wap 2.0的 }; /** * 判断是否为pc端 * @param request * @return */ public static boolean isPcDevice(Request request){ boolean b = false; boolean pcFlag = false; boolean mobileFlag = false; String via = request.getHeader("Via"); String userAgent = request.getHeader("user-agent"); //String xMsisdn = request.getHeader("X-MSISDN"); /* Map<String, String[]> headers = request.headers(); play.Logger.info("xM = "+headers);*/ for (int i = 0; userAgent!=null && !userAgent.trim().equals("") && i < pcHeaders.length; i++) { if(userAgent.contains(pcHeaders[i])){ pcFlag = true; break; } } for (int i = 0; via!=null && !via.trim().equals("") && i < mobileGateWayHeaders.length; i++) { if(via.contains(mobileGateWayHeaders[i])){ mobileFlag = true; break; } } for (int i = 0;!mobileFlag && userAgent!=null && !userAgent.trim().equals("") && i < mobileUserAgents.length; i++) { if(userAgent.contains(mobileUserAgents[i])){ mobileFlag = true; break; } } if(mobileFlag==false && pcFlag==true){ b=true; } return b; }
至此,访问量的分类就基本算是完成了,可以结合访问量的统计实现原创文章排行榜功能并且统计详情做成饼状图,写着写着突然断电了,可能是要放假了,激动了。
ps:这里只是讲解一些核心部分,至于具体详细实现没做讲解。在我实现的整个过程中,存在一个统计量精度问题,即统一局域网下外网一样,这样导致了在统计访问量时存在同一局域网下访问只算一人,望大神指点。