package com.alimama.quanjingmonitor.mdrillImport.parse.for416tmp;
import java.util.Date;
import java.util.concurrent.LinkedBlockingDeque;
import org.apache.log4j.Logger;
import com.alimama.mdrillImport.InvalidEntryException;
public class aplus_text extends com.alimama.mdrillImport.DataParser {
private static final long serialVersionUID = 1L;
public volatile long groupCreateerror = 0;
private static Logger LOG = Logger.getLogger(aplus_text.class);
private volatile long lines = 0;
private volatile long lines_sb = 0;
private volatile long lines_sb2 = 0;
private static long TS_MAX = 3600l * 24 * 31;
private volatile long laststartts = System.currentTimeMillis() / 1000 - TS_MAX;
private volatile long lastendts = System.currentTimeMillis() / 1000 + TS_MAX;
private volatile long timediff = System.currentTimeMillis();
private volatile long timediff2 = System.currentTimeMillis();
public static String formatRows(String[] clicklog) {
StringBuilder b = new StringBuilder();
for (int i = 0; i < clicklog.length; i++) {
b.append(i);
b.append("=");
b.append(String.valueOf(clicklog[i]));
b.append(",");
}
return b.toString();
}
@Override
public DataIter parseLine(String line) throws InvalidEntryException {
try {
if (line == null) {
return null;
}
this.lines++;
if (this.lines > 100000) {
this.laststartts = (System.currentTimeMillis() / 1000) - TS_MAX;
this.lastendts = (System.currentTimeMillis() / 1000) + TS_MAX;
this.lines = 0;
}
String[] log = line.split("\001", -1);
if (log == null||log.length<46) {
return null;
}
long ts = Long.parseLong(log[2]);
this.lines_sb++;
if (this.lines_sb > 5000) {
this.lines_sb = 0;
long nowts = System.currentTimeMillis();
if (nowts - timediff > 30000) {
timediff = nowts;
LOG.info("parseLine_sb_"
+ ColsDefine.formatDayMin.format(new Date(ts * 1000)) + " "
+ formatRows(log));
}
}
if (ts < laststartts || ts > lastendts) {
return null;
}
//--宋智给的格式--
// 0 version string,
// 1 ip string,
// 2 time string,
// 3 url string,
// 4 user_agent string,
// 5 linezing_session string,
// 6 cna string,
// 7 adid string,
// 8 amid string,
// 9 cmid string,
// 10 pmid string,
// 11 uid string,
// 12 sid string,
// 13 pre string,
// 14 cache_ string,
// 15 scr string,
// 16 nick string,
// 17 at_autype string,
// 18 bbid string,
// 19 at_isb string,
// 20 at_mall_pro_re string,
// 21 at_mall_re string,
// 22 at_shoptype string,
// 23 b2c_auction string,
// 24 b2c_brand string,
// 25 b2c_orid string,
// 26 at_type string,
// 27 category string,
// 28 marketinfo string,
// 29 atp_isdpp string,
// 30 at_bucketid string,
// 31 at_insid string,
// 32 at_jporid string,
// 33 upi_bi string,
// 34 rpi_bi string,
// 35 wm_pageid string,
// 36 wm_prototypeid string,
// 37 wm_sid string,
// 38 spm_cnt string,
// 39 title string,
// 40 url_type string,
// 41 ref_type string,
// 42 ref_shopid string,
// 43 parse_ip string,
// 44 parse_time string,
// 45 logkey string,
// 46 gmkey string,
// 47 gokey string,
// 48 logtype string,
// 49 atp_sid string,
// 50 userid string,
// 51 isbeta string,
// 52 spm_url string,
// 53 spm_pre string
// String url_pre_lwfrom = ColsDefine.getName(log[13], "lwfrom");
// if ((url_lwfrom == null || url_lwfrom.isEmpty())) {
// return null;
// }
DataIterParse rtn = new DataIterParse(ts, log,line);
if (!rtn.isvalidate()) {
this.lines_sb2++;
if (this.lines_sb2 > 5000) {
this.lines_sb2 = 0;
long nowts = System.currentTimeMillis();
if (nowts - timediff2 > 30000) {
timediff2 = nowts;
LOG.info("parseLine_text_"
+ ColsDefine.formatDayMin.format(new Date(
ts * 1000)) + " " + " "+line);
}
}
return null;
}
return rtn;
} catch (Throwable nfe) {
if (groupCreateerror < 100) {
LOG.error("InvalidEntryException:" + line, nfe);
groupCreateerror++;
}
throw new InvalidEntryException("Invalid log `" + line + "'\n", nfe);
}
}
public static class DataIterParse implements DataIter {
private long ts;
java.util.concurrent.LinkedBlockingDeque<pid_type> querylist = new LinkedBlockingDeque<aplus_text.DataIterParse.pid_type>();
public static class pid_type {
public String pid = "";
public String tid = "";
public String matchUrl="";
public boolean isshaoma;
}
pid_type curr = null;
private String fetch(boolean isshaoma,String type,String lwfrom, String strday) {
if (lwfrom == null || lwfrom.isEmpty()) {
return null;
}
if(isshaoma||type.equals("pc"))
{
return FetchAdid2PidPC.fetch().get(strday+"@"+String.valueOf(lwfrom));
}
return FetchAdid2PidWireLess.fetch().get(strday+"@"+String.valueOf(lwfrom));
}
public String matchType(String url)
{
if(url.indexOf("http://m.laiwang.com/market/laiwang/event-square.php")>=0)
{
return "pc";
}
if(url.indexOf("http://h5.m.taobao.com/laiwang/act/419/index.html")>=0)
{
return "wireless_huodong";
}
if(url.indexOf("http://m.laiwang.com/go/laiwang/419/index.php")>=0)
{
return "wireless_huodong";
}
if(url.indexOf("http://www.laiwang.com/event/share.htm")>=0)
{
return "wireless_zhadui";
}
if(url.indexOf("http://www.laiwang.com/event/feed.htm")>=0)
{
return "wireless_zhadui";
}
return null;
}
public void parseSaoma(String url_lwfrom)
{
String[] url_lwfrom_split=String.valueOf(url_lwfrom).split("_");
boolean isshaoma=url_lwfrom_split.length>2&&!url_lwfrom_split[2].isEmpty();
if(isshaoma)
{
String strday = ColsDefine.formatDay.format(new Date(ts * 1000));
String shaomaPid=this.fetch(true,"pc",url_lwfrom_split[0], strday);
if(shaomaPid!=null)
{
pid_type p = new pid_type();
p.isshaoma=true;
p.pid = shaomaPid;
p.matchUrl="pc";
querylist.add(p);
}
}
}
public void setPV2(String url_lwfrom,String Url)
{
String isMathchUrl = matchType(Url);
if(isMathchUrl==null)
{
return ;
}
String tid="";
String pid=null;
if("pc".equals(isMathchUrl))
{
String strday = ColsDefine.formatDay.format(new Date(ts * 1000));
pid = this.fetch(false,"pc",String.valueOf(url_lwfrom), strday);
}else{
pid=ColsDefine.getName(Url, "refpid");
tid=ColsDefine.getName(Url, "tid");
}
if(pid != null){
pid_type p = new pid_type();
p.isshaoma=false;
p.pid = pid;
p.tid = tid;
p.matchUrl=isMathchUrl;
querylist.add(p);
}
}
public DataIterParse(long ts, String[] pvlog,String line) {
this.ts = ts;
String Url = ColsDefine.decodeString(pvlog[3]);
String url_lwfrom = ColsDefine.getName(Url, "lwfrom");
this.parseSaoma(url_lwfrom);
this.setPV2(url_lwfrom, Url);
this.curr = querylist.poll();
}
public boolean isvalidate() {
return this.curr != null;
}
@Override
public boolean next() {
this.curr = querylist.poll();
return isvalidate();
}
@Override
public Number[] getSum() {
if(this.curr.isshaoma)
{
return new Number[] {
0
, 0
,0
, 0
, 0
, 0
, 0
, 0
,1
};
}else{
int type1=(this.curr.matchUrl.equals("wireless_zhadui"))?1:0;
int type2=(!this.curr.matchUrl.equals("wireless_zhadui"))?1:0;
return new Number[] {
type1
, 0
,0
, 0
, 0
, 0
, type2
, 0
, 0
};
}
}
@Override
public long getTs() {
return (ts / 10) * 10000;
}
@Override
public Object[] getGroup() {
long ts300 = (this.ts / 300) * 300000;
Date d = new Date(ts300);
return new String[] {
String.valueOf(ColsDefine.formatDay.format(d)),
String.valueOf(ColsDefine.formatMin.format(d)),
(this.curr.isshaoma||this.curr.matchUrl.equals("pc"))?"pc":"wireless",
"aplus_text",
this.curr.pid,
"", this.curr.tid, "",ColsDefine.version };
}
}
@Override
public String[] getSumName() {
return ColsDefine.colSumName;
}
@Override
public String getTableName() {
return ColsDefine.tablename;
}
@Override
public String[] getGroupName() {
return ColsDefine.colname;
}
}