package com.geccocrawler.gecco.demo.sogouwx;
import java.util.List;
import com.geccocrawler.gecco.GeccoEngine;
import com.geccocrawler.gecco.annotation.Gecco;
import com.geccocrawler.gecco.annotation.HtmlField;
import com.geccocrawler.gecco.annotation.RequestParameter;
import com.geccocrawler.gecco.request.HttpGetRequest;
import com.geccocrawler.gecco.spider.HtmlBean;
/**
 * Gecco bean bound to Sogou WeChat article-search result pages.
 *
 * <p>The {@code matchUrl} template carries a {@code {keyword}} placeholder; the
 * {@link #keyword} field is annotated with {@code @RequestParameter} so it
 * receives that value, and {@link #weixins} is filled from the elements selected
 * by the CSS path {@code .results .wx-rb}. Rendered beans are handed to the
 * pipeline registered under the name {@code consolePipeline}.
 */
@Gecco(matchUrl="http://weixin.sogou.com/weixin?type=2&query={keyword}", pipelines={"consolePipeline"})
public class SogouWX implements HtmlBean {

    private static final long serialVersionUID = 7504646787612579665L;

    /** Search keyword taken from the {@code query} part of the matched URL. */
    @RequestParameter
    private String keyword;

    /** One entry per element matched by {@code .results .wx-rb}. */
    @HtmlField(cssPath=".results .wx-rb")
    private List<WeiXin> weixins;

    /**
     * Demo entry point: crawls the search result page for a fixed keyword.
     *
     * @param args command-line arguments; not used
     */
    public static void main(String[] args) {
        // NOTE: a single WeChat article URL (http://mp.weixin.qq.com/s?...) was
        // previously tried as an alternative seed; only the search request is used.
        GeccoEngine.create()
                .classpath("com.geccocrawler.gecco.demo.sogouwx")
                .start(newSearchRequest())
                .interval(5000) // presumably milliseconds between requests; confirm against GeccoEngine
                .run();
    }

    /**
     * Builds the seed GET request for the search page, including the cookies and
     * browser-like headers the demo sends along with it.
     *
     * @return the configured seed request
     */
    private static HttpGetRequest newSearchRequest() {
        // The query value is the URL-encoded (UTF-8) form of "深圳".
        HttpGetRequest seedRequest =
                new HttpGetRequest("http://weixin.sogou.com/weixin?type=2&query=%E6%B7%B1%E5%9C%B3");

        // Hard-coded Sogou cookies; an additional "SUV" cookie is intentionally not sent.
        seedRequest.addCookie("SNUID", "1D22392EF4F6C4A92076C208F4DE3AAB");
        seedRequest.addCookie("SUID", "EED1CDDA6B20900A00000000570E1872");
        seedRequest.addCookie("IPLOC", "CN1100");

        // Request headers copied from a desktop browser session.
        seedRequest.addHeader("Host", "weixin.sogou.com");
        seedRequest.addHeader("Upgrade-Insecure-Requests", "1");
        seedRequest.addHeader("Accept", "text/html,application/xhtml+xml,application/xml;q=0.9,image/webp,*/*;q=0.8");
        seedRequest.addHeader("Accept-Encoding", "gzip, deflate, sdch");
        seedRequest.addHeader("Cache-Control", "max-age=0");
        return seedRequest;
    }

    /**
     * @return the search keyword bound from the request
     */
    public String getKeyword() {
        return this.keyword;
    }

    /**
     * @param keyword the search keyword to store on this bean
     */
    public void setKeyword(String keyword) {
        this.keyword = keyword;
    }

    /**
     * @return the extracted result entries
     */
    public List<WeiXin> getWeixins() {
        return this.weixins;
    }

    /**
     * @param weixins the result entries to store on this bean
     */
    public void setWeixins(List<WeiXin> weixins) {
        this.weixins = weixins;
    }
}