package com.bmk.crawler;
/**
* @Intro 是否满足链接路由规则
* @author Lee
* @Date 2013-8-7
*/
public class Filter {
private static String regex1 = "http://category.dangdang.com/all/?category_path=";
private static String regex2 = "/all/?category_path=";
private static String regex3 = "http://product.dangdang.com/product.aspx?product_id=";
public static int category_min_size = "http://category.dangdang.com/all/?category_path=01.38.00.00.00.00".length();
public static int product_min_size = "http://product.dangdang.com/product.aspx?product_id=23230517".length();
public static LinkFilter filter1 = new LinkFilter() {
@Override
public boolean accept(String url) {
//url.matches(regex1)
if(url.contains(regex1) && url.startsWith(regex1)){
return true;
}
return false;
}
};
public static LinkFilter filter2 = new LinkFilter() {
@Override
public boolean accept(String url) {
if(url.contains(regex2) && url.startsWith(regex2)){
return true;
}
return false;
}
};
public static LinkFilter filter3 = new LinkFilter() {
@Override
public boolean accept(String url) {
if(url.contains(regex3) && url.startsWith(regex3)){
return true;
}
return false;
}
};
}