package owlaccessor;
import java.util.HashSet;
import java.util.Set;
import java.util.StringTokenizer;
import outputter.knowledge.Dictionary;
public class WordFilter {
private Set<String> wl;
public WordFilter(){
wl = new HashSet<String>();
wl.addAll(createSubset(Dictionary.STOP));
wl.addAll(createSubset(Dictionary.NUMBERS));
wl.addAll(createSubset(Dictionary.FORBIDDEN));
wl.addAll(createSubset(Dictionary.PRONOUN));
wl.addAll(createSubset(Dictionary.CHARACTER));
wl.addAll(createSubset(Dictionary.PROPOSITION));
wl.addAll(createSubset(Dictionary.CLUSTER));
wl.addAll(createSubset(Dictionary.SUBSTRUCTURE));
wl.addAll(createSubset(Dictionary.ADDITIONAL));
wl.add("bearer");
wl.add("bearer's");
wl.add("inhering");
wl.add("virtue");
}
/*
* s contains words to be eliminated separated by space
*
* */
private Set<String> createSubset(String s){
Set<String> result = new HashSet<String>();
StringTokenizer st = new StringTokenizer(s, "|");
while (st.hasMoreTokens()){
result.add(st.nextToken().trim());
}
return result;
}
public boolean isInList(String s){
if(wl.contains(s.trim().toLowerCase()))
return true;
else
return false;
}
}