/*
* EnglishSeoStopWordCleaner.java created on 2011-01-26
*
* Created by Brushing Bits Labs
* http://www.brushingbits.org
*
* Licensed under the Apache License, Version 2.0 (the "License");
* you may not use this file except in compliance with the License.
* You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
package org.brushingbits.jnap.common.seo;
import java.util.Locale;
/**
 * {@link RegExpSeoStopWordCleaner} specialisation that supplies an English
 * stop word list and the English locales it is declared for.
 *
 * <p>This class only provides data: how the words are matched and removed is
 * defined by the superclass, which is not part of this file.</p>
 *
 * <p>The word list and the locale list are class-level constants shared by all
 * instances. Both accessors return copies, so modifying a returned array never
 * affects this class or any other caller.</p>
 *
 * @author Daniel Rochetti
 * @since 1.0
 */
public class EnglishSeoStopWordCleaner extends RegExpSeoStopWordCleaner {

    /** Locales this cleaner declares support for: generic English, UK and US. */
    private static final Locale[] SUPPORTED_LOCALES = new Locale[] {
            Locale.ENGLISH, Locale.UK, Locale.US };

    /**
     * English stop words, all lower case and in alphabetical order. Besides
     * common function words the list also contains a few unit abbreviations
     * ("kg", "km", "min", "ml", "mm") and contractions written with an ASCII
     * apostrophe (e.g. "aren't").
     */
    private static final String[] STOP_WORDS = new String[] { "about", "after",
            "again", "all", "almost", "also", "although", "always", "among",
            "an", "and", "another", "any", "approximately", "are", "aren't",
            "as", "at", "be", "because", "been", "before", "being", "between",
            "both", "but", "by", "can", "could", "did", "do", "does", "done",
            "due", "during", "each", "either", "enough", "especially", "etc",
            "followed", "following", "for", "found", "from", "further", "give",
            "given", "giving", "had", "hardly", "has", "have", "haven't",
            "having", "here", "how", "however", "if", "in", "into", "is", "it",
            "its", "itself", "just", "kg", "km", "largely", "like", "made",
            "mainly", "make", "may", "might", "min", "ml", "mm", "more",
            "most", "mostly", "must", "nearly", "neither", "no", "nor", "not",
            "now", "obtain", "obtained", "of", "often", "on", "only", "or",
            "other", "our", "out", "over", "overall", "per", "perhaps",
            "possible", "previously", "quite", "rather", "really", "regarding",
            "resulted", "resulting", "same", "seem", "seen", "several",
            "should", "show", "showed", "shown", "shows", "significant",
            "significantly", "since", "so", "some", "such", "suggest", "than",
            "that", "the", "their", "theirs", "them", "then", "there", "these",
            "they", "this", "those", "through", "thus", "to", "under", "up",
            "upon", "use", "used", "using", "various", "very", "was", "wasn't",
            "we", "were", "weren't", "what", "when", "whereas", "which",
            "while", "will", "with", "within", "without", "would", "wouldn't" };

    /**
     * Returns the locales this cleaner declares support for.
     *
     * @return a new array holding {@link Locale#ENGLISH}, {@link Locale#UK}
     *         and {@link Locale#US}, in that order
     */
    public Locale[] getSupportedLocales() {
        // Arrays are mutable even when the field is final; return a copy so a
        // caller cannot alter the shared constant.
        return SUPPORTED_LOCALES.clone();
    }

    /**
     * Returns the English stop words.
     *
     * @return a new array holding every stop word, lower case and in
     *         alphabetical order
     */
    public String[] getSeoStopWords() {
        // Defensive copy: keeps the shared word list intact if a caller
        // modifies the returned array.
        return STOP_WORDS.clone();
    }

}