package com.kennycason.kumo.nlp.normalize;
import java.util.regex.Pattern;
/**
* Created by kenny on 7/1/14.
*/
public class CharacterStrippingNormalizer implements Normalizer {
private static final Pattern DEFAULT_PATTERN = Pattern.compile("\\.|:|;|\\(|\\)|\"|,|\\?|,|!|<|>|/");
private static final String DEFAULT_REPLACE_WITH = "";
private final Pattern replacePattern;
private final String replaceWith;
public CharacterStrippingNormalizer() {
replacePattern = DEFAULT_PATTERN;
replaceWith = DEFAULT_REPLACE_WITH;
}
public CharacterStrippingNormalizer(final Pattern replacePattern, final String replaceWith) {
this.replacePattern = replacePattern;
this.replaceWith = replaceWith;
}
@Override
public String normalize(String text) {
return DEFAULT_PATTERN.matcher(text).replaceAll(DEFAULT_REPLACE_WITH);
}
}