/** * Copyright 2014, Emory University * * Licensed under the Apache License, Version 2.0 (the "License"); * you may not use this file except in compliance with the License. * You may obtain a copy of the License at * * http://www.apache.org/licenses/LICENSE-2.0 * * Unless required by applicable law or agreed to in writing, software * distributed under the License is distributed on an "AS IS" BASIS, * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. * See the License for the specific language governing permissions and * limitations under the License. */ package edu.emory.clir.clearnlp.morphology.english; import java.util.Map; import java.util.Set; import edu.emory.clir.clearnlp.morphology.AbstractAffixReplacer; /** * @since 3.0.0 * @author Jinho D. Choi ({@code jinho.choi@emory.edu}) */ public class EnglishSuffixReplacer extends AbstractAffixReplacer { boolean b_doubleConsonants; public EnglishSuffixReplacer(String basePOS, String affixForm, String[] replacements, boolean doubleConsonants) { super(basePOS, affixForm, replacements); b_doubleConsonants = doubleConsonants; } @Override public String getBaseForm(Map<String,Set<String>> baseMap, String form) { return getBaseForm(baseMap.get(s_basePOS), form); } @Override public String getBaseForm(Set<String> baseSet, String form) { if (!form.endsWith(s_affixForm)) return null; int subLen = form.length() - s_affixForm.length(); String stem = form.substring(0, subLen); String base = getBaseFormAux(baseSet, stem); if (b_doubleConsonants && base == null && isDoubleConsonant(form, subLen)) { stem = form.substring(0, subLen-1); base = getBaseFormAux(baseSet, stem); } return base; } private String getBaseFormAux(Set<String> baseSet, String stem) { String base; for (String replacement : s_replacements) { base = stem + replacement; if (baseSet.contains(base)) return base; } return null; } private boolean isDoubleConsonant(String form, int subLen) { return subLen >= 4 && form.charAt(subLen-2) == form.charAt(subLen-1); } }