/* * Copyright 2011 Greg Milette and Adam Stroud * * Licensed under the Apache License, Version 2.0 (the "License"); * you may not use this file except in compliance with the License. * You may obtain a copy of the License at * * http://www.apache.org/licenses/LICENSE-2.0 * * Unless required by applicable law or agreed to in writing, software * distributed under the License is distributed on an "AS IS" BASIS, * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. * See the License for the specific language governing permissions and * limitations under the License. */ package root.gast.speech.text.match; /** * encode strings using soundex, but allow partial matches * @author Greg Milette <<a href="mailto:gregorym@gmail.com">gregorym@gmail.com</a>> */ public class SoundsLikeThresholdWordMatcher extends SoundsLikeWordMatcher { private int minimumCharactersSame; public SoundsLikeThresholdWordMatcher(int minimumCharactersSame, String... wordsIn) { super(wordsIn); this.minimumCharactersSame = minimumCharactersSame; } @Override public boolean isIn(String wordCheck) { boolean in = false; String compareTo = soundex.encode(wordCheck); for (String word : getWords()) { if (sameEncodedString(word, compareTo)) { in = true; break; } } return in; } private boolean sameEncodedString(String s1, String s2) { int numSame = 0; for (int i = 0; i < s1.length(); i++) { char c1 = s1.charAt(i); char c2 = s2.charAt(i); if (c1 == c2) { numSame++; } } return (numSame >= minimumCharactersSame); } }