/*******************************************************************************
 * Breakout Cave Survey Visualizer
 *
 * Copyright (C) 2014 James Edwards
 *
 * jedwards8 at fastmail dot fm
 *
 * This program is free software; you can redistribute it and/or modify it under
 * the terms of the GNU General Public License as published by the Free Software
 * Foundation; either version 2 of the License, or (at your option) any later
 * version.
 *
 * This program is distributed in the hope that it will be useful, but WITHOUT
 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS
 * FOR A PARTICULAR PURPOSE. See the GNU General Public License for more
 * details.
 *
 * You should have received a copy of the GNU General Public License along with
 * this program; if not, write to the Free Software Foundation, Inc., 51
 * Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA.
 *******************************************************************************/
package org.andork.util;

import java.util.ArrayList;
import java.util.Collection;
import java.util.HashMap;
import java.util.List;
import java.util.Locale;
import java.util.Map;
import java.util.Objects;

/**
 * Maps input strings onto a list of expected strings, using explicitly
 * registered corrections first and {@code Levenshtein.distance} as a fallback.
 * <p>
 * Lookups are case-insensitive: inputs are lower-cased (locale-independently)
 * before being used as cache keys or compared against expected strings. Every
 * computed result is stored in the corrections map, so each distinct input is
 * only matched against the expected list once.
 * <p>
 * The class uses plain {@link ArrayList} / {@link HashMap} storage with no
 * synchronization of its own.
 */
public class LevenshteinCorrector {
	/** Candidate strings that {@link #correct(String)} may return, in insertion order. */
	private final List<String> expected = new ArrayList<String>();

	/** Lower-cased input mapped to its correction; holds explicit and computed entries. */
	private final Map<String, String> corrections = new HashMap<String, String>();

	/**
	 * Registers an explicit correction that takes precedence over distance
	 * matching.
	 *
	 * @param s
	 *            the input to correct; matched case-insensitively
	 * @param correction
	 *            the value {@link #correct(String)} returns for {@code s}
	 * @throws NullPointerException
	 *             if {@code s} is {@code null}
	 */
	public void addCorrection(String s, String correction) {
		Objects.requireNonNull(s, "s");
		corrections.put(s.toLowerCase(Locale.ROOT), correction);
	}

	/**
	 * Adds candidate strings that inputs may be corrected to.
	 *
	 * @param expected
	 *            the candidates to append to the expected list
	 * @throws NullPointerException
	 *             if {@code expected} is {@code null}
	 */
	public void addExpected(Collection<String> expected) {
		this.expected.addAll(expected);
	}

	/**
	 * Returns the correction for {@code s}.
	 * <p>
	 * A registered or previously computed correction is returned as-is.
	 * Otherwise the expected strings are scanned for the one with the smallest
	 * {@code Levenshtein.distance} to the lower-cased input, considering only
	 * candidates whose lower-cased form starts with a prefix of the input's
	 * first character and whose distance is strictly below
	 * {@code s.length() * 3 / 4}. Ties keep the earliest candidate. If nothing
	 * qualifies, the <em>lower-cased</em> input is returned. The outcome is
	 * printed to standard output and cached.
	 *
	 * @param s
	 *            the string to correct
	 * @return the matching expected string (in its original case), an explicit
	 *         correction, or the lower-cased input when no candidate is close
	 *         enough
	 * @throws NullPointerException
	 *             if {@code s} is {@code null}
	 */
	public String correct(String s) {
		Objects.requireNonNull(s, "s");
		// Locale.ROOT keeps keys stable regardless of the JVM default locale
		// (e.g. Turkish dotless i).
		s = s.toLowerCase(Locale.ROOT);

		String correction = corrections.get(s);
		if (correction != null) {
			return correction;
		}

		correction = s;
		// A candidate must differ from the input by less than 3/4 of its length.
		int bestDist = s.length() * 3 / 4;
		for (String exp : expected) {
			// Null/empty candidates have no first character to compare and
			// could never beat the threshold; skipping them avoids the
			// exception substring(0, 1) would otherwise throw.
			if (exp == null || exp.isEmpty()) {
				continue;
			}
			String explc = exp.toLowerCase(Locale.ROOT);
			// Cheap first-character filter before the distance computation.
			// NOTE(review): assumes Levenshtein.distance has no side effects.
			if (!s.startsWith(explc.substring(0, 1))) {
				continue;
			}
			int dist = Levenshtein.distance(s, explc);
			if (dist < bestDist) {
				correction = exp;
				bestDist = dist;
			}
		}

		// NOTE(review): diagnostic output on stdout is kept for backward
		// compatibility; consider routing it through a logger.
		System.out.println(s + " -> " + correction);
		corrections.put(s, correction);
		return correction;
	}
}