/*******************************************************************************
*
* Copyright (c) 2004-2011 Oracle Corporation
*
* All rights reserved. This program and the accompanying materials
* are made available under the terms of the Eclipse Public License v1.0
* which accompanies this distribution, and is available at
* http://www.eclipse.org/legal/epl-v10.html
*
* Contributors:
* Kohsuke Kawaguchi
*
*******************************************************************************/
package hudson.util;
import java.util.Collection;
import java.util.Arrays;
/**
 * Computes the string edit distance.
 *
 * <p> The distance is the minimum number of single-character insertions,
 * deletions and substitutions (each with a cost of 1) needed to turn one
 * string into the other. Refer to a computer science text book for the
 * definition of the "string edit distance".
 *
 * <p> Characters are compared as UTF-16 code units via
 * {@link String#charAt(int)}, so a supplementary character (surrogate pair)
 * counts as two units.
 *
 * @author Kohsuke Kawaguchi (kohsuke.kawaguchi@sun.com)
 */
public class EditDistance {

    /**
     * Computes the edit distance between two strings.
     *
     * <p> The complexity is O(nm) time where n=a.length() and m=b.length(),
     * using two working rows of min(n,m)+1 integers.
     *
     * @param a the first string; must not be null
     * @param b the second string; must not be null
     * @return the number of single-character edits separating {@code a} and {@code b}
     * @throws NullPointerException if either argument is null
     */
    public static int editDistance(String a, String b) {
        return new EditDistance(a, b).calc();
    }

    /**
     * Finds the string in the
     * <code>group</code> closest to
     * <code>key</code> and returns it.
     *
     * <p> When several candidates are equally close, the one that appears
     * first in the array is returned.
     *
     * @param key   the string to look for
     * @param group the candidates to choose from
     * @return null if group.length==0.
     */
    public static String findNearest(String key, String[] group) {
        return findNearest(key, Arrays.asList(group));
    }

    /**
     * Finds the string in the
     * <code>group</code> closest to
     * <code>key</code> and returns it.
     *
     * <p> Candidates are visited in the collection's iteration order and the
     * first one with the smallest distance is returned. The scan stops as
     * soon as a candidate at distance 0 is found, because no later candidate
     * can be strictly closer.
     *
     * @param key   the string to look for
     * @param group the candidates to choose from
     * @return the closest candidate, or null if the group is empty.
     */
    public static String findNearest(String key, Collection<String> group) {
        int best = Integer.MAX_VALUE;
        String nearest = null;
        for (String candidate : group) {
            int distance = editDistance(key, candidate);
            if (distance < best) {
                best = distance;
                nearest = candidate;
                if (best == 0) {
                    // Exact match: the strict "<" above means nothing later could replace it.
                    break;
                }
            }
        }
        return nearest;
    }

    /**
     * cost vector: the row of the distance table currently being filled in.
     */
    private int[] cost;

    /**
     * back buffer: the previously completed row of the distance table.
     */
    private int[] back;

    /**
     * Two strings to be compared. {@code a} is never longer than {@code b},
     * so that the row buffers are sized on the shorter string.
     */
    private final String a, b;

    /**
     * Prepares the working buffers for comparing the two given strings.
     *
     * <p> The distance is symmetric under unit costs, so the arguments are
     * reordered such that the shorter one defines the row length.
     */
    private EditDistance(String a, String b) {
        if (a.length() <= b.length()) {
            this.a = a;
            this.b = b;
        } else {
            this.a = b;
            this.b = a;
        }
        int width = this.a.length() + 1;
        cost = new int[width];
        back = new int[width]; // back buffer
        // Row 0: turning a prefix of "a" of length i into the empty string takes i deletions.
        for (int i = 0; i < width; i++) {
            cost[i] = i;
        }
    }

    /**
     * Swaps two buffers.
     */
    private void flip() {
        int[] t = cost;
        cost = back;
        back = t;
    }

    /**
     * Returns the smallest of the three values.
     */
    private static int min(int a, int b, int c) {
        return Math.min(a, Math.min(b, c));
    }

    /**
     * Fills the distance table one row per character of {@code b}, keeping
     * only the current and the previous row, and returns the final cell.
     */
    private int calc() {
        int aLength = a.length();
        int bLength = b.length();
        for (int j = 0; j < bLength; j++) {
            // The row just finished becomes "back"; "cost" is overwritten below.
            flip();
            // Empty prefix of "a" versus the first j+1 characters of "b": j+1 insertions.
            cost[0] = j + 1;
            char bChar = b.charAt(j);
            for (int i = 0; i < aLength; i++) {
                int match = (a.charAt(i) == bChar) ? 0 : 1;
                // Cheapest of: substitute/keep (diagonal), or the two single-character
                // insert/delete moves (left neighbour and cell above).
                cost[i + 1] = min(back[i] + match, cost[i] + 1, back[i + 1] + 1);
            }
        }
        return cost[aLength];
    }
}