/* * Copyright (C) 2010, Google Inc. * and other copyright owners as documented in the project's IP log. * * This program and the accompanying materials are made available * under the terms of the Eclipse Distribution License v1.0 which * accompanies this distribution, is reproduced below, and is * available at http://www.eclipse.org/org/documents/edl-v10.php * * All rights reserved. * * Redistribution and use in source and binary forms, with or * without modification, are permitted provided that the following * conditions are met: * * - Redistributions of source code must retain the above copyright * notice, this list of conditions and the following disclaimer. * * - Redistributions in binary form must reproduce the above * copyright notice, this list of conditions and the following * disclaimer in the documentation and/or other materials provided * with the distribution. * * - Neither the name of the Eclipse Foundation, Inc. nor the * names of its contributors may be used to endorse or promote * products derived from this software without specific prior * written permission. * * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND * CONTRIBUTORS "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, * INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES * OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE * ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR * CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, * SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT * NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; * LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER * CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, * STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF * ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. */ package org.eclipse.jgit.diff; import static org.junit.Assert.assertEquals; import static org.junit.Assert.assertTrue; import java.io.ByteArrayInputStream; import java.io.IOException; import org.eclipse.jgit.diff.SimilarityIndex.TableFullException; import org.eclipse.jgit.lib.Constants; import org.junit.Test; public class SimilarityIndexTest { @Test public void testIndexingSmallObject() throws TableFullException { SimilarityIndex si = hash("" // + "A\n" // + "B\n" // + "D\n" // + "B\n" // ); int key_A = keyFor("A\n"); int key_B = keyFor("B\n"); int key_D = keyFor("D\n"); assertTrue(key_A != key_B && key_A != key_D && key_B != key_D); assertEquals(3, si.size()); assertEquals(2, si.count(si.findIndex(key_A))); assertEquals(4, si.count(si.findIndex(key_B))); assertEquals(2, si.count(si.findIndex(key_D))); } @Test public void testIndexingLargeObject() throws IOException, TableFullException { byte[] in = ("" // + "A\n" // + "B\n" // + "B\n" // + "B\n").getBytes("UTF-8"); SimilarityIndex si = new SimilarityIndex(); si.hash(new ByteArrayInputStream(in), in.length, false); assertEquals(2, si.size()); } @Test public void testCommonScore_SameFiles() throws TableFullException { String text = "" // + "A\n" // + "B\n" // + "D\n" // + "B\n"; SimilarityIndex src = hash(text); SimilarityIndex dst = hash(text); assertEquals(8, src.common(dst)); assertEquals(8, dst.common(src)); assertEquals(100, src.score(dst, 100)); assertEquals(100, dst.score(src, 100)); } @Test public void testCommonScore_SameFiles_CR_canonicalization() throws TableFullException { String text = "" // + "A\r\n" // + "B\r\n" // + "D\r\n" // + "B\r\n"; SimilarityIndex src = hash(text); SimilarityIndex dst = hash(text.replace("\r", "")); assertEquals(8, src.common(dst)); assertEquals(8, dst.common(src)); assertEquals(100, src.score(dst, 100)); assertEquals(100, dst.score(src, 100)); } @Test public void testCommonScoreLargeObject_SameFiles_CR_canonicalization() throws TableFullException, IOException { String text = "" // + "A\r\n" // + "B\r\n" // + "D\r\n" // + "B\r\n"; SimilarityIndex src = new SimilarityIndex(); byte[] bytes1 = text.getBytes("UTF-8"); src.hash(new ByteArrayInputStream(bytes1), bytes1.length, true); src.sort(); SimilarityIndex dst = new SimilarityIndex(); byte[] bytes2 = text.replace("\r", "").getBytes("UTF-8"); dst.hash(new ByteArrayInputStream(bytes2), bytes2.length, true); dst.sort(); assertEquals(8, src.common(dst)); assertEquals(8, dst.common(src)); assertEquals(100, src.score(dst, 100)); assertEquals(100, dst.score(src, 100)); } @Test public void testCommonScore_EmptyFiles() throws TableFullException { SimilarityIndex src = hash(""); SimilarityIndex dst = hash(""); assertEquals(0, src.common(dst)); assertEquals(0, dst.common(src)); } @Test public void testCommonScore_TotallyDifferentFiles() throws TableFullException { SimilarityIndex src = hash("A\n"); SimilarityIndex dst = hash("D\n"); assertEquals(0, src.common(dst)); assertEquals(0, dst.common(src)); } @Test public void testCommonScore_SimiliarBy75() throws TableFullException { SimilarityIndex src = hash("A\nB\nC\nD\n"); SimilarityIndex dst = hash("A\nB\nC\nQ\n"); assertEquals(6, src.common(dst)); assertEquals(6, dst.common(src)); assertEquals(75, src.score(dst, 100)); assertEquals(75, dst.score(src, 100)); } private static SimilarityIndex hash(String text) throws TableFullException { SimilarityIndex src = new SimilarityIndex(); byte[] raw = Constants.encode(text); src.hash(raw, 0, raw.length); src.sort(); return src; } private static int keyFor(String line) throws TableFullException { SimilarityIndex si = hash(line); assertEquals("single line scored", 1, si.size()); return si.key(0); } }