| /* |
| * Copyright (C) 2010, Google Inc. |
| * and other copyright owners as documented in the project's IP log. |
| * |
| * This program and the accompanying materials are made available |
| * under the terms of the Eclipse Distribution License v1.0 which |
| * accompanies this distribution, is reproduced below, and is |
| * available at http://www.eclipse.org/org/documents/edl-v10.php |
| * |
| * All rights reserved. |
| * |
| * Redistribution and use in source and binary forms, with or |
| * without modification, are permitted provided that the following |
| * conditions are met: |
| * |
| * - Redistributions of source code must retain the above copyright |
| * notice, this list of conditions and the following disclaimer. |
| * |
| * - Redistributions in binary form must reproduce the above |
| * copyright notice, this list of conditions and the following |
| * disclaimer in the documentation and/or other materials provided |
| * with the distribution. |
| * |
| * - Neither the name of the Eclipse Foundation, Inc. nor the |
| * names of its contributors may be used to endorse or promote |
| * products derived from this software without specific prior |
| * written permission. |
| * |
| * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND |
| * CONTRIBUTORS "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, |
| * INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES |
| * OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE |
| * ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR |
| * CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, |
| * SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT |
| * NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; |
| * LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER |
| * CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, |
| * STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) |
| * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF |
| * ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. |
| */ |
| |
| package org.eclipse.jgit.diff; |
| |
| import static java.nio.charset.StandardCharsets.UTF_8; |
| import static org.junit.Assert.assertEquals; |
| import static org.junit.Assert.assertTrue; |
| |
| import java.io.ByteArrayInputStream; |
| import java.io.IOException; |
| |
| import org.eclipse.jgit.diff.SimilarityIndex.TableFullException; |
| import org.eclipse.jgit.lib.Constants; |
| import org.junit.Test; |
| |
| public class SimilarityIndexTest { |
| @Test |
| public void testIndexingSmallObject() throws TableFullException { |
| SimilarityIndex si = hash("" // |
| + "A\n" // |
| + "B\n" // |
| + "D\n" // |
| + "B\n" // |
| ); |
| |
| int key_A = keyFor("A\n"); |
| int key_B = keyFor("B\n"); |
| int key_D = keyFor("D\n"); |
| assertTrue(key_A != key_B && key_A != key_D && key_B != key_D); |
| |
| assertEquals(3, si.size()); |
| assertEquals(2, si.count(si.findIndex(key_A))); |
| assertEquals(4, si.count(si.findIndex(key_B))); |
| assertEquals(2, si.count(si.findIndex(key_D))); |
| } |
| |
| @Test |
| public void testIndexingLargeObject() throws IOException, |
| TableFullException { |
| byte[] in = ("" // |
| + "A\n" // |
| + "B\n" // |
| + "B\n" // |
| + "B\n").getBytes(UTF_8); |
| SimilarityIndex si = new SimilarityIndex(); |
| si.hash(new ByteArrayInputStream(in), in.length, false); |
| assertEquals(2, si.size()); |
| } |
| |
| @Test |
| public void testCommonScore_SameFiles() throws TableFullException { |
| String text = "" // |
| + "A\n" // |
| + "B\n" // |
| + "D\n" // |
| + "B\n"; |
| SimilarityIndex src = hash(text); |
| SimilarityIndex dst = hash(text); |
| assertEquals(8, src.common(dst)); |
| assertEquals(8, dst.common(src)); |
| |
| assertEquals(100, src.score(dst, 100)); |
| assertEquals(100, dst.score(src, 100)); |
| } |
| |
| @Test |
| public void testCommonScore_SameFiles_CR_canonicalization() |
| throws TableFullException { |
| String text = "" // |
| + "A\r\n" // |
| + "B\r\n" // |
| + "D\r\n" // |
| + "B\r\n"; |
| SimilarityIndex src = hash(text); |
| SimilarityIndex dst = hash(text.replace("\r", "")); |
| assertEquals(8, src.common(dst)); |
| assertEquals(8, dst.common(src)); |
| |
| assertEquals(100, src.score(dst, 100)); |
| assertEquals(100, dst.score(src, 100)); |
| } |
| |
| @Test |
| public void testCommonScoreLargeObject_SameFiles_CR_canonicalization() |
| throws TableFullException, IOException { |
| String text = "" // |
| + "A\r\n" // |
| + "B\r\n" // |
| + "D\r\n" // |
| + "B\r\n"; |
| SimilarityIndex src = new SimilarityIndex(); |
| byte[] bytes1 = text.getBytes(UTF_8); |
| src.hash(new ByteArrayInputStream(bytes1), bytes1.length, true); |
| src.sort(); |
| |
| SimilarityIndex dst = new SimilarityIndex(); |
| byte[] bytes2 = text.replace("\r", "").getBytes(UTF_8); |
| dst.hash(new ByteArrayInputStream(bytes2), bytes2.length, true); |
| dst.sort(); |
| |
| assertEquals(8, src.common(dst)); |
| assertEquals(8, dst.common(src)); |
| |
| assertEquals(100, src.score(dst, 100)); |
| assertEquals(100, dst.score(src, 100)); |
| } |
| |
| @Test |
| public void testCommonScore_EmptyFiles() throws TableFullException { |
| SimilarityIndex src = hash(""); |
| SimilarityIndex dst = hash(""); |
| assertEquals(0, src.common(dst)); |
| assertEquals(0, dst.common(src)); |
| } |
| |
| @Test |
| public void testCommonScore_TotallyDifferentFiles() |
| throws TableFullException { |
| SimilarityIndex src = hash("A\n"); |
| SimilarityIndex dst = hash("D\n"); |
| assertEquals(0, src.common(dst)); |
| assertEquals(0, dst.common(src)); |
| } |
| |
| @Test |
| public void testCommonScore_SimiliarBy75() throws TableFullException { |
| SimilarityIndex src = hash("A\nB\nC\nD\n"); |
| SimilarityIndex dst = hash("A\nB\nC\nQ\n"); |
| assertEquals(6, src.common(dst)); |
| assertEquals(6, dst.common(src)); |
| |
| assertEquals(75, src.score(dst, 100)); |
| assertEquals(75, dst.score(src, 100)); |
| } |
| |
| private static SimilarityIndex hash(String text) throws TableFullException { |
| SimilarityIndex src = new SimilarityIndex(); |
| byte[] raw = Constants.encode(text); |
| src.hash(raw, 0, raw.length); |
| src.sort(); |
| return src; |
| } |
| |
| private static int keyFor(String line) throws TableFullException { |
| SimilarityIndex si = hash(line); |
| assertEquals("single line scored", 1, si.size()); |
| return si.key(0); |
| } |
| } |