123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190 |
- /*
- * Copyright (C) 2010, Google Inc.
- * and other copyright owners as documented in the project's IP log.
- *
- * This program and the accompanying materials are made available
- * under the terms of the Eclipse Distribution License v1.0 which
- * accompanies this distribution, is reproduced below, and is
- * available at http://www.eclipse.org/org/documents/edl-v10.php
- *
- * All rights reserved.
- *
- * Redistribution and use in source and binary forms, with or
- * without modification, are permitted provided that the following
- * conditions are met:
- *
- * - Redistributions of source code must retain the above copyright
- * notice, this list of conditions and the following disclaimer.
- *
- * - Redistributions in binary form must reproduce the above
- * copyright notice, this list of conditions and the following
- * disclaimer in the documentation and/or other materials provided
- * with the distribution.
- *
- * - Neither the name of the Eclipse Foundation, Inc. nor the
- * names of its contributors may be used to endorse or promote
- * products derived from this software without specific prior
- * written permission.
- *
- * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND
- * CONTRIBUTORS "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES,
- * INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES
- * OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
- * ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR
- * CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
- * SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT
- * NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES;
- * LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER
- * CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT,
- * STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
- * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF
- * ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
- */
-
- package org.eclipse.jgit.diff;
-
- import static java.nio.charset.StandardCharsets.UTF_8;
- import static org.junit.Assert.assertEquals;
- import static org.junit.Assert.assertTrue;
-
- import java.io.ByteArrayInputStream;
- import java.io.IOException;
-
- import org.eclipse.jgit.diff.SimilarityIndex.TableFullException;
- import org.eclipse.jgit.lib.Constants;
- import org.junit.Test;
-
- public class SimilarityIndexTest {
- @Test
- public void testIndexingSmallObject() throws TableFullException {
- SimilarityIndex si = hash("" //
- + "A\n" //
- + "B\n" //
- + "D\n" //
- + "B\n" //
- );
-
- int key_A = keyFor("A\n");
- int key_B = keyFor("B\n");
- int key_D = keyFor("D\n");
- assertTrue(key_A != key_B && key_A != key_D && key_B != key_D);
-
- assertEquals(3, si.size());
- assertEquals(2, si.count(si.findIndex(key_A)));
- assertEquals(4, si.count(si.findIndex(key_B)));
- assertEquals(2, si.count(si.findIndex(key_D)));
- }
-
- @Test
- public void testIndexingLargeObject() throws IOException,
- TableFullException {
- byte[] in = ("" //
- + "A\n" //
- + "B\n" //
- + "B\n" //
- + "B\n").getBytes(UTF_8);
- SimilarityIndex si = new SimilarityIndex();
- si.hash(new ByteArrayInputStream(in), in.length, false);
- assertEquals(2, si.size());
- }
-
- @Test
- public void testCommonScore_SameFiles() throws TableFullException {
- String text = "" //
- + "A\n" //
- + "B\n" //
- + "D\n" //
- + "B\n";
- SimilarityIndex src = hash(text);
- SimilarityIndex dst = hash(text);
- assertEquals(8, src.common(dst));
- assertEquals(8, dst.common(src));
-
- assertEquals(100, src.score(dst, 100));
- assertEquals(100, dst.score(src, 100));
- }
-
- @Test
- public void testCommonScore_SameFiles_CR_canonicalization()
- throws TableFullException {
- String text = "" //
- + "A\r\n" //
- + "B\r\n" //
- + "D\r\n" //
- + "B\r\n";
- SimilarityIndex src = hash(text);
- SimilarityIndex dst = hash(text.replace("\r", ""));
- assertEquals(8, src.common(dst));
- assertEquals(8, dst.common(src));
-
- assertEquals(100, src.score(dst, 100));
- assertEquals(100, dst.score(src, 100));
- }
-
- @Test
- public void testCommonScoreLargeObject_SameFiles_CR_canonicalization()
- throws TableFullException, IOException {
- String text = "" //
- + "A\r\n" //
- + "B\r\n" //
- + "D\r\n" //
- + "B\r\n";
- SimilarityIndex src = new SimilarityIndex();
- byte[] bytes1 = text.getBytes(UTF_8);
- src.hash(new ByteArrayInputStream(bytes1), bytes1.length, true);
- src.sort();
-
- SimilarityIndex dst = new SimilarityIndex();
- byte[] bytes2 = text.replace("\r", "").getBytes(UTF_8);
- dst.hash(new ByteArrayInputStream(bytes2), bytes2.length, true);
- dst.sort();
-
- assertEquals(8, src.common(dst));
- assertEquals(8, dst.common(src));
-
- assertEquals(100, src.score(dst, 100));
- assertEquals(100, dst.score(src, 100));
- }
-
- @Test
- public void testCommonScore_EmptyFiles() throws TableFullException {
- SimilarityIndex src = hash("");
- SimilarityIndex dst = hash("");
- assertEquals(0, src.common(dst));
- assertEquals(0, dst.common(src));
- }
-
- @Test
- public void testCommonScore_TotallyDifferentFiles()
- throws TableFullException {
- SimilarityIndex src = hash("A\n");
- SimilarityIndex dst = hash("D\n");
- assertEquals(0, src.common(dst));
- assertEquals(0, dst.common(src));
- }
-
- @Test
- public void testCommonScore_SimiliarBy75() throws TableFullException {
- SimilarityIndex src = hash("A\nB\nC\nD\n");
- SimilarityIndex dst = hash("A\nB\nC\nQ\n");
- assertEquals(6, src.common(dst));
- assertEquals(6, dst.common(src));
-
- assertEquals(75, src.score(dst, 100));
- assertEquals(75, dst.score(src, 100));
- }
-
- private static SimilarityIndex hash(String text) throws TableFullException {
- SimilarityIndex src = new SimilarityIndex();
- byte[] raw = Constants.encode(text);
- src.hash(raw, 0, raw.length);
- src.sort();
- return src;
- }
-
- private static int keyFor(String line) throws TableFullException {
- SimilarityIndex si = hash(line);
- assertEquals("single line scored", 1, si.size());
- return si.key(0);
- }
- }
|