You cannot select more than 25 topics. Topics must start with a letter or number, can include dashes ('-'), and can be up to 35 characters long.

DeltaIndexScanner.java 4.2KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130
  1. /*
  2. * Copyright (C) 2010, Google Inc.
  3. * and other copyright owners as documented in the project's IP log.
  4. *
  5. * This program and the accompanying materials are made available
  6. * under the terms of the Eclipse Distribution License v1.0 which
  7. * accompanies this distribution, is reproduced below, and is
  8. * available at http://www.eclipse.org/org/documents/edl-v10.php
  9. *
  10. * All rights reserved.
  11. *
  12. * Redistribution and use in source and binary forms, with or
  13. * without modification, are permitted provided that the following
  14. * conditions are met:
  15. *
  16. * - Redistributions of source code must retain the above copyright
  17. * notice, this list of conditions and the following disclaimer.
  18. *
  19. * - Redistributions in binary form must reproduce the above
  20. * copyright notice, this list of conditions and the following
  21. * disclaimer in the documentation and/or other materials provided
  22. * with the distribution.
  23. *
  24. * - Neither the name of the Eclipse Foundation, Inc. nor the
  25. * names of its contributors may be used to endorse or promote
  26. * products derived from this software without specific prior
  27. * written permission.
  28. *
  29. * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND
  30. * CONTRIBUTORS "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES,
  31. * INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES
  32. * OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
  33. * ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR
  34. * CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
  35. * SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT
  36. * NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES;
  37. * LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER
  38. * CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT,
  39. * STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
  40. * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF
  41. * ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
  42. */
  43. package org.eclipse.jgit.internal.storage.pack;
  44. /**
  45. * Supports {@link DeltaIndex} by performing a partial scan of the content.
  46. */
  47. class DeltaIndexScanner {
  48. final int[] table;
  49. // To save memory the buckets for hash chains are stored in correlated
  50. // arrays. This permits us to get 3 values per entry, without paying
  51. // the penalty for an object header on each entry.
  52. final long[] entries;
  53. final int[] next;
  54. final int tableMask;
  55. private int entryCnt;
  56. DeltaIndexScanner(byte[] raw, int len) {
  57. // Clip the length so it falls on a block boundary. We won't
  58. // bother to scan the final partial block.
  59. //
  60. len -= (len % DeltaIndex.BLKSZ);
  61. final int worstCaseBlockCnt = len / DeltaIndex.BLKSZ;
  62. if (worstCaseBlockCnt < 1) {
  63. table = new int[] {};
  64. tableMask = 0;
  65. entries = new long[] {};
  66. next = new int[] {};
  67. } else {
  68. table = new int[tableSize(worstCaseBlockCnt)];
  69. tableMask = table.length - 1;
  70. // As we insert blocks we preincrement so that 0 is never a
  71. // valid entry. Therefore we have to allocate one extra space.
  72. //
  73. entries = new long[1 + worstCaseBlockCnt];
  74. next = new int[entries.length];
  75. scan(raw, len);
  76. }
  77. }
  78. private void scan(byte[] raw, final int end) {
  79. // We scan the input backwards, and always insert onto the
  80. // front of the chain. This ensures that chains will have lower
  81. // offsets at the front of the chain, allowing us to prefer the
  82. // earlier match rather than the later match.
  83. //
  84. int lastHash = 0;
  85. int ptr = end - DeltaIndex.BLKSZ;
  86. do {
  87. final int key = DeltaIndex.hashBlock(raw, ptr);
  88. final int tIdx = key & tableMask;
  89. final int head = table[tIdx];
  90. if (head != 0 && lastHash == key) {
  91. // Two consecutive blocks have the same content hash,
  92. // prefer the earlier block because we want to use the
  93. // longest sequence we can during encoding.
  94. //
  95. entries[head] = (((long) key) << 32) | ptr;
  96. } else {
  97. final int eIdx = ++entryCnt;
  98. entries[eIdx] = (((long) key) << 32) | ptr;
  99. next[eIdx] = head;
  100. table[tIdx] = eIdx;
  101. }
  102. lastHash = key;
  103. ptr -= DeltaIndex.BLKSZ;
  104. } while (0 <= ptr);
  105. }
  106. private static int tableSize(final int worstCaseBlockCnt) {
  107. int shift = 32 - Integer.numberOfLeadingZeros(worstCaseBlockCnt);
  108. int sz = 1 << (shift - 1);
  109. if (sz < worstCaseBlockCnt)
  110. sz <<= 1;
  111. return sz;
  112. }
  113. }