You cannot select more than 25 topics. Topics must start with a letter or number, can include dashes ('-'), and can be up to 35 characters long.

RawSubStringPattern.java 4.4KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138
  1. /*
  2. * Copyright (C) 2009, Google Inc.
  3. * Copyright (C) 2008, Shawn O. Pearce <spearce@spearce.org>
  4. * and other copyright owners as documented in the project's IP log.
  5. *
  6. * This program and the accompanying materials are made available
  7. * under the terms of the Eclipse Distribution License v1.0 which
  8. * accompanies this distribution, is reproduced below, and is
  9. * available at http://www.eclipse.org/org/documents/edl-v10.php
  10. *
  11. * All rights reserved.
  12. *
  13. * Redistribution and use in source and binary forms, with or
  14. * without modification, are permitted provided that the following
  15. * conditions are met:
  16. *
  17. * - Redistributions of source code must retain the above copyright
  18. * notice, this list of conditions and the following disclaimer.
  19. *
  20. * - Redistributions in binary form must reproduce the above
  21. * copyright notice, this list of conditions and the following
  22. * disclaimer in the documentation and/or other materials provided
  23. * with the distribution.
  24. *
  25. * - Neither the name of the Eclipse Foundation, Inc. nor the
  26. * names of its contributors may be used to endorse or promote
  27. * products derived from this software without specific prior
  28. * written permission.
  29. *
  30. * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND
  31. * CONTRIBUTORS "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES,
  32. * INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES
  33. * OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
  34. * ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR
  35. * CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
  36. * SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT
  37. * NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES;
  38. * LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER
  39. * CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT,
  40. * STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
  41. * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF
  42. * ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
  43. */
  44. package org.eclipse.jgit.util;
  45. import org.eclipse.jgit.internal.JGitText;
  46. import org.eclipse.jgit.lib.Constants;
  47. /**
  48. * Searches text using only substring search.
  49. * <p>
  50. * Instances are thread-safe. Multiple concurrent threads may perform matches on
  51. * different character sequences at the same time.
  52. */
  53. public class RawSubStringPattern {
  54. private final String needleString;
  55. private final byte[] needle;
  56. /**
  57. * Construct a new substring pattern.
  58. *
  59. * @param patternText
  60. * text to locate. This should be a literal string, as no
  61. * meta-characters are supported by this implementation. The
  62. * string may not be the empty string.
  63. */
  64. public RawSubStringPattern(final String patternText) {
  65. if (patternText.length() == 0)
  66. throw new IllegalArgumentException(JGitText.get().cannotMatchOnEmptyString);
  67. needleString = patternText;
  68. final byte[] b = Constants.encode(patternText);
  69. needle = new byte[b.length];
  70. for (int i = 0; i < b.length; i++)
  71. needle[i] = lc(b[i]);
  72. }
  73. /**
  74. * Match a character sequence against this pattern.
  75. *
  76. * @param rcs
  77. * the sequence to match. Must not be null but the length of the
  78. * sequence is permitted to be 0.
  79. * @return offset within <code>rcs</code> of the first occurrence of this
  80. * pattern; -1 if this pattern does not appear at any position of
  81. * <code>rcs</code>.
  82. */
  83. public int match(final RawCharSequence rcs) {
  84. final int needleLen = needle.length;
  85. final byte first = needle[0];
  86. final byte[] text = rcs.buffer;
  87. int matchPos = rcs.startPtr;
  88. final int maxPos = rcs.endPtr - needleLen;
  89. OUTER: for (; matchPos <= maxPos; matchPos++) {
  90. if (neq(first, text[matchPos])) {
  91. while (++matchPos <= maxPos && neq(first, text[matchPos])) {
  92. /* skip */
  93. }
  94. if (matchPos > maxPos)
  95. return -1;
  96. }
  97. int si = matchPos + 1;
  98. for (int j = 1; j < needleLen; j++, si++) {
  99. if (neq(needle[j], text[si]))
  100. continue OUTER;
  101. }
  102. return matchPos;
  103. }
  104. return -1;
  105. }
  106. private static final boolean neq(final byte a, final byte b) {
  107. return a != b && a != lc(b);
  108. }
  109. private static final byte lc(final byte q) {
  110. return (byte) StringUtils.toLowerCase((char) (q & 0xff));
  111. }
  112. /**
  113. * Get the literal pattern string this instance searches for.
  114. *
  115. * @return the pattern string given to our constructor.
  116. */
  117. public String pattern() {
  118. return needleString;
  119. }
  120. @Override
  121. public String toString() {
  122. return pattern();
  123. }
  124. }