You can not select more than 25 topics Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.

PatternMatchRevFilter.java 5.6KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159
  1. /*
  2. * Copyright (C) 2009, Google Inc.
  3. * Copyright (C) 2008, Shawn O. Pearce <spearce@spearce.org>
  4. * and other copyright owners as documented in the project's IP log.
  5. *
  6. * This program and the accompanying materials are made available
  7. * under the terms of the Eclipse Distribution License v1.0 which
  8. * accompanies this distribution, is reproduced below, and is
  9. * available at http://www.eclipse.org/org/documents/edl-v10.php
  10. *
  11. * All rights reserved.
  12. *
  13. * Redistribution and use in source and binary forms, with or
  14. * without modification, are permitted provided that the following
  15. * conditions are met:
  16. *
  17. * - Redistributions of source code must retain the above copyright
  18. * notice, this list of conditions and the following disclaimer.
  19. *
  20. * - Redistributions in binary form must reproduce the above
  21. * copyright notice, this list of conditions and the following
  22. * disclaimer in the documentation and/or other materials provided
  23. * with the distribution.
  24. *
  25. * - Neither the name of the Eclipse Foundation, Inc. nor the
  26. * names of its contributors may be used to endorse or promote
  27. * products derived from this software without specific prior
  28. * written permission.
  29. *
  30. * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND
  31. * CONTRIBUTORS "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES,
  32. * INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES
  33. * OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
  34. * ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR
  35. * CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
  36. * SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT
  37. * NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES;
  38. * LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER
  39. * CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT,
  40. * STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
  41. * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF
  42. * ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
  43. */
  44. package org.eclipse.jgit.revwalk.filter;
  45. import java.io.IOException;
  46. import java.util.regex.Matcher;
  47. import java.util.regex.Pattern;
  48. import org.eclipse.jgit.errors.IncorrectObjectTypeException;
  49. import org.eclipse.jgit.errors.MissingObjectException;
  50. import org.eclipse.jgit.internal.JGitText;
  51. import org.eclipse.jgit.lib.Constants;
  52. import org.eclipse.jgit.revwalk.RevCommit;
  53. import org.eclipse.jgit.revwalk.RevWalk;
  54. import org.eclipse.jgit.util.RawCharSequence;
  55. /**
  56. * Abstract filter that searches text using extended regular expressions.
  57. */
  58. public abstract class PatternMatchRevFilter extends RevFilter {
  59. /**
  60. * Encode a string pattern for faster matching on byte arrays.
  61. * <p>
  62. * Force the characters to our funny UTF-8 only convention that we use on
  63. * raw buffers. This avoids needing to perform character set decodes on the
  64. * individual commit buffers.
  65. *
  66. * @param patternText
  67. * original pattern string supplied by the user or the
  68. * application.
  69. * @return same pattern, but re-encoded to match our funny raw UTF-8
  70. * character sequence {@link org.eclipse.jgit.util.RawCharSequence}.
  71. */
  72. protected static final String forceToRaw(final String patternText) {
  73. final byte[] b = Constants.encode(patternText);
  74. final StringBuilder needle = new StringBuilder(b.length);
  75. for (int i = 0; i < b.length; i++)
  76. needle.append((char) (b[i] & 0xff));
  77. return needle.toString();
  78. }
  79. private final String patternText;
  80. private final Matcher compiledPattern;
  81. /**
  82. * Construct a new pattern matching filter.
  83. *
  84. * @param pattern
  85. * text of the pattern. Callers may want to surround their
  86. * pattern with ".*" on either end to allow matching in the
  87. * middle of the string.
  88. * @param innerString
  89. * should .* be wrapped around the pattern of ^ and $ are
  90. * missing? Most users will want this set.
  91. * @param rawEncoding
  92. * should {@link #forceToRaw(String)} be applied to the pattern
  93. * before compiling it?
  94. * @param flags
  95. * flags from {@link java.util.regex.Pattern} to control how
  96. * matching performs.
  97. */
  98. protected PatternMatchRevFilter(String pattern, final boolean innerString,
  99. final boolean rawEncoding, final int flags) {
  100. if (pattern.length() == 0)
  101. throw new IllegalArgumentException(JGitText.get().cannotMatchOnEmptyString);
  102. patternText = pattern;
  103. if (innerString) {
  104. if (!pattern.startsWith("^") && !pattern.startsWith(".*")) //$NON-NLS-1$ //$NON-NLS-2$
  105. pattern = ".*" + pattern; //$NON-NLS-1$
  106. if (!pattern.endsWith("$") && !pattern.endsWith(".*")) //$NON-NLS-1$ //$NON-NLS-2$
  107. pattern = pattern + ".*"; //$NON-NLS-1$
  108. }
  109. final String p = rawEncoding ? forceToRaw(pattern) : pattern;
  110. compiledPattern = Pattern.compile(p, flags).matcher(""); //$NON-NLS-1$
  111. }
  112. /**
  113. * Get the pattern this filter uses.
  114. *
  115. * @return the pattern this filter is applying to candidate strings.
  116. */
  117. public String pattern() {
  118. return patternText;
  119. }
  120. /** {@inheritDoc} */
  121. @Override
  122. public boolean include(final RevWalk walker, final RevCommit cmit)
  123. throws MissingObjectException, IncorrectObjectTypeException,
  124. IOException {
  125. return compiledPattern.reset(text(cmit)).matches();
  126. }
  127. /** {@inheritDoc} */
  128. @Override
  129. public boolean requiresCommitBody() {
  130. return true;
  131. }
  132. /**
  133. * Obtain the raw text to match against.
  134. *
  135. * @param cmit
  136. * current commit being evaluated.
  137. * @return sequence for the commit's content that we need to match on.
  138. */
  139. protected abstract CharSequence text(RevCommit cmit);
  140. /** {@inheritDoc} */
  141. @SuppressWarnings("nls")
  142. @Override
  143. public String toString() {
  144. return super.toString() + "(\"" + patternText + "\")";
  145. }
  146. }