/*
* Copyright 2011 gitblit.com.
*
* Licensed under the Apache License, Version 2.0 (the "License");
* you may not use this file except in compliance with the License.
* You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
package com.gitblit.utils;
import java.io.ByteArrayOutputStream;
import java.io.UnsupportedEncodingException;
import java.nio.ByteBuffer;
import java.nio.CharBuffer;
import java.nio.charset.CharacterCodingException;
import java.nio.charset.Charset;
import java.nio.charset.CharsetDecoder;
import java.nio.charset.IllegalCharsetNameException;
import java.nio.charset.UnsupportedCharsetException;
import java.security.MessageDigest;
import java.security.NoSuchAlgorithmException;
import java.util.ArrayList;
import java.util.Arrays;
import java.util.Collection;
import java.util.Collections;
import java.util.Comparator;
import java.util.LinkedHashSet;
import java.util.List;
import java.util.Set;
import java.util.regex.Matcher;
import java.util.regex.Pattern;
import java.util.regex.PatternSyntaxException;
/**
 * Utility class of string functions: html escaping, padding and trimming,
 * digests, path manipulation, simple matching and charset-tolerant decoding.
 * All methods are static and keep no state.
 *
 * @author James Moger
 *
 */
public class StringUtils {

    public static final String MD5_TYPE = "MD5:";

    public static final String COMBINED_MD5_TYPE = "CMD5:";

    /** Markup emitted in place of every line terminator. */
    private static final String HTML_BREAK = "<br/>";

    /** Lower-case hexadecimal digits, indexed by nibble value. */
    private static final char[] HEX_DIGITS = "0123456789abcdef".toCharArray();

    /** Characters, besides letters and digits, that are accepted in a name. */
    private static final String VALID_NAME_CHARS = "/._-~";

    /** UTF-8 is guaranteed to be available on every JVM. */
    private static final Charset UTF_8 = Charset.forName("UTF-8");

    /** A backslash followed by exactly three digits, e.g. <code>\303</code>. */
    private static final Pattern OCTAL_ESCAPE = Pattern.compile("(\\\\\\d{3})");

    /**
     * Returns true if the string is null, empty, or contains only whitespace.
     *
     * @param value
     * @return true if string is null or blank
     */
    public static boolean isEmpty(String value) {
        return value == null || value.trim().length() == 0;
    }

    /**
     * Replaces carriage returns and line feeds with html line breaks. A
     * "\r\n" pair produces a single break.
     *
     * @param string
     * @return plain text with html line breaks
     */
    public static String breakLinesForHtml(String string) {
        // "\r\n" must be handled first so that it does not yield two breaks
        return string.replace("\r\n", HTML_BREAK).replace("\r", HTML_BREAK)
                .replace("\n", HTML_BREAK);
    }

    /**
     * Prepare text for html presentation. Replaces the characters
     * <code>&amp; &lt; &gt; "</code> with html entities.
     *
     * @param inStr
     * @param changeSpace
     *            if true, spaces become non-breaking spaces and tabs are
     *            expanded to a run of spaces and non-breaking spaces
     * @return plain text escaped for html
     */
    public static String escapeForHtml(String inStr, boolean changeSpace) {
        StringBuilder escaped = new StringBuilder(inStr.length() + 16);
        for (int i = 0; i < inStr.length(); i++) {
            char c = inStr.charAt(i);
            switch (c) {
            case '&':
                escaped.append("&amp;");
                break;
            case '<':
                escaped.append("&lt;");
                break;
            case '>':
                escaped.append("&gt;");
                break;
            case '"':
                escaped.append("&quot;");
                break;
            case ' ':
                if (changeSpace) {
                    escaped.append("&nbsp;");
                } else {
                    escaped.append(c);
                }
                break;
            case '\t':
                if (changeSpace) {
                    escaped.append(" &nbsp; &nbsp;");
                } else {
                    escaped.append(c);
                }
                break;
            default:
                escaped.append(c);
                break;
            }
        }
        return escaped.toString();
    }

    /**
     * Decode html entities back into plain text characters. Handles the
     * entities for <code>&amp; &lt; &gt; "</code> and the non-breaking space.
     *
     * @param inStr
     * @return returns plain text from html
     */
    public static String decodeFromHtml(String inStr) {
        // the ampersand entity is decoded last; decoding it first would turn
        // an escaped entity such as "&amp;lt;" into "<" instead of "&lt;"
        return inStr.replace("&lt;", "<").replace("&gt;", ">").replace("&quot;", "\"")
                .replace("&nbsp;", " ").replace("&amp;", "&");
    }

    /**
     * Encodes a url parameter by escaping forward slashes and spaces. No
     * other character is altered.
     *
     * @param inStr
     * @return the escaped value
     */
    public static String encodeURL(String inStr) {
        StringBuilder encoded = new StringBuilder(inStr.length() + 16);
        for (int i = 0; i < inStr.length(); i++) {
            char c = inStr.charAt(i);
            switch (c) {
            case '/':
                encoded.append("%2F");
                break;
            case ' ':
                encoded.append("%20");
                break;
            default:
                encoded.append(c);
                break;
            }
        }
        return encoded.toString();
    }

    /**
     * Flatten the list of strings into a single string with a space separator.
     *
     * @param values
     * @return flattened list
     */
    public static String flattenStrings(Collection<String> values) {
        return flattenStrings(values, " ");
    }

    /**
     * Flatten the list of strings into a single string with the specified
     * separator. The result is trimmed of leading and trailing whitespace.
     *
     * @param values
     * @param separator
     * @return flattened list
     */
    public static String flattenStrings(Collection<String> values, String separator) {
        StringBuilder sb = new StringBuilder();
        boolean first = true;
        for (String value : values) {
            if (!first) {
                sb.append(separator);
            }
            sb.append(value);
            first = false;
        }
        return sb.toString().trim();
    }

    /**
     * Returns a string trimmed to a maximum length with trailing ellipses. If
     * the string length is shorter than the max, the original string is
     * returned. If max is too small to hold the ellipses (less than 3) the
     * value is simply truncated to max characters.
     *
     * @param value
     * @param max
     * @return trimmed string
     */
    public static String trimString(String value, int max) {
        if (value.length() <= max) {
            return value;
        }
        if (max < 3) {
            // no room for "..."; max - 3 would be a negative substring index
            return value.substring(0, Math.max(0, max));
        }
        return value.substring(0, max - 3) + "...";
    }

    /**
     * Left pad a string with the specified character, if the string length is
     * less than the specified length.
     *
     * @param input
     * @param length
     * @param pad
     * @return left-padded string
     */
    public static String leftPad(String input, int length, char pad) {
        int missing = length - input.length();
        if (missing <= 0) {
            return input;
        }
        StringBuilder sb = new StringBuilder(length);
        for (int i = 0; i < missing; i++) {
            sb.append(pad);
        }
        return sb.append(input).toString();
    }

    /**
     * Right pad a string with the specified character, if the string length is
     * less than the specified length.
     *
     * @param input
     * @param length
     * @param pad
     * @return right-padded string
     */
    public static String rightPad(String input, int length, char pad) {
        int missing = length - input.length();
        if (missing <= 0) {
            return input;
        }
        StringBuilder sb = new StringBuilder(length).append(input);
        for (int i = 0; i < missing; i++) {
            sb.append(pad);
        }
        return sb.toString();
    }

    /**
     * Calculates the SHA1 of the string. The string is converted to bytes
     * using ISO-8859-1.
     *
     * @param text
     * @return sha1 of the string as lower-case hex
     */
    public static String getSHA1(String text) {
        try {
            return getSHA1(text.getBytes("iso-8859-1"));
        } catch (UnsupportedEncodingException u) {
            throw new RuntimeException(u);
        }
    }

    /**
     * Calculates the SHA1 of the byte array.
     *
     * @param bytes
     * @return sha1 of the byte array as lower-case hex
     */
    public static String getSHA1(byte[] bytes) {
        try {
            MessageDigest md = MessageDigest.getInstance("SHA-1");
            return toHex(md.digest(bytes));
        } catch (NoSuchAlgorithmException t) {
            throw new RuntimeException(t);
        }
    }

    /**
     * Calculates the MD5 of the string. The string is converted to bytes
     * using ISO-8859-1.
     *
     * @param string
     * @return md5 of the string as lower-case hex
     */
    public static String getMD5(String string) {
        try {
            return getMD5(string.getBytes("iso-8859-1"));
        } catch (UnsupportedEncodingException u) {
            throw new RuntimeException(u);
        }
    }

    /**
     * Calculates the MD5 of the byte array.
     *
     * @param bytes
     * @return md5 of the byte array as lower-case hex
     */
    public static String getMD5(byte[] bytes) {
        try {
            MessageDigest md = MessageDigest.getInstance("MD5");
            return toHex(md.digest(bytes));
        } catch (NoSuchAlgorithmException t) {
            throw new RuntimeException(t);
        }
    }

    /**
     * Returns the hex representation of the byte array. Every byte produces
     * exactly two lower-case hex digits.
     *
     * @param bytes
     * @return byte array as hex string
     */
    private static String toHex(byte[] bytes) {
        StringBuilder sb = new StringBuilder(bytes.length * 2);
        for (byte b : bytes) {
            sb.append(HEX_DIGITS[(b >> 4) & 0x0f]);
            sb.append(HEX_DIGITS[b & 0x0f]);
        }
        return sb.toString();
    }

    /**
     * Returns the root path of the specified path, i.e. everything before
     * the last forward slash. Returns a blank string if there is no root path.
     *
     * @param path
     * @return root path or blank
     */
    public static String getRootPath(String path) {
        int lastSlash = path.lastIndexOf('/');
        if (lastSlash > -1) {
            return path.substring(0, lastSlash);
        }
        return "";
    }

    /**
     * Returns the path remainder after subtracting the basePath from the
     * fullPath. The prefix comparison ignores case and treats backslashes as
     * forward slashes. If fullPath does not start with basePath, fullPath is
     * returned unchanged. If both paths are the same, a blank string is
     * returned.
     *
     * @param basePath
     * @param fullPath
     * @return the relative path, using forward slashes
     */
    public static String getRelativePath(String basePath, String fullPath) {
        String bp = basePath.replace('\\', '/').toLowerCase();
        String fp = fullPath.replace('\\', '/').toLowerCase();
        if (!fp.startsWith(bp)) {
            return fullPath;
        }
        String relativePath = fullPath.substring(basePath.length()).replace('\\', '/');
        // the remainder is empty when both paths are equal
        if (relativePath.length() > 0 && relativePath.charAt(0) == '/') {
            relativePath = relativePath.substring(1);
        }
        return relativePath;
    }

    /**
     * Splits the space-separated string into a list of strings.
     *
     * @param value
     * @return list of strings
     */
    public static List<String> getStringsFromValue(String value) {
        return getStringsFromValue(value, " ");
    }

    /**
     * Splits the string into a list of strings by the specified separator.
     * Separators inside a double-quoted section do not split; the surrounding
     * double quotes of such a chunk are removed. Chunks are trimmed and empty
     * chunks are dropped.
     *
     * @param value
     * @param separator
     *            the separator; it is used as part of a regular expression
     * @return list of strings
     */
    public static List<String> getStringsFromValue(String value, String separator) {
        String[] chunks;
        try {
            // only split on separators followed by an even number of quotes
            chunks = value.split(separator + "(?=([^\"]*\"[^\"]*\")*[^\"]*$)");
        } catch (PatternSyntaxException e) {
            throw new RuntimeException(e);
        }
        List<String> strings = new ArrayList<String>();
        for (String rawChunk : chunks) {
            String chunk = rawChunk.trim();
            if (chunk.length() == 0) {
                continue;
            }
            // a lone quote character is both first and last char; it must
            // not be treated as a quoted chunk
            if (chunk.length() > 1 && chunk.charAt(0) == '"'
                    && chunk.charAt(chunk.length() - 1) == '"') {
                // strip double quotes
                chunk = chunk.substring(1, chunk.length() - 1).trim();
            }
            strings.add(chunk);
        }
        return strings;
    }

    /**
     * Validates that a name is composed of letters, digits, or the
     * characters <code>/ . _ - ~</code>.
     *
     * @param name
     * @return the first invalid character found or null if string is acceptable
     */
    public static Character findInvalidCharacter(String name) {
        for (int i = 0; i < name.length(); i++) {
            char c = name.charAt(i);
            if (!Character.isLetterOrDigit(c) && VALID_NAME_CHARS.indexOf(c) < 0) {
                return c;
            }
        }
        return null;
    }

    /**
     * Simple fuzzy string comparison. This is a case-insensitive check. A
     * single wildcard * value is supported; the text before the wildcard must
     * start the value and the text after it must end the value, without the
     * two overlapping.
     *
     * @param value
     * @param pattern
     * @return true if the value matches the pattern
     */
    public static boolean fuzzyMatch(String value, String pattern) {
        if (value.equalsIgnoreCase(pattern)) {
            return true;
        }
        int wildcard = pattern.indexOf('*');
        if (wildcard < 0) {
            return false;
        }
        String candidate = value.toLowerCase();
        String prefix = pattern.substring(0, wildcard).toLowerCase();
        String suffix = pattern.substring(wildcard + 1).toLowerCase();
        // the length check stops prefix and suffix from sharing characters,
        // e.g. "aba" must not match "ab*ba"
        return candidate.length() >= prefix.length() + suffix.length()
                && candidate.startsWith(prefix) && candidate.endsWith(suffix);
    }

    /**
     * Compare two repository names for proper group sorting. Root
     * repositories (names without a forward slash) sort before grouped
     * repositories; within each of the two sets names are ordered
     * alphabetically, ignoring case.
     *
     * @param r1
     * @param r2
     * @return a negative value, zero, or a positive value if r1 sorts before,
     *         equal to, or after r2
     */
    public static int compareRepositoryNames(String r1, String r2) {
        String n1 = r1.toLowerCase();
        String n2 = r2.toLowerCase();
        boolean grouped1 = n1.indexOf('/') > -1;
        boolean grouped2 = n2.indexOf('/') > -1;
        if (grouped1 == grouped2) {
            // both root or both grouped
            return n1.compareTo(n2);
        }
        // exactly one is grouped; the root repository sorts first
        return grouped1 ? 1 : -1;
    }

    /**
     * Sort grouped repository names in place using
     * {@link #compareRepositoryNames(String, String)}.
     *
     * @param list
     */
    public static void sortRepositorynames(List<String> list) {
        Collections.sort(list, new Comparator<String>() {
            @Override
            public int compare(String o1, String o2) {
                return compareRepositoryNames(o1, o2);
            }
        });
    }

    /**
     * Derives a color from a string. The hue is computed from the MD5 of the
     * lower-cased value, so the same value (ignoring case) always yields the
     * same color.
     *
     * @param value
     * @return an html color string of the form #rrggbb
     */
    public static String getColor(String value) {
        int cs = 0;
        for (char c : getMD5(value.toLowerCase()).toCharArray()) {
            cs += c;
        }
        int n = (cs % 360);
        float hue = ((float) n) / 360;
        return hsvToRgb(hue, 0.90f, 0.65f);
    }

    /**
     * Converts an HSV color into an html color string.
     *
     * @param hue
     *            fraction of the color wheel, 0 to 1 inclusive
     * @param saturation
     *            0 to 1
     * @param value
     *            0 to 1
     * @return an html color string of the form #rrggbb
     * @throws RuntimeException
     *             if the hue falls outside of the six color wheel sectors
     */
    public static String hsvToRgb(float hue, float saturation, float value) {
        int h = (int) (hue * 6);
        float f = hue * 6 - h;
        if (h == 6 && f == 0f) {
            // a hue of exactly 1.0 is the same color as a hue of 0.0
            h = 0;
        }
        float p = value * (1 - saturation);
        float q = value * (1 - f * saturation);
        float t = value * (1 - (1 - f) * saturation);
        switch (h) {
        case 0:
            return rgbToString(value, t, p);
        case 1:
            return rgbToString(q, value, p);
        case 2:
            return rgbToString(p, value, t);
        case 3:
            return rgbToString(p, q, value);
        case 4:
            return rgbToString(t, p, value);
        case 5:
            return rgbToString(value, p, q);
        default:
            throw new RuntimeException(
                    "Something went wrong when converting from HSV to RGB. Input was " + hue + ", "
                            + saturation + ", " + value);
        }
    }

    /**
     * Converts three color channels into an html color string. Each channel
     * is scaled by 256, limited to the range 0-255 and written as two hex
     * digits.
     *
     * @param r
     *            red, 0 to 1
     * @param g
     *            green, 0 to 1
     * @param b
     *            blue, 0 to 1
     * @return an html color string of the form #rrggbb
     */
    public static String rgbToString(float r, float g, float b) {
        return "#" + toHexChannel(r) + toHexChannel(g) + toHexChannel(b);
    }

    /**
     * Converts one color channel into exactly two lower-case hex digits.
     *
     * @param channel
     * @return two hex digits
     */
    private static String toHexChannel(float channel) {
        // a channel of 1.0 scales to 256 which does not fit in two digits
        int scaled = Math.max(0, Math.min(255, (int) (channel * 256)));
        String hex = Integer.toHexString(scaled);
        return scaled < 0x10 ? "0" + hex : hex;
    }

    /**
     * Strips a trailing ".git" from the value. The check ignores case.
     *
     * @param value
     * @return a stripped value or the original value if .git is not found
     */
    public static String stripDotGit(String value) {
        int start = value.length() - 4;
        // regionMatches returns false for a negative offset (short values)
        if (value.regionMatches(true, start, ".git", 0, 4)) {
            return value.substring(0, start);
        }
        return value;
    }

    /**
     * Count the number of lines in a string. A null or blank string has zero
     * lines; trailing empty lines are not counted.
     *
     * @param value
     * @return the line count
     */
    public static int countLines(String value) {
        if (isEmpty(value)) {
            return 0;
        }
        return value.split("\n").length;
    }

    /**
     * Returns the file extension of a path, i.e. the text after the last dot
     * of the last path element.
     *
     * @param path
     * @return a blank string or a file extension
     */
    public static String getFileExtension(String path) {
        int lastDot = path.lastIndexOf('.');
        // a dot that belongs to a parent folder name is not an extension
        if (lastDot > -1 && lastDot > path.lastIndexOf('/')) {
            return path.substring(lastDot + 1);
        }
        return "";
    }

    /**
     * Replace all occurrences of a substring within a string with
     * another string. The input is returned unchanged if it is null or
     * empty, if oldPattern is null or empty, or if newPattern is null.
     *
     * From Spring StringUtils.
     *
     * @param inString String to examine
     * @param oldPattern String to replace
     * @param newPattern String to insert
     * @return a String with the replacements
     */
    public static String replace(String inString, String oldPattern, String newPattern) {
        // an empty oldPattern matches at every position and would never
        // advance the search
        if (inString == null || inString.length() == 0 || oldPattern == null
                || oldPattern.length() == 0 || newPattern == null) {
            return inString;
        }
        StringBuilder sb = new StringBuilder();
        int pos = 0; // our position in the old string
        int index = inString.indexOf(oldPattern);
        // the index of an occurrence we've found, or -1
        int patLen = oldPattern.length();
        while (index >= 0) {
            sb.append(inString, pos, index);
            sb.append(newPattern);
            pos = index + patLen;
            index = inString.indexOf(oldPattern, pos);
        }
        // remember to append any characters to the right of a match
        sb.append(inString, pos, inString.length());
        return sb.toString();
    }

    /**
     * Decodes a string by trying several charsets until one does not throw a
     * coding exception. The specified charsets are tried first, in order,
     * followed by UTF-8, ISO-8859-1 and the platform default charset. Last
     * resort is to interpret as UTF-8 with illegal character substitution.
     * A leading byte order mark character is removed from the result.
     *
     * @param content
     * @param charsets optional
     * @return a string
     */
    public static String decodeString(byte[] content, String... charsets) {
        Set<String> sets = new LinkedHashSet<String>();
        if (charsets != null) {
            sets.addAll(Arrays.asList(charsets));
        }
        sets.addAll(Arrays.asList("UTF-8", "ISO-8859-1", Charset.defaultCharset().name()));
        String value = null;
        for (String charset : sets) {
            if (charset == null) {
                // a null name is rejected by Charset.forName
                continue;
            }
            try {
                CharsetDecoder decoder = Charset.forName(charset).newDecoder();
                CharBuffer buffer = decoder.decode(ByteBuffer.wrap(content));
                value = buffer.toString();
                break;
            } catch (CharacterCodingException e) {
                // ignore and advance to the next charset
            } catch (IllegalCharsetNameException e) {
                // ignore illegal charset names
            } catch (UnsupportedCharsetException e) {
                // ignore unsupported charsets
            }
        }
        if (value == null) {
            // last resort: this constructor substitutes malformed input
            value = new String(content, UTF_8);
        }
        if (value.startsWith("\uFEFF")) {
            // strip UTF-8 BOM
            return value.substring(1);
        }
        return value;
    }

    /**
     * Attempt to extract a repository name from a given url using regular
     * expressions. The first capturing group of the first pattern that is
     * found in the url is returned. If no match is made, then return whatever
     * trails after the final / character.
     *
     * @param url
     * @param urlpatterns
     *            regular expressions, each with at least one capturing group
     * @return a repository path
     */
    public static String extractRepositoryPath(String url, String... urlpatterns) {
        for (String urlPattern : urlpatterns) {
            Matcher m = Pattern.compile(urlPattern).matcher(url);
            if (m.find()) {
                return m.group(1);
            }
        }
        // last resort
        int lastSlash = url.lastIndexOf('/');
        if (lastSlash > -1) {
            return url.substring(lastSlash + 1);
        }
        return url;
    }

    /**
     * Converts a string with \nnn sequences into a UTF-8 decoded string. Each
     * \nnn sequence is read as the octal value of a single byte; the
     * resulting byte sequence is then decoded as UTF-8. If the input has no
     * such sequence, or a sequence is not a valid octal number, the input is
     * returned unchanged.
     *
     * @param input
     * @return the converted string
     */
    public static String convertOctal(String input) {
        Matcher m = OCTAL_ESCAPE.matcher(input);
        if (!m.find()) {
            // no octal matches
            return input;
        }
        try {
            ByteArrayOutputStream bytes = new ByteArrayOutputStream(input.length());
            int pos = 0;
            do {
                writeUtf8(bytes, input.substring(pos, m.start()));
                // replace octal encoded value, skipping the leading \ character
                bytes.write(Integer.parseInt(input.substring(m.start() + 1, m.end()), 8));
                pos = m.end();
            } while (m.find());
            // add remainder of string
            writeUtf8(bytes, input.substring(pos));
            return new String(bytes.toByteArray(), UTF_8);
        } catch (NumberFormatException e) {
            // the pattern also accepts the digits 8 and 9 which are not
            // octal; such input is left untouched
            return input;
        }
    }

    /**
     * Appends the UTF-8 bytes of the text to the stream.
     *
     * @param out
     * @param text
     */
    private static void writeUtf8(ByteArrayOutputStream out, String text) {
        byte[] encoded = text.getBytes(UTF_8);
        out.write(encoded, 0, encoded.length);
    }

    /**
     * Returns the first path element of a path string. If no path separator is
     * found in the path, an empty string is returned.
     *
     * @param path
     * @return the first element in the path
     */
    public static String getFirstPathElement(String path) {
        int firstSlash = path.indexOf('/');
        if (firstSlash > -1) {
            return path.substring(0, firstSlash).trim();
        }
        return "";
    }

    /**
     * Returns the last path element of a path string. If no path separator is
     * found in the path, the path itself is returned.
     *
     * @param path
     * @return the last element in the path
     */
    public static String getLastPathElement(String path) {
        // lastIndexOf yields -1 without a separator, so the whole path is kept
        return path.substring(path.lastIndexOf('/') + 1);
    }

    /**
     * Variation of String.matches() which disregards case issues.
     *
     * @param input
     * @param regex
     * @return true if the pattern matches the whole input
     */
    public static boolean matchesIgnoreCase(String input, String regex) {
        return Pattern.compile(regex, Pattern.CASE_INSENSITIVE).matcher(input).matches();
    }

    /**
     * Replaces new line and carriage return chars in a string with spaces and
     * trims the result. If input value is null an empty string is returned.
     *
     * @param input
     * @return a sanitized or empty string
     */
    public static String removeNewlines(String input) {
        if (input == null) {
            return "";
        }
        return input.replace('\n', ' ').replace('\r', ' ').trim();
    }
}