// Source: PandaLib/pandalib-util/src/main/java/fr/pandacube/lib/util/StringUtil.java
// (152 lines, 5.7 KiB, Java)

package fr.pandacube.lib.util;
import java.util.Arrays;
import java.util.List;
import java.util.function.Predicate;
import java.util.function.UnaryOperator;
import java.util.regex.Matcher;
import java.util.regex.Pattern;

/**
 * Provides various methods to manipulate Strings.
 */
public final class StringUtil {

    /** Matches the run of ASCII digits that ends a string, if any. Used by {@link #fixConflictName}. */
    private static final Pattern endingNumber = Pattern.compile("(\\d+)$");

    /**
     * Longest trailing digit run that {@link #fixConflictName} interprets as a number.
     * Any value with at most 18 decimal digits, plus one, still fits in a {@code long}.
     */
    private static final int MAX_NUMERIC_SUFFIX_DIGITS = 18;

    /**
     * Formats the provided double, omitting the decimal part if the value is exactly equal to a long value.
     * The result never depends on the default locale.
     * @param d the value to convert to string.
     * @return the decimal representation of the long value if {@code d} is a whole number that fits in a
     *         {@code long}, the result of {@link String#valueOf(double)} otherwise.
     */
    public static String formatDouble(double d) {
        long truncated = (long) d;
        // 2^63 saturates to Long.MAX_VALUE when cast, and Long.MAX_VALUE rounds back to 2^63 when compared as a
        // double, so it would wrongly be printed as 9223372036854775807. Every other out-of-range value, NaN and
        // the infinities already fail the equality test.
        if (d == truncated && d != 0x1p63) {
            // Long.toString (unlike String.format("%d")) never localizes digits, consistently with the
            // String.valueOf(double) branch below.
            return Long.toString(truncated);
        }
        return String.valueOf(d);
    }

    /**
     * Counts the number of occurrences of a specified character in a string.
     * @param string the character sequence to search into.
     * @param character the character to count.
     * @return the number of occurrences of {@code character} in {@code string}.
     * @throws NullPointerException if {@code string} is null.
     */
    public static int countOccurrences(CharSequence string, char character) {
        int count = 0;
        // Read the sequence in place instead of copying it to a String and then to a char array.
        for (int i = 0, length = string.length(); i < length; i++) {
            if (string.charAt(i) == character) {
                count++;
            }
        }
        return count;
    }

    /**
     * Does like {@link String#join(CharSequence, Iterable)}, but the last separator is different from the others.
     * It is useful when enumerating things in a sentence, for instance:
     * <code>"a thing<u>, </u>a thing<u> and </u>a thing"</code>
     * (the comma being the usual separator, and {@code " and "} being the final separator).
     * @param regularSeparator the separator used everywhere except between the two last strings to join.
     * @param finalSeparator the separator used between the two last strings to join.
     * @param strings the strings to join. A null list is handled like an empty one.
     * @return a new string with all the provided {@code strings} joined using the separators: an empty string if
     *         there is nothing to join, the single element itself if there is only one.
     */
    public static String joinGrammatically(CharSequence regularSeparator, CharSequence finalSeparator, List<String> strings) {
        int size = strings == null ? 0 : strings.size();
        return switch (size) {
            case 0 -> "";
            case 1 -> strings.get(0);
            default -> {
                int lastIndex = size - 1;
                yield String.join(regularSeparator, strings.subList(0, lastIndex)) + finalSeparator + strings.get(lastIndex);
            }
        };
    }

    /**
     * Creates a {@link String} that repeats the base character n times.
     * @param base the base character.
     * @param n the number of repetitions.
     * @return a {@link String} that repeats the base character n times.
     * @throws NegativeArraySizeException if {@code n} is negative.
     */
    public static String repeat(char base, int n) {
        char[] chars = new char[n];
        Arrays.fill(chars, base);
        return String.valueOf(chars);
    }

    /**
     * Generates a name based on the original name, but that does not conflict with another one, according to the
     * provided predicate.
     * It can be used to add an entry in a map when the key already exists, and it is ok to modify the added key to
     * not erase the previous data.
     * This situation can be compared to when a file is added to a directory but another file with the same name
     * exists, so the new file has a suffix number to make the file name different.
     * <p>
     * If the original name already ends with a number, that number is replaced by the next ones
     * ({@code "name5"} gives {@code "name6"}, then {@code "name7"}...). Otherwise, or if the ending number has more
     * than 18 digits, the suffix is appended to the whole original name, starting from 1.
     * <p>
     * Be aware that this method may run an infinite loop if the predicate continuously returns true.
     * @param originalName the original conflicting name.
     * @param conflictTester a predicate that tests if a generated name still conflicts with a set of names.
     * @return the original name, with a suffix number (ex: {@code "original1"}).
     */
    public static String fixConflictName(String originalName, Predicate<String> conflictTester) {
        String baseName = originalName;
        // A long counter, so that a name ending with a number at or above Integer.MAX_VALUE neither fails to parse
        // nor wraps around to a negative suffix.
        long suffix = 1;
        Matcher endingMatcher = endingNumber.matcher(originalName);
        if (endingMatcher.find() && endingMatcher.group(1).length() <= MAX_NUMERIC_SUFFIX_DIGITS) {
            suffix = Long.parseLong(endingMatcher.group(1)) + 1;
            baseName = originalName.substring(0, endingMatcher.start());
        }
        // When the digit run is too long to be parsed, the whole name is kept as the base and numbering starts at 1.
        for (;; suffix++) {
            String candidate = baseName + suffix;
            if (!conflictTester.test(candidate)) {
                return candidate;
            }
        }
    }

    /**
     * Wraps the provided {@link UnaryOperator} of integer into an {@link UnaryOperator} of String parsing the input
     * string to int and converting back the return value to String.
     * The returned operator throws a {@link NumberFormatException} if its input is not a parsable int.
     * @param operator the {@link UnaryOperator} to wrap.
     * @return an {@link UnaryOperator} of String.
     */
    public static UnaryOperator<String> wrapParsingInt(UnaryOperator<Integer> operator) {
        return s -> Integer.toString(operator.apply(Integer.parseInt(s)));
    }

    /**
     * Wraps the provided {@link UnaryOperator} of long into an {@link UnaryOperator} of String parsing the input
     * string to long and converting back the return value to String.
     * The returned operator throws a {@link NumberFormatException} if its input is not a parsable long.
     * @param operator the {@link UnaryOperator} to wrap.
     * @return an {@link UnaryOperator} of String.
     */
    public static UnaryOperator<String> wrapParsingLong(UnaryOperator<Long> operator) {
        return s -> Long.toString(operator.apply(Long.parseLong(s)));
    }

    /**
     * Generates a {@link Pattern} with extra wrapping regex around the provided one to consider a sentence (like a
     * chat message). For instance, the returned pattern will only match the expression at the beginning or end of
     * sentence, or separated from the rest of it with a space or another non-letter character.
     * @param wordPattern the regex pattern to wrap. It is inserted as is (not quoted) inside a capturing group.
     * @param caseInsensitive if the pattern must match ignoring case. This is done by prefixing the regex with the
     *                        {@code (?i)} embedded flag.
     * @return a {@link Pattern}. The matching will match 3 groups. The first group is the eventual non-letter
     *         separator before the matched word, the second one is the actual word, and the last one is the
     *         eventual non-letter separator after the matched word. Any additional pattern group between the 2nd
     *         and the last one are those provided in the wordPattern.
     * @throws java.util.regex.PatternSyntaxException if the resulting expression is not a valid regex.
     */
    public static Pattern asPatternInSentence(String wordPattern, boolean caseInsensitive) {
        return Pattern.compile((caseInsensitive ? "(?i)" : "") + "(\\P{L}|^)(" + wordPattern + ")(\\P{L}|$)");
    }

    /** Utility class: not instantiable. */
    private StringUtil() {}
}