291 lines
9.6 KiB
Java
Raw Normal View History

2023-03-13 14:26:03 +08:00
/*
* Copyright 2022-2023 the original author or authors.
*
* Licensed under the Apache License, Version 2.0 (the "License");
* you may not use this file except in compliance with the License.
* You may obtain a copy of the License at
*
* https://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
2023-02-24 11:10:27 +08:00
package xyz.zhouxy.plusone.commons.util;
2023-06-27 00:24:22 +08:00
import java.util.Arrays;
import java.util.Map;
2023-06-27 00:07:19 +08:00
import java.util.regex.Matcher;
import java.util.regex.Pattern;
import javax.annotation.Nullable;
2023-06-27 00:07:19 +08:00
import com.google.common.base.Preconditions;
2023-05-31 20:01:35 +08:00
2023-06-27 00:24:22 +08:00
import xyz.zhouxy.plusone.commons.collection.SafeConcurrentHashMap;
2023-06-27 00:07:19 +08:00
/**
* 封装一些常用的正则操作并可以缓存 {@link Pattern} 实例以复用最多缓存 256
*
* @author ZhouXY
*
*/
public final class RegexUtil {
2023-02-24 11:10:27 +08:00
2023-06-27 00:07:19 +08:00
private static final int DEFAULT_CACHE_INITIAL_CAPACITY = 64;
private static final int MAX_CACHE_SIZE = 256;
2023-06-27 00:24:22 +08:00
private static final Map<String, Pattern> PATTERN_CACHE = new SafeConcurrentHashMap<>(
2023-06-27 00:07:19 +08:00
DEFAULT_CACHE_INITIAL_CAPACITY);
2023-02-24 11:10:27 +08:00
2023-06-27 00:07:19 +08:00
/**
* 获取 {@link Pattern} 实例
*
* @param pattern 正则表达式
* @param cachePattern 是否缓存 {@link Pattern} 实例
* @return {@link Pattern} 实例
*/
public static Pattern getPattern(final String pattern, final boolean cachePattern) {
Preconditions.checkNotNull(pattern, "The pattern can not be null.");
Pattern result = PATTERN_CACHE.get(pattern);
if (result == null) {
result = Pattern.compile(pattern);
if (cachePattern && PATTERN_CACHE.size() < MAX_CACHE_SIZE) {
PATTERN_CACHE.putIfAbsent(pattern, result);
result = PATTERN_CACHE.get(pattern);
}
}
return result;
}
2023-06-27 00:07:19 +08:00
/**
* 获取 {@link Pattern} 实例不缓存
*
* @param pattern 正则表达式
* @return {@link Pattern} 实例
*/
public static Pattern getPattern(final String pattern) {
Preconditions.checkNotNull(pattern, "The pattern can not be null.");
Pattern result = PATTERN_CACHE.get(pattern);
if (result == null) {
result = Pattern.compile(pattern);
}
return result;
}
2023-06-27 00:07:19 +08:00
/**
* 将各个正则表达式转为 {@link Pattern} 实例
*
* @param patterns 正则表达式
* @param cachePattern 是否缓存 {@link Pattern} 实例
2023-06-27 00:24:22 +08:00
* @return {@link Pattern} 实例数组
2023-06-27 00:07:19 +08:00
*/
public static Pattern[] getPatterns(final String[] patterns, final boolean cachePattern) {
Preconditions.checkNotNull(patterns, "The patterns can not be null.");
2023-06-27 00:24:22 +08:00
return Arrays.stream(patterns)
.map(pattern -> getPattern(pattern, cachePattern))
.toArray(Pattern[]::new);
}
2023-06-27 00:07:19 +08:00
/**
* 将各个正则表达式转为 {@link Pattern} 实例不缓存
*
* @param patterns 正则表达式
* @return {@link Pattern} 实例数组
*/
public static Pattern[] getPatterns(final String[] patterns) {
Preconditions.checkNotNull(patterns, "The patterns can not be null.");
2023-06-27 00:24:22 +08:00
return Arrays.stream(patterns)
.map(RegexUtil::getPattern)
.toArray(Pattern[]::new);
2023-02-24 11:10:27 +08:00
}
2023-06-27 00:07:19 +08:00
/**
* 手动缓存 Pattern 实例
*
* @param pattern 要缓存的 {@link Pattern} 实例
* @return 缓存的 Pattern 实例如果缓存已满则返回 {@code null}
*/
public static Pattern cachePattern(final Pattern pattern) {
if (PATTERN_CACHE.size() >= MAX_CACHE_SIZE) {
return null;
2023-02-24 11:10:27 +08:00
}
2023-06-27 00:07:19 +08:00
final String patternStr = pattern.pattern();
PATTERN_CACHE.putIfAbsent(patternStr, pattern);
return PATTERN_CACHE.get(patternStr);
}
/**
* 判断 {@code input} 是否匹配 {@code pattern}
*
* @param input 输入
* @param pattern 正则
* @return 判断结果
*/
public static boolean matches(@Nullable final CharSequence input, final Pattern pattern) {
Preconditions.checkNotNull(pattern, "The pattern can not be null.");
return input != null && pattern.matcher(input).matches();
2023-02-24 11:10:27 +08:00
}
2023-06-27 00:07:19 +08:00
/**
* 判断 {@code input} 是否匹配 {@code patterns} 中的一个
*
* @param input 输入
* @param patterns 正则
* @return 判断结果
*/
public static boolean matchOne(@Nullable final CharSequence input, final Pattern[] patterns) {
Preconditions.checkNotNull(patterns, "The patterns can not be null.");
if (input == null) {
return false;
}
for (Pattern pattern : patterns) {
2023-04-25 09:06:00 +08:00
if (matches(input, pattern)) {
return true;
}
}
return false;
}
2023-06-27 00:07:19 +08:00
/**
* 判断 {@code input} 是否匹配全部正则
*
* @param input 输入
* @param patterns 正则
* @return 判断结果
*/
public static boolean matchAll(@Nullable final CharSequence input, final Pattern[] patterns) {
Preconditions.checkNotNull(patterns, "The patterns can not be null.");
if (input == null) {
return false;
2023-02-24 11:10:27 +08:00
}
for (Pattern pattern : patterns) {
2023-04-25 09:06:00 +08:00
if (!matches(input, pattern)) {
return false;
}
}
return true;
}
2023-06-27 00:07:19 +08:00
/**
* 判断 {@code input} 是否匹配 {@code pattern}
*
* @param input 输入
* @param pattern 正则表达式
* @param cachePattern 是否缓存 {@link Pattern} 实例
* @return 判断结果
*/
public static boolean matches(@Nullable final CharSequence input, final String pattern,
final boolean cachePattern) {
return matches(input, getPattern(pattern, cachePattern));
}
/**
* 判断 {@code input} 是否匹配 {@code pattern}不缓存 {@link Pattern} 实例
*
* @param input 输入
* @param pattern 正则表达式
* @return 判断结果
*/
public static boolean matches(@Nullable final CharSequence input, final String pattern) {
return matches(input, getPattern(pattern));
}
/**
* 判断 {@code input} 是否匹配 {@code patterns} 中的一个
*
* @param input 输入
* @param patterns 正则表达式
* @param cachePattern 是否缓存 {@link Pattern} 实例
* @return 判断结果
*/
public static boolean matchOne(@Nullable final CharSequence input, final String[] patterns,
final boolean cachePattern) {
final Pattern[] patternSet = getPatterns(patterns, cachePattern);
return matchOne(input, patternSet);
}
/**
* 判断 {@code input} 是否匹配 {@code patterns} 中的一个不缓存 {@link Pattern} 实例
*
* @param input 输入
* @param patterns 正则表达式
* @return 判断结果
*/
public static boolean matchOne(@Nullable final CharSequence input, final String[] patterns) {
final Pattern[] patternSet = getPatterns(patterns);
return matchOne(input, patternSet);
}
/**
* 判断 {@code input} 是否匹配全部正则
*
* @param input 输入
* @param patterns 正则表达式
* @param cachePattern 是否缓存 {@link Pattern} 实例
* @return 判断结果
*/
public static boolean matchAll(@Nullable final CharSequence input, final String[] patterns,
final boolean cachePattern) {
final Pattern[] patternSet = getPatterns(patterns, cachePattern);
return matchAll(input, patternSet);
}
/**
* 判断 {@code input} 是否匹配全部正则不缓存 {@link Pattern} 实例
*
* @param input 输入
* @param patterns 正则表达式
* @return 判断结果
*/
public static boolean matchAll(@Nullable final CharSequence input, final String[] patterns) {
final Pattern[] patternSet = getPatterns(patterns);
return matchAll(input, patternSet);
}
/**
* 生成匹配器
*
* @param input 输入
* @param pattern 正则
* @return 结果
*/
public static Matcher getMatcher(final CharSequence input, final Pattern pattern) {
Preconditions.checkNotNull(input, "The input can not be null");
Preconditions.checkNotNull(pattern, "The pattern can not be null");
return pattern.matcher(input);
}
/**
* 生成匹配器
*
* @param input 输入
* @param pattern 正则表达式
* @param cachePattern 是否缓存 {@link Pattern} 实例
* @return 结果
*/
public static Matcher getMatcher(final CharSequence input, final String pattern, boolean cachePattern) {
Preconditions.checkNotNull(input, "The input can not be null");
return getPattern(pattern, cachePattern).matcher(input);
}
/**
* 生成匹配器不缓存 {@link Pattern} 实例
*
* @param input 输入
* @param pattern 正则表达式
* @return 结果
*/
public static Matcher getMatcher(final CharSequence input, final String pattern) {
Preconditions.checkNotNull(input, "The input can not be null");
return getPattern(pattern).matcher(input);
}
2023-02-24 11:10:27 +08:00
private RegexUtil() {
2023-06-27 00:07:19 +08:00
// 不允许实例化
2023-02-24 11:10:27 +08:00
throw new IllegalStateException("Utility class");
}
}