com.frameworkset.util.RegexUtil Maven / Gradle / Ivy
package com.frameworkset.util;
import java.util.ArrayList;
import java.util.List;
import org.apache.oro.text.regex.MalformedPatternException;
import org.apache.oro.text.regex.MatchResult;
import org.apache.oro.text.regex.Pattern;
import org.apache.oro.text.regex.PatternCompiler;
import org.apache.oro.text.regex.PatternMatcher;
import org.apache.oro.text.regex.PatternMatcherInput;
import org.apache.oro.text.regex.Perl5Compiler;
import org.apache.oro.text.regex.Perl5Matcher;
import org.apache.oro.text.regex.Perl5Substitution;
import org.apache.oro.text.regex.Util;
import org.slf4j.Logger;
import org.slf4j.LoggerFactory;
/**
* Title:
*
* Description:
*
* Copyright: Copyright (c) 2005
*
* Company:
*
* @author biaoping.yin
* @version 1.0
*/
public class RegexUtil {
private static Logger log = LoggerFactory.getLogger(RegexUtil.class);
public static final int default_mask = Perl5Compiler.SINGLELINE_MASK | Perl5Compiler.DEFAULT_MASK;
public static String[] parser(String src, String regex) {
String patternStr = regex;
/**
* 编译正则表达式patternStr,并用该表达式与传入的src字符串进行模式匹配,
* 如果匹配正确,则从匹配对象中提取出以上定义好的6部分,存放到数组中并返回
* 该数组
*/
PatternCompiler compiler = new Perl5Compiler();
Pattern pattern = null;
try {
pattern = compiler.compile(patternStr,
default_mask);
} catch (MalformedPatternException e) {
e.printStackTrace();
return null;
}
PatternMatcher matcher = new Perl5Matcher();
MatchResult result = null;
String[] tokens = null;
boolean match = matcher.matches(src, pattern);
if (match) {
result = matcher.getMatch();
int size = result.groups() - 1;
tokens = new String[size];
for (int i = 0; i < size; i++) {
tokens[i] = result.group(i + 1);
}
}
return tokens;
}
/**
* 从匹配regex的src字符串中提取部分子字符串
* @param src
* @param regex
* @return
*/
public static String[] matchWithPatternMatcherInput(String src, String regex) {
String patternStr = regex;
/**
* 编译正则表达式patternStr,并用该表达式与传入的src字符串进行模式匹配,
* 如果匹配正确,则从匹配对象中提取出以上定义好的6部分,存放到数组中并返回
* 该数组
*/
PatternCompiler compiler = new Perl5Compiler();
Pattern pattern = null;
try {
pattern = compiler.compile(patternStr,
default_mask);
} catch (MalformedPatternException e) {
e.printStackTrace();
return null;
}
PatternMatcher matcher = new Perl5Matcher();
MatchResult result = null;
String[] tokens = null;
List sets = new ArrayList();
PatternMatcherInput input = new PatternMatcherInput(src);
while (matcher.matches(input, pattern)) {
result = matcher.getMatch();
int size = result.groups();
for (int i = 1; i < size; i++) {
sets.add(result.group(i));
}
}
tokens = new String[sets.size()];
sets.toArray(tokens);
return tokens;
}
public static String[] match(String src, String regex) {
String patternStr = regex;
/**
* 编译正则表达式patternStr,并用该表达式与传入的src字符串进行模式匹配,
* 如果匹配正确,则从匹配对象中提取出以上定义好的6部分,存放到数组中并返回
* 该数组
*/
PatternCompiler compiler = new Perl5Compiler();
Pattern pattern = null;
try {
pattern = compiler.compile(patternStr,
default_mask);
} catch (MalformedPatternException e) {
e.printStackTrace();
return null;
}
PatternMatcher matcher = new Perl5Matcher();
MatchResult result = null;
String[] tokens = null;
if(matcher.matches(src, pattern)) {
result = matcher.getMatch();
int size = result.groups() - 1;
tokens = new String[size];
for (int i = 0; i < size; i++) {
tokens[i] = result.group(i + 1);
}
}
return tokens;
}
/**
* 从src中提取包含模式regex的子字符串
* @param src
* @param regex
* @return
*/
public static String[] containWithPatternMatcherInput(String src, String regex) {
String patternStr = regex;
/**
* 编译正则表达式patternStr,并用该表达式与传入的src字符串进行模式匹配,
* 如果匹配正确,则从匹配对象中提取出以上定义好的6部分,存放到数组中并返回
* 该数组
*/
PatternCompiler compiler = new Perl5Compiler();
Pattern pattern = null;
try {
pattern = compiler.compile(patternStr,
default_mask);
} catch (MalformedPatternException e) {
e.printStackTrace();
return null;
}
PatternMatcher matcher = new Perl5Matcher();
MatchResult result = null;
String[] tokens = null;
List sets = new ArrayList();
PatternMatcherInput input = new PatternMatcherInput(src);
while (matcher.contains(input, pattern)) {
result = matcher.getMatch();
int size = result.groups();
for (int i = 1; i < size; i++) {
sets.add(result.group(i));
}
}
tokens = new String[sets.size()];
sets.toArray(tokens);
return tokens;
}
/**
* 从src中提取包含模式regex的子字符串
* @param src
* @param regex
* @return
*/
public static String[] containWithPatternMatcherInput(String src, String regex,int mask) {
String patternStr = regex;
/**
* 编译正则表达式patternStr,并用该表达式与传入的src字符串进行模式匹配,
* 如果匹配正确,则从匹配对象中提取出以上定义好的6部分,存放到数组中并返回
* 该数组
*/
PatternCompiler compiler = new Perl5Compiler();
Pattern pattern = null;
try {
pattern = compiler.compile(patternStr,
mask);
} catch (MalformedPatternException e) {
e.printStackTrace();
return null;
}
PatternMatcher matcher = new Perl5Matcher();
MatchResult result = null;
String[] tokens = null;
List sets = new ArrayList();
PatternMatcherInput input = new PatternMatcherInput(src);
while (matcher.contains(input, pattern)) {
result = matcher.getMatch();
int size = result.groups();
for (int i = 1; i < size; i++) {
sets.add(result.group(i));
}
}
tokens = new String[sets.size()];
sets.toArray(tokens);
return tokens;
}
/**
* 从串src中析取匹配regex模式的所有字符串,并且用substitution替换匹配上模式的子符串
* @param src
* @param regex
* @param substitution
* @return String[][]二维数组,第一维表示替换后的src,第二维表示匹配regex的所有的子串数组
*/
public static String[][] contain2ndReplaceWithPatternMatcherInput(String src, String regex,String substitution) {
String patternStr = regex;
/**
* 编译正则表达式patternStr,并用该表达式与传入的src字符串进行模式匹配,
* 如果匹配正确,则从匹配对象中提取出以上定义好的6部分,存放到数组中并返回
* 该数组
*/
PatternCompiler compiler = new Perl5Compiler();
Pattern pattern = null;
try {
pattern = compiler.compile(patternStr,
default_mask);
} catch (MalformedPatternException e) {
e.printStackTrace();
return null;
}
PatternMatcher matcher = new Perl5Matcher();
MatchResult result = null;
String[] tokens = null;
List sets = new ArrayList();
PatternMatcherInput input = new PatternMatcherInput(src);
while (matcher.contains(input, pattern)) {
result = matcher.getMatch();
int size = result.groups();
for (int i = 1; i < size; i++) {
sets.add(result.group(i));
}
}
String[][] retvalue = null;
String newsrc = src;
if(sets.size() > 0)
{
newsrc = Util.substitute(matcher, pattern, new Perl5Substitution(substitution),
src, Util.SUBSTITUTE_ALL);
}
tokens = new String[sets.size()];
sets.toArray(tokens);
retvalue = new String[][] {{newsrc},tokens};
return retvalue;
}
/**
* 从串src中析取匹配regex模式的所有字符串,并且用substitution替换匹配上模式的子符串
* @param src
* @param regex
* @param substitution
* @return String[][]二维数组,第一维表示替换后的src,第二维表示匹配regex的所有的子串数组
*/
public static String[][] contain2ndReplaceWithPatternMatcherInput(String src, String regex,String substitution,int MASK) {
String patternStr = regex;
/**
* 编译正则表达式patternStr,并用该表达式与传入的src字符串进行模式匹配,
* 如果匹配正确,则从匹配对象中提取出以上定义好的6部分,存放到数组中并返回
* 该数组
*/
PatternCompiler compiler = new Perl5Compiler();
Pattern pattern = null;
try {
pattern = compiler.compile(patternStr,
MASK);
} catch (MalformedPatternException e) {
e.printStackTrace();
return null;
}
PatternMatcher matcher = new Perl5Matcher();
MatchResult result = null;
String[] tokens = null;
List sets = new ArrayList();
PatternMatcherInput input = new PatternMatcherInput(src);
while (matcher.contains(input, pattern)) {
result = matcher.getMatch();
int size = result.groups();
for (int i = 1; i < size; i++) {
sets.add(result.group(i));
}
}
String[][] retvalue = null;
String newsrc = src;
if(sets.size() > 0)
{
newsrc = Util.substitute(matcher, pattern, new Perl5Substitution(substitution),
src, Util.SUBSTITUTE_ALL);
}
tokens = new String[sets.size()];
sets.toArray(tokens);
retvalue = new String[][] {{newsrc},tokens};
return retvalue;
}
/**
* 从包含
* @param src
* @param regex
* @return
*/
public static String[] contain(String src, String regex) {
String patternStr = regex;
/**
* 编译正则表达式patternStr,并用该表达式与传入的src字符串进行模式匹配,
* 如果匹配正确,则从匹配对象中提取出以上定义好的6部分,存放到数组中并返回
* 该数组
*/
PatternCompiler compiler = new Perl5Compiler();
Pattern pattern = null;
try {
pattern = compiler.compile(patternStr,
default_mask);
} catch (MalformedPatternException e) {
e.printStackTrace();
return null;
}
PatternMatcher matcher = new Perl5Matcher();
MatchResult result = null;
String[] tokens = null;
if (matcher.contains(src, pattern)) {
result = matcher.getMatch();
int size = result.groups() - 1;
tokens = new String[size];
for (int i = 0; i < size; i++) {
tokens[i] = result.group(i + 1);
}
}
return tokens;
}
public static boolean isContain(String src, String regex) {
if(src == null )
return false;
String patternStr = regex;
/**
* 编译正则表达式patternStr,并用该表达式与传入的src字符串进行模式匹配,
* 如果匹配正确,则从匹配对象中提取出以上定义好的6部分,存放到数组中并返回
* 该数组
*/
PatternCompiler compiler = new Perl5Compiler();
Pattern pattern = null;
try {
pattern = compiler.compile(patternStr,
default_mask);
} catch (MalformedPatternException e) {
e.printStackTrace();
return false;
}
PatternMatcher matcher = new Perl5Matcher();
return matcher.contains(src, pattern);
}
public RegexUtil() {
}
/**
* 检查src与正则表达式regex匹配结果
* @param src String
* @param regex String
* @return boolean
*/
public static boolean isMatch(String src, String regex) {
if(src == null )
return false;
boolean flag = false;
String patternStr = regex;
/**
* 编译正则表达式patternStr,并用该表达式与传入的src字符串进行模式匹配,
* 如果匹配正确,则从匹配对象中提取出以上定义好的6部分,存放到数组中并返回
* 该数组
*/
PatternCompiler compiler = new Perl5Compiler();
Pattern pattern = null;
try {
pattern = compiler.compile(patternStr,
default_mask);
} catch (MalformedPatternException e) {
e.printStackTrace();
return false;
}
PatternMatcher matcher = new Perl5Matcher();
// log.debug("src:" + src);;
// log.debug("pattern:" + pattern);
// log.debug("regex:" + regex);
flag = matcher.matches(src, pattern);
return flag;
}
/**
* 将content中符合模式pattern的字符串替换为newstr字符串
* 暂未实现
* @param content
* @param pattern
* @param newstr
*/
public static void replace(String content,String pattern,String newstr)
{
}
}
© 2015 - 2025 Weber Informatics LLC | Privacy Policy