nl.hsac.fitnesse.fixture.util.HtmlCleaner Maven / Gradle / Ivy
package nl.hsac.fitnesse.fixture.util;
import org.apache.commons.lang3.StringEscapeUtils;
import java.util.regex.Matcher;
import java.util.regex.Pattern;
/**
* Helper to remove wiki formatting from strings.
*/
public class HtmlCleaner {
private static final Pattern LINKPATTERN = Pattern.compile("(.*?)(.*)", Pattern.CASE_INSENSITIVE);
private static final Pattern IMAGEPATTERN = Pattern.compile("", Pattern.CASE_INSENSITIVE);
private static final Pattern PRE_FORMATTED_PATTERN = Pattern.compile("\\s*(.*?)\\s*
", Pattern.DOTALL);
/**
* Gets a URL from a wiki page value.
* @param htmlLink link as present on wiki page.
* @return address the link points to (if it is an 'a'), the original link otherwise.
*/
public String getUrl(String htmlLink) {
String result = htmlLink;
if (htmlLink != null) {
Matcher linkMatcher = LINKPATTERN.matcher(htmlLink);
Matcher imgMatcher = IMAGEPATTERN.matcher(htmlLink);
if (linkMatcher.matches()) {
String href = linkMatcher.group(1);
href = StringEscapeUtils.unescapeHtml4(href);
result = href + linkMatcher.group(3);
} else if (imgMatcher.matches()) {
String src = imgMatcher.group(1);
result = StringEscapeUtils.unescapeHtml4(src);
}
}
return result;
}
/**
* Removes result of wiki formatting (for e.g. email addresses) if needed.
* @param rawValue value as received from FitNesse.
* @return rawValue if it was just text or any object, cleaned version if it was not.
*/
public T cleanupValue(T rawValue) {
T cleanValue;
if (rawValue instanceof String) {
cleanValue = (T) cleanupValue((String) rawValue);
} else {
cleanValue = rawValue;
}
return cleanValue;
}
/**
* Removes result of wiki formatting (for e.g. email addresses) if needed.
* @param rawValue value as received from Fitnesse.
* @return rawValue if it was just text, cleaned version if it was not.
*/
public String cleanupValue(String rawValue) {
String result = null;
if (rawValue != null) {
Matcher matcher = LINKPATTERN.matcher(rawValue);
if (matcher.matches()) {
result = matcher.group(2) + matcher.group(3);
} else {
result = cleanupPreFormatted(rawValue);
}
}
return result;
}
/**
* Removes HTML preformatting (if any).
* @param value value (possibly pre-formatted)
* @return value without HTML preformatting.
*/
public String cleanupPreFormatted(String value) {
String result = value;
if (value != null) {
Matcher matcher = PRE_FORMATTED_PATTERN.matcher(value);
if (matcher.matches()) {
String escapedBody = matcher.group(1);
result = StringEscapeUtils.unescapeHtml4(escapedBody);
}
}
return result;
}
}
© 2015 - 2025 Weber Informatics LLC | Privacy Policy