All Downloads are FREE. Search and download functionalities are using the official Maven repository.

nl.hsac.fitnesse.fixture.util.HtmlCleaner Maven / Gradle / Ivy

package nl.hsac.fitnesse.fixture.util;

import org.apache.commons.lang3.StringEscapeUtils;

import java.util.regex.Matcher;
import java.util.regex.Pattern;

/**
 * Helper to remove wiki formatting from strings.
 */
public class HtmlCleaner {
    private static final Pattern LINKPATTERN = Pattern.compile("(.*?)(.*)", Pattern.CASE_INSENSITIVE);
    private static final Pattern IMAGEPATTERN = Pattern.compile("", Pattern.CASE_INSENSITIVE);
    private static final Pattern PRE_FORMATTED_PATTERN = Pattern.compile("
\\s*(.*?)\\s*
", Pattern.DOTALL); /** * Gets a URL from a wiki page value. * @param htmlLink link as present on wiki page. * @return address the link points to (if it is an 'a'), the original link otherwise. */ public String getUrl(String htmlLink) { String result = htmlLink; if (htmlLink != null) { Matcher linkMatcher = LINKPATTERN.matcher(htmlLink); Matcher imgMatcher = IMAGEPATTERN.matcher(htmlLink); if (linkMatcher.matches()) { String href = linkMatcher.group(1); href = StringEscapeUtils.unescapeHtml4(href); result = href + linkMatcher.group(3); } else if (imgMatcher.matches()) { String src = imgMatcher.group(1); result = StringEscapeUtils.unescapeHtml4(src); } } return result; } /** * Removes result of wiki formatting (for e.g. email addresses) if needed. * @param rawValue value as received from FitNesse. * @return rawValue if it was just text or any object, cleaned version if it was not. */ public T cleanupValue(T rawValue) { T cleanValue; if (rawValue instanceof String) { cleanValue = (T) cleanupValue((String) rawValue); } else { cleanValue = rawValue; } return cleanValue; } /** * Removes result of wiki formatting (for e.g. email addresses) if needed. * @param rawValue value as received from Fitnesse. * @return rawValue if it was just text, cleaned version if it was not. */ public String cleanupValue(String rawValue) { String result = null; if (rawValue != null) { Matcher matcher = LINKPATTERN.matcher(rawValue); if (matcher.matches()) { result = matcher.group(2) + matcher.group(3); } else { result = cleanupPreFormatted(rawValue); } } return result; } /** * Removes HTML preformatting (if any). * @param value value (possibly pre-formatted) * @return value without HTML preformatting. */ public String cleanupPreFormatted(String value) { String result = value; if (value != null) { Matcher matcher = PRE_FORMATTED_PATTERN.matcher(value); if (matcher.matches()) { String escapedBody = matcher.group(1); result = StringEscapeUtils.unescapeHtml4(escapedBody); } } return result; } }




© 2015 - 2025 Weber Informatics LLC | Privacy Policy