All Downloads are FREE. Search and download functionalities are using the official Maven repository.

com.frameworkset.util.HtmlUtils Maven / Gradle / Ivy

/*
 *  Copyright 2008 biaoping.yin
 *
 *  Licensed under the Apache License, Version 2.0 (the "License");
 *  you may not use this file except in compliance with the License.
 *  You may obtain a copy of the License at
 *
 *      http://www.apache.org/licenses/LICENSE-2.0
 *
 *  Unless required by applicable law or agreed to in writing, software
 *  distributed under the License is distributed on an "AS IS" BASIS,
 *  WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 *  See the License for the specific language governing permissions and
 *  limitations under the License.
 */
package com.frameworkset.util;


/**
 * 

Title: HtmlUtils.java

*

Description:

*

bboss workgroup

*

Copyright (c) 2008

* @Date 2010-9-28 * @author biaoping.yin * @version 1.0 */ public abstract class HtmlUtils { /** * Shared instance of pre-parsed HTML character entity references. */ private static final HtmlCharacterEntityReferences characterEntityReferences = new HtmlCharacterEntityReferences(); /** * Turn special characters into HTML character references. * Handles complete character set defined in HTML 4.01 recommendation. *

Escapes all special characters to their corresponding * entity reference (e.g. <). *

Reference: * * http://www.w3.org/TR/html4/sgml/entities.html * * @param input the (unescaped) input string * @return the escaped string */ public static String htmlEscape(String input) { if (input == null) { return null; } StringBuilder escaped = new StringBuilder(input.length() * 2); for (int i = 0; i < input.length(); i++) { char character = input.charAt(i); String reference = characterEntityReferences.convertToReference(character); if (reference != null) { escaped.append(reference); } else { escaped.append(character); } } return escaped.toString(); } /** * Turn special characters into HTML character references. * Handles complete character set defined in HTML 4.01 recommendation. *

Escapes all special characters to their corresponding numeric * reference in decimal format (&#Decimal;). *

Reference: * * http://www.w3.org/TR/html4/sgml/entities.html * * @param input the (unescaped) input string * @return the escaped string */ public static String htmlEscapeDecimal(String input) { if (input == null) { return null; } StringBuilder escaped = new StringBuilder(input.length() * 2); for (int i = 0; i < input.length(); i++) { char character = input.charAt(i); if (characterEntityReferences.isMappedToReference(character)) { escaped.append(HtmlCharacterEntityReferences.DECIMAL_REFERENCE_START); escaped.append((int) character); escaped.append(HtmlCharacterEntityReferences.REFERENCE_END); } else { escaped.append(character); } } return escaped.toString(); } /** * Turn special characters into HTML character references. * Handles complete character set defined in HTML 4.01 recommendation. *

Escapes all special characters to their corresponding numeric * reference in hex format (&#xHex;). *

Reference: * * http://www.w3.org/TR/html4/sgml/entities.html * * @param input the (unescaped) input string * @return the escaped string */ public static String htmlEscapeHex(String input) { if (input == null) { return null; } StringBuilder escaped = new StringBuilder(input.length() * 2); for (int i = 0; i < input.length(); i++) { char character = input.charAt(i); if (characterEntityReferences.isMappedToReference(character)) { escaped.append(HtmlCharacterEntityReferences.HEX_REFERENCE_START); escaped.append(Integer.toString((int) character, 16)); escaped.append(HtmlCharacterEntityReferences.REFERENCE_END); } else { escaped.append(character); } } return escaped.toString(); } /** * Turn HTML character references into their plain text UNICODE equivalent. *

Handles complete character set defined in HTML 4.01 recommendation * and all reference types (decimal, hex, and entity). *

Correctly converts the following formats: *

* &#Entity; - (Example: &amp;) case sensitive * &#Decimal; - (Example: &#68;)
* &#xHex; - (Example: &#xE5;) case insensitive
*
* Gracefully handles malformed character references by copying original * characters as is when encountered.

*

Reference: * * http://www.w3.org/TR/html4/sgml/entities.html * * @param input the (escaped) input string * @return the unescaped string */ public static String htmlUnescape(String input) { if (input == null) { return null; } return new HtmlCharacterEntityDecoder(characterEntityReferences, input).decode(); } }





© 2015 - 2025 Weber Informatics LLC | Privacy Policy