All Downloads are FREE. Search and download functionalities are using the official Maven repository.

com.thoughtworks.xstream.io.xml.XmlFriendlyNameCoder Maven / Gradle / Ivy

There is a newer version: 0.40.13
Show newest version
/*
 * Copyright (C) 2006 Joe Walnes.
 * Copyright (C) 2006, 2007, 2008, 2009, 2011, 2013 XStream Committers.
 * All rights reserved.
 *
 * The software in this package is published under the terms of the BSD
 * style license a copy of which has been included with this distribution in
 * the LICENSE.txt file.
 *
 * Created on 15. August 2009 by Joerg Schaible, copied from XmlFriendlyReplacer.
 */
package com.thoughtworks.xstream.io.xml;

import com.thoughtworks.xstream.converters.reflection.ObjectAccessException;
import com.thoughtworks.xstream.io.naming.NameCoder;

import java.util.ArrayList;
import java.util.HashMap;
import java.util.Map;


/**
 * Encode and decode tag and attribute names in XML drivers.
 * 

* This NameCoder is designed to ensure the correct encoding and decoding of names used for Java * types and fields to XML tags and attribute names. *

*

* The default replacements are: *

*
    *
  • $ (dollar) chars are replaced with _- (underscore dash) string.
  • *
  • _ (underscore) chars are replaced with __ (double underscore) string.
  • *
  • other characters that are invalid in XML names are encoded with _.XXXX (underscore * dot followed by hex representation of character).
  • *
* * @author Jörg Schaible * @author Mauro Talevi * @author Tatu Saloranta * @author Michael Schnell * @see XML 1.0 name definition * @see XML 1.1 name definition * @see Java * identifier definition * @since 1.4 */ public class XmlFriendlyNameCoder implements NameCoder, Cloneable { private static final IntPair[] XML_NAME_START_CHAR_BOUNDS; private static final IntPair[] XML_NAME_CHAR_EXTRA_BOUNDS; static { class IntPairList extends ArrayList { void add(int min, int max) { super.add(new IntPair(min, max)); } void add(char cp) { super.add(new IntPair(cp, cp)); } } // legal characters in XML names according to // http://www.w3.org/TR/REC-xml/#NT-Name and // http://www.w3.org/TR/xml11/#NT-Name IntPairList list = new IntPairList(); list.add(':'); list.add('A', 'Z'); list.add('a', 'z'); list.add('_'); list.add(0xC0, 0xD6); list.add(0xD8, 0xF6); list.add(0xF8, 0x2FF); list.add(0x370, 0x37D); list.add(0x37F, 0x1FFF); list.add(0x200C, 0x200D); list.add(0x2070, 0x218F); list.add(0x2C00, 0x2FEF); list.add(0x3001, 0xD7FF); list.add(0xF900, 0xFDCF); list.add(0xFDF0, 0xFFFD); list.add(0x10000, 0xEFFFF); XML_NAME_START_CHAR_BOUNDS = (IntPair[])list.toArray(new IntPair[list.size()]); list.clear(); list.add('-'); list.add('.'); list.add('0', '9'); list.add('\u00b7'); list.add(0x0300, 0x036F); list.add(0x203F, 0x2040); XML_NAME_CHAR_EXTRA_BOUNDS = (IntPair[])list.toArray(new IntPair[list.size()]); } private final String dollarReplacement; private final String escapeCharReplacement; private transient Map escapeCache; private transient Map unescapeCache; private final String hexPrefix; /** * Construct a new XmlFriendlyNameCoder. * * @since 1.4 */ public XmlFriendlyNameCoder() { this("_-", "__"); } /** * Construct a new XmlFriendlyNameCoder with custom replacement strings for dollar and the * escape character. * * @param dollarReplacement * @param escapeCharReplacement * @since 1.4 */ public XmlFriendlyNameCoder(String dollarReplacement, String escapeCharReplacement) { this(dollarReplacement, escapeCharReplacement, "_."); } /** * Construct a new XmlFriendlyNameCoder with custom replacement strings for dollar, the * escape character and the prefix for hexadecimal encoding of invalid characters in XML * names. * * @param dollarReplacement * @param escapeCharReplacement * @since 1.4 */ public XmlFriendlyNameCoder( String dollarReplacement, String escapeCharReplacement, String hexPrefix) { this.dollarReplacement = dollarReplacement; this.escapeCharReplacement = escapeCharReplacement; this.hexPrefix = hexPrefix; readResolve(); } /** * {@inheritDoc} */ public String decodeAttribute(String attributeName) { return decodeName(attributeName); } /** * {@inheritDoc} */ public String decodeNode(String elementName) { return decodeName(elementName); } /** * {@inheritDoc} */ public String encodeAttribute(String name) { return encodeName(name); } /** * {@inheritDoc} */ public String encodeNode(String name) { return encodeName(name); } private String encodeName(String name) { String s = (String)escapeCache.get(name); if (s == null) { final int length = name.length(); // First, fast (common) case: nothing to escape int i = 0; for (; i < length; i++ ) { char c = name.charAt(i); if (c == '$' || c == '_' || c <= 27 || c >= 127) { break; } } if (i == length) { return name; } // Otherwise full processing final StringBuffer result = new StringBuffer(length + 8); // We know first N chars are safe if (i > 0) { result.append(name.substring(0, i)); } for (; i < length; i++ ) { char c = name.charAt(i); if (c == '$') { result.append(dollarReplacement); } else if (c == '_') { result.append(escapeCharReplacement); } else if ((i == 0 && !isXmlNameStartChar(c)) || (i > 0 && !isXmlNameChar(c))) { result.append(hexPrefix); if (c < 16) result.append("000"); else if (c < 256) result.append("00"); else if (c < 4096) result.append("0"); result.append(Integer.toHexString(c)); } else { result.append(c); } } s = result.toString(); escapeCache.put(name, s); } return s; } private String decodeName(String name) { String s = (String)unescapeCache.get(name); if (s == null) { final char dollarReplacementFirstChar = dollarReplacement.charAt(0); final char escapeReplacementFirstChar = escapeCharReplacement.charAt(0); final char hexPrefixFirstChar = hexPrefix.charAt(0); final int length = name.length(); // First, fast (common) case: nothing to decode int i = 0; for (; i < length; i++ ) { char c = name.charAt(i); // We'll do a quick check for potential match if (c == dollarReplacementFirstChar || c == escapeReplacementFirstChar || c == hexPrefixFirstChar) { // and if it might be a match, just quit, will check later on break; } } if (i == length) { return name; } // Otherwise full processing final StringBuffer result = new StringBuffer(length + 8); // We know first N chars are safe if (i > 0) { result.append(name.substring(0, i)); } for (; i < length; i++ ) { char c = name.charAt(i); if (c == dollarReplacementFirstChar && name.startsWith(dollarReplacement, i)) { i += dollarReplacement.length() - 1; result.append('$'); } else if (c == hexPrefixFirstChar && name.startsWith(hexPrefix, i)) { i += hexPrefix.length(); c = (char)Integer.parseInt(name.substring(i, i + 4), 16); i += 3; result.append(c); } else if (c == escapeReplacementFirstChar && name.startsWith(escapeCharReplacement, i)) { i += escapeCharReplacement.length() - 1; result.append('_'); } else { result.append(c); } } s = result.toString(); unescapeCache.put(name, s); } return s; } public Object clone() { try { XmlFriendlyNameCoder coder = (XmlFriendlyNameCoder)super.clone(); coder.readResolve(); return coder; } catch (CloneNotSupportedException e) { throw new ObjectAccessException("Cannot clone XmlFriendlyNameCoder", e); } } private Object readResolve() { escapeCache = createCacheMap(); unescapeCache = createCacheMap(); return this; } protected Map createCacheMap() { return new HashMap(); } private static class IntPair { int min; int max; public IntPair(int min, int max) { this.min = min; this.max = max; } } private static boolean isXmlNameStartChar(int cp) { return isInNameCharBounds(cp, XML_NAME_START_CHAR_BOUNDS); } private static boolean isXmlNameChar(int cp) { if (isXmlNameStartChar(cp)) { return true; } return isInNameCharBounds(cp, XML_NAME_CHAR_EXTRA_BOUNDS); } private static boolean isInNameCharBounds(int cp, IntPair[] nameCharBounds) { for (int i = 0; i < nameCharBounds.length; ++i) { IntPair p = nameCharBounds[i]; if (cp >= p.min && cp <= p.max) { return true; } } return false; } }




© 2015 - 2025 Weber Informatics LLC | Privacy Policy