All downloads are free. Search and download functionality uses the official Maven repository.

org.apache.tapestry.util.text.MarkupCharacterTranslator Maven / Gradle / Ivy

// Copyright 2004, 2005 The Apache Software Foundation
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

package org.apache.tapestry.util.text;

/**
 * An object that encodes a character according to rules of the HTML specification, 
 * so that it will be properly parsed by a browser irrespectively of the character
 * encoding used in the HTML output.
 * 
 * @author mb
 * @since 4.0
 */
public class MarkupCharacterTranslator implements ICharacterTranslator
{
    private static final String SAFE_CHARACTERS =
        "01234567890"
            + "abcdefghijklmnopqrstuvwxyz"
            + "ABCDEFGHIJKLMNOPQRSTUVWXYZ"
            + "\t\n\r !#$%'()*+,-./:;=?@[\\]^_`{|}~";

    private static final String[][] ENTITIES = {
    	{ "\"", """ }, 
		{ "<", "<" },
		{ ">", ">" },
		{ "&", "&" }
    };
    
    private static final ICharacterMatcher SAFE_MATCHER = new AsciiCharacterMatcher(SAFE_CHARACTERS);
    private static final ICharacterTranslator ENTITY_TRANSLATOR = new AsciiCharacterTranslator(ENTITIES);
    
    private boolean _encodeNonAscii;
    private ICharacterMatcher _safeMatcher;
    private ICharacterTranslator _entityTranslator;
	
    public MarkupCharacterTranslator()
    {
    	this(true);
    }
    
    public MarkupCharacterTranslator(boolean encodeNonAscii)
    {
    	this(encodeNonAscii, SAFE_MATCHER, ENTITY_TRANSLATOR);
    }
    
    public MarkupCharacterTranslator(boolean encodeNonAscii, ICharacterMatcher safeMatcher, ICharacterTranslator entityTranslator)
    {
    	_encodeNonAscii = encodeNonAscii;
    	_safeMatcher = safeMatcher;
    	_entityTranslator = entityTranslator;
    }

    public MarkupCharacterTranslator(boolean encodeNonAscii, String safeCharacters, String[][] entities)
    {
    	_encodeNonAscii = encodeNonAscii;
    	_safeMatcher = new AsciiCharacterMatcher(safeCharacters);
    	_entityTranslator = new AsciiCharacterTranslator(entities);
    }
    
	/**
	 * @see org.apache.tapestry.util.text.IMarkupCharacterTranslator#translateAttribute(char)
	 */
	public String translate(char ch) {
		// IE and Firefox do not handle characters between 128 and 159 well, 
		// so they have to be quoted as well 
		if (ch >= 160 && !_encodeNonAscii) 
			return null;
		
		if (_safeMatcher.matches(ch))
			return null;

		String entity = _entityTranslator.translate(ch);
		if (entity != null)
			return entity;
		
		// needs to use a NumberFormat here to be fully compliant, 
		// but this is accepted fine by the browsers
		return "&#" + (int) ch + ";";
	}
}




© 2015 - 2025 Weber Informatics LLC | Privacy Policy