com.codename1.ui.html.HTMLUtils Maven / Gradle / Ivy
/*
* Copyright (c) 2008, 2010, Oracle and/or its affiliates. All rights reserved.
* DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER.
* This code is free software; you can redistribute it and/or modify it
* under the terms of the GNU General Public License version 2 only, as
* published by the Free Software Foundation. Oracle designates this
* particular file as subject to the "Classpath" exception as provided
* by Oracle in the LICENSE file that accompanied this code.
*
* This code is distributed in the hope that it will be useful, but WITHOUT
* ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
* FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License
* version 2 for more details (a copy is included in the LICENSE file that
* accompanied this code).
*
* You should have received a copy of the GNU General Public License version
* 2 along with this work; if not, write to the Free Software Foundation,
* Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA.
*
* Please contact Oracle, 500 Oracle Parkway, Redwood Shores
* CA 94065 USA or visit www.oracle.com if you need additional information or
* have any questions.
*/
package com.codename1.ui.html;
import java.util.Hashtable;
/**
* This class contains several useful static methods for HTML
*
* @author Ofir Leitner
* @deprecated the HTML package is no longer used or maintained and may be removed in a future revision
*/
public class HTMLUtils {
// Prevents instantiation - this class has static method only
private HTMLUtils() {
}
/**
* The char entities strings supported in XML. When a char entity is found these will be compared against first.
*/
private static final String[] XML_CHAR_ENTITIES = {
"lt", // lesser-than
"gt", // greater-than
"amp", // ampersand
"quot", //quotation mark
"apos", // apostrophe
//"bull", //bullet
//"euro" //euro
};
/**
* The numericals value of char entities strings above.
*/
private static final int[] XML_CHAR_ENTITIES_VALS = {
60, // "lt", // lesser-than
62, // "gt", // greater-than
38, // "amp", // ampersand
34, // "quot", //quotation mark
39, // "apos", // apostrophe
//8226, // "bull", //bullet
//8364 // "euro"}; //euro
};
/**
* This is a list of ISO 8859-1 Symbols that can be used as HTML char entities
*/
private static final String[] HTML_BASIC_CHAR_ENTITY_STRINGS = {
"nbsp","iexcl","cent","pound","curren","yen","brvbar","sect","uml","copy","ordf","laquo","not","shy","reg","macr","deg","plusmn","sup2","sup3","acute",
"micro","para","middot","cedil","sup1","ordm","raquo","frac14","frac12","frac34","iquest","Agrave","Aacute","Acirc","Atilde","Auml","Aring","AElig",
"Ccedil","Egrave","Eacute","Ecirc","Euml","Igrave","Iacute","Icirc","Iuml","ETH","Ntilde","Ograve","Oacute","Ocirc","Otilde","Ouml","times","Oslash",
"Ugrave","Uacute","Ucirc","Uuml","Yacute","THORN","szlig","agrave","aacute","acirc","atilde","auml","aring","aelig","ccedil","egrave","eacute","ecirc",
"euml","igrave","iacute","icirc","iuml","eth","ntilde","ograve","oacute","ocirc","otilde","ouml","divide","oslash","ugrave","uacute","ucirc","uuml",
"yacute","thorn","yuml"};
/**
* Converts an XML char entity to the matching character or string.
* This is a convenience method that uses convertCharEntity with false for lookupHTMLentities and a null userDefinedCharEntities
*
* @param charEntity The char entity to convert (Not including the & and ;)
* @return A string containing a single char, or the original char entity string (with & and ;) if the char entity couldn't be resolved
*/
public static String convertXMLCharEntity(String charEntity) {
return convertCharEntity(charEntity, false, null);
}
/**
* Converts an HTML char entity to the matching character or string.
* This is a convenience method that uses convertCharEntity with true for lookupHTMLentities and a null userDefinedCharEntities
*
* @param charEntity The char entity to convert (Not including the & and ;)
* @return A string containing a single char, or the original char entity string (with & and ;) if the char entity couldn't be resolved
*/
public static String convertHTMLCharEntity(String charEntity) {
return convertCharEntity(charEntity, true, null);
}
/**
* Converts a char entity to the matching character or string.
* This handles both numbered and symbol char entities (The latter is done via getCharEntityCode)
*
* @param charEntity The char entity to convert (Not including the & and ;)
* @param lookupHTMLentities true to include the basic HTML named char entities (unicode 160-255), false otherwise
* @param userDefinedCharEntities A hashtable containing (String,int) dentoing the char entity name and its unicode
* @return A string containing a single char, or the original char entity string (with & and ;) if the char entity couldn't be resolved
*/
public static String convertCharEntity(String charEntity,boolean lookupHTMLentities,Hashtable userDefinedCharEntities) {
int charCode=-1;
if (charEntity.startsWith("#")) { //numbered char entity
if (charEntity.startsWith("#x")) { //hex
try {
charCode=Integer.parseInt(charEntity.substring(2),16);
} catch (NumberFormatException nfe) {
//if not a number - simply ignore char entity
}
} else {
try {
charCode=Integer.parseInt(charEntity.substring(1));
} catch (NumberFormatException nfe) {
//if not a number - simply ignore char entity
}
}
} else { //not numbered, rather a symbol
charCode=getCharEntityCode(charEntity,lookupHTMLentities,userDefinedCharEntities);
}
if (charCode!=-1) {
return ""+(char)charCode;
} else {
throw new IllegalArgumentException("Unknown character entity - "+charEntity);
//notifyError(ParserCallback.ERROR_UNRECOGNIZED_CHAR_ENTITY,null,null,null, "Unrecognized char entity: "+charEntity);
//return "&"+charEntity+";"; // Another option is to return an empty string, but returning the entity will unravel bugs and will also allow ignoring common mistakes such as using the & char (instead of ')
}
}
private static int getCharEntityCode(String symbol,boolean html,Hashtable userDefined) {
// First tries the XML basic char entities
int val=-1;
for (int i=0;i='a') && (c<='z')) || ((c>='A') && (c<='Z')) ||
((c>='0') && (c<='9')) ||
(c=='-') || (c=='.') || (c=='_') || (c=='~'))
{
encodedStr+=c;
} else if ((c>=0x80) && (c<=0xffff)) { // UTF encoding - See http://en.wikipedia.org/wiki/UTF-8
int firstLiteral = c/256;
int secLiteral = c%256;
if (c<=0x07ff) { // 2 literals unicode
firstLiteral=192+(firstLiteral<<2)+(secLiteral>>6);
secLiteral=128+(secLiteral & 63);
encodedStr+="%"+Integer.toHexString(firstLiteral).toUpperCase()+"%"+Integer.toHexString(secLiteral).toUpperCase();
} else { // 3 literals unicode
int thirdLiteral=128+(secLiteral & 63);
secLiteral=128+((firstLiteral%16)<<2)+(secLiteral>>6);
firstLiteral=224+(firstLiteral>>4);
encodedStr+="%"+Integer.toHexString(firstLiteral).toUpperCase()+"%"+Integer.toHexString(secLiteral).toUpperCase()
+"%"+Integer.toHexString(thirdLiteral).toUpperCase();
}
// The max value of a char is 0xffff, so though URL encoding supports values bigger than that, we can't provide for it
/*} else if (c>0xffff) { // 4 literals unicode (CJK upper ranges and others)
int z=c/65536;
int y=c%65536;
int x=y%256;
y=y/256;
int[] literal=new int[4];
literal[0]=240+(z>>2);
literal[1]=128+((z%4)<<4)+(y>>4);
literal[2]=128+((y%16)<<2)+(x>>6);
literal[3]=128+(x & 63);
for(int l=0;l
© 2015 - 2025 Weber Informatics LLC | Privacy Policy