All Downloads are FREE. Search and download functionalities are using the official Maven repository.

jodd.lagarto.dom.HtmlImplicitClosingRules Maven / Gradle / Ivy

Go to download

Jodd Lagarto is fast and versatile all purpose HTML parser. Includes Jerry and CSSelly.

There is a newer version: 6.0.6
Show newest version
// Copyright (c) 2003-present, Jodd Team (http://jodd.org)
// All rights reserved.
//
// Redistribution and use in source and binary forms, with or without
// modification, are permitted provided that the following conditions are met:
//
// 1. Redistributions of source code must retain the above copyright notice,
// this list of conditions and the following disclaimer.
//
// 2. Redistributions in binary form must reproduce the above copyright
// notice, this list of conditions and the following disclaimer in the
// documentation and/or other materials provided with the distribution.
//
// THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
// AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
// IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
// ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT HOLDER OR CONTRIBUTORS BE
// LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
// CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
// SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
// INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
// CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
// ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
// POSSIBILITY OF SUCH DAMAGE.

package jodd.lagarto.dom;

import jodd.util.StringUtil;

/**
 * HTML rules for implicitly closing tags.
 */
public class HtmlImplicitClosingRules {

	// ---------------------------------------------------------------- start

	/**
	 * List of tags that can be implicitly closed on provided children.
	 * The first array contains parent tag name (i.e. parent node name),
	 * that can be closed.
	 * The second array contains list of all children that will
	 * implicitly close the parent (i.e. current node name).
	 * 

* Interpret it like this: [second array OPEN tag] closes [first array tag] */ public static final String[][] IMPLIED_ON_START = new String[][] { new String[] {"p"}, new String[] { "address", "article", "aside", "blockquote", "center", "details", "dir", "div", "dl", "fieldset", "figcaption", "figure", "footer", "header", "hgroup", "menu", "nav", "ol", "p", "section", "summary", "ul", "h1", "h2", "h3", "h4", "h5", "h6", "pre", "listing", "form", "li", "dd", "dt", "plaintext", "table", "hr", "xmp", }, new String[] {"dd", "dt"}, new String[] {"dd", "dt"}, new String[] {"li"}, new String[] {"li"}, new String[] {"td"}, new String[] {"td"}, new String[] {"th"}, new String[] {"th"}, new String[] {"tr", "td", "th", "colgroup"}, new String[] {"tr"}, new String[] {"thead", "tr", "td", "th", "colgroup"}, new String[] {"tbody"}, new String[] {"tbody", "tr", "td", "th"}, new String[] {"tfoot"}, new String[] {"colgroup"}, new String[] {"thead"}, new String[] {"colgroup"}, new String[] {"colgroup"}, new String[] {"optgroup"}, new String[] {"optgroup"}, new String[] {"head"}, new String[] {"body"}, }; /** * Returns true if parent node tag can be closed implicitly. */ public boolean implicitlyCloseParentTagOnNewTag(String parentNodeName, String nodeName) { if (parentNodeName == null) { return false; } parentNodeName = parentNodeName.toLowerCase(); nodeName = nodeName.toLowerCase(); for (int i = 0; i < IMPLIED_ON_START.length; i+=2) { if (StringUtil.equalsOne(parentNodeName, IMPLIED_ON_START[i]) != -1) { if (StringUtil.equalsOne(nodeName, IMPLIED_ON_START[i + 1]) != -1) { return true; } } } return false; } // ---------------------------------------------------------------- close /** * List of tags that can be implicitly closed on tags end. * The first array contains current node name (i.e. ending tag). * The second array contains list of all of parent tags that can be closed. *

* Interpret it like this: [first array CLOSE tag] closes [second array tag] */ public static final String[][] IMPLIED_ON_END = new String[][] { new String[] {"dl"}, new String[] {"dd", "dt"}, new String[] {"ul", "ol"}, new String[] {"li"}, new String[] {"table"}, new String[] {"th", "td", "tr", "tbody", "tfoot", "thead"}, new String[] {"select"}, new String[] {"optgroup"}, new String[] {"body"}, new String[] {"dd", "dt", "li", "optgroup", "option", "p", "tbody", "td", "tfoot", "th", "thead", "tr", "html"}, new String[] {"html"}, new String[] {"dd", "dt", "li", "optgroup", "option", "p", "tbody", "td", "tfoot", "th", "thead", "tr", "body"}, }; /** * Returns true if current end tag (node name) closes the parent tag. */ public boolean implicitlyCloseParentTagOnTagEnd(String parentNodeName, String nodeName) { if (parentNodeName == null) { return false; } parentNodeName = parentNodeName.toLowerCase(); nodeName = nodeName.toLowerCase(); for (int i = 0; i < IMPLIED_ON_END.length; i += 2) { if (StringUtil.equalsOne(nodeName, IMPLIED_ON_END[i]) != -1) { if (StringUtil.equalsOne(parentNodeName, IMPLIED_ON_END[i + 1]) != -1) { return true; } } } return false; } // ---------------------------------------------------------------- eof public static final String[] CLOSED_ON_EOF = new String[] { "dd", "dt", "li", "p", "tbody", "td", "tfoot", "th", "thead", "tr", "body", "html" }; /** * Returns true if tag should be closed on EOF. */ public boolean implicitlyCloseTagOnEOF(String nodeName) { if (nodeName == null) { return false; } nodeName = nodeName.toLowerCase(); return StringUtil.equalsOne(nodeName, CLOSED_ON_EOF) != -1; } }





© 2015 - 2024 Weber Informatics LLC | Privacy Policy