jodd.lagarto.dom.LagartoHtmlRendererNodeVisitor Maven / Gradle / Ivy
Go to download
Show more of this group Show more artifacts with this name
Show all versions of extractor Show documentation
Show all versions of extractor Show documentation
Web Data Extractor - Extract data from common web format. like HTML,XML,JSON.
The newest version!
// Copyright (c) 2003-present, Jodd Team (http://jodd.org)
// All rights reserved.
//
// Redistribution and use in source and binary forms, with or without
// modification, are permitted provided that the following conditions are met:
//
// 1. Redistributions of source code must retain the above copyright notice,
// this list of conditions and the following disclaimer.
//
// 2. Redistributions in binary form must reproduce the above copyright
// notice, this list of conditions and the following disclaimer in the
// documentation and/or other materials provided with the distribution.
//
// THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
// AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
// IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
// ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT HOLDER OR CONTRIBUTORS BE
// LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
// CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
// SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
// INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
// CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
// ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
// POSSIBILITY OF SUCH DAMAGE.
package jodd.lagarto.dom;
import jodd.lagarto.TagWriterUtil;
import jodd.util.HtmlEncoder;
import java.io.IOException;
/**
* {@link NodeVisitor} that renders DOM tree to string.
*/
public class LagartoHtmlRendererNodeVisitor implements NodeVisitor {
protected final Appendable appendable;
public LagartoHtmlRendererNodeVisitor(Appendable appendable) {
this.appendable = appendable;
}
public void cdata(CData cdata) {
String nodeValue = cdata.getNodeValue();
try {
TagWriterUtil.writeCData(appendable, nodeValue);
} catch (IOException ioex) {
throw new LagartoDOMException(ioex);
}
}
public void comment(Comment comment) {
String nodeValue = comment.getNodeValue();
try {
TagWriterUtil.writeComment(appendable, nodeValue);
} catch (IOException ioex) {
throw new LagartoDOMException(ioex);
}
}
public void document(Document document) {
document.visitChildren(this);
}
public void documentType(DocumentType documentType) {
try {
TagWriterUtil.writeDoctype(appendable,
documentType.nodeValue,
documentType.publicId,
documentType.systemId);
} catch (IOException ioex) {
throw new LagartoDOMException(ioex);
}
}
public void text(Text text) {
String nodeValue = text.getTextContent();
try {
appendable.append(nodeValue);
} catch (IOException ioex) {
throw new LagartoDOMException(ioex);
}
}
public void xmlDeclaration(XmlDeclaration xmlDeclaration) {
try {
TagWriterUtil.writeXml(appendable,
xmlDeclaration.getVersion(), xmlDeclaration.getEncoding(), xmlDeclaration.getStandalone());
} catch (IOException ioex) {
throw new LagartoDOMException(ioex);
}
}
// ---------------------------------------------------------------- element
/**
* Enumeration of case options for output name.
*/
public enum Case {
/**
* Default case, depends on parser case sensitivity.
*/
DEFAULT,
/**
* Raw name, no modifications.
*/
RAW,
/**
* Lowercase name.
*/
LOWERCASE,
/**
* Uppercase name.
*/
UPPERCASE,
}
/**
* Letter case of tag names.
*/
protected Case tagCase = Case.DEFAULT;
/**
* Letter case of attributes names.
*/
protected Case attributeCase = Case.DEFAULT;
/**
* Sets {@link Case case} of tag names.
*/
public void setTagCase(Case tagCase) {
this.tagCase = tagCase;
}
public Case getTagCase() {
return tagCase;
}
/**
* Sets {@link Case case} of attribute names.
*/
public void setAttributeCase(Case attributeCase) {
this.attributeCase = attributeCase;
}
public Case getAttributeCase() {
return attributeCase;
}
/**
* Resets all cases to default.
*/
public void reset() {
tagCase = Case.DEFAULT;
attributeCase = Case.DEFAULT;
}
/**
* Renders node name.
*/
protected String resolveNodeName(Node node) {
switch (tagCase) {
case DEFAULT:
return node.getNodeName();
case RAW:
return node.getNodeRawName();
case LOWERCASE:
return node.getNodeRawName().toLowerCase();
case UPPERCASE:
return node.getNodeRawName().toUpperCase();
}
return null;
}
/**
* Renders attribute name.
*/
protected String resolveAttributeName(Node node, Attribute attribute) {
switch (attributeCase) {
case DEFAULT:
return attribute.getName();
case RAW:
return attribute.getRawName();
case LOWERCASE:
return attribute.getRawName().toLowerCase();
case UPPERCASE:
return attribute.getRawName().toUpperCase();
}
return null;
}
/**
* Renders attribute.
*/
protected void renderAttribute(Node node, Attribute attribute, Appendable appendable) throws IOException {
String name = resolveAttributeName(node, attribute);
String value = attribute.getValue();
appendable.append(name);
if (value != null) {
appendable.append('=');
appendable.append('\"');
appendable.append(HtmlEncoder.attributeDoubleQuoted(value));
appendable.append('\"');
}
}
public void element(Element element) {
try {
_element(element);
} catch (IOException ioex) {
throw new LagartoDOMException(ioex);
}
}
protected void _element(Element element) throws IOException {
String nodeName = resolveNodeName(element);
appendable.append('<');
appendable.append(nodeName);
int attrCount = element.getAttributesCount();
if (attrCount != 0) {
for (int i = 0; i < attrCount; i++) {
Attribute attr = element.getAttribute(i);
appendable.append(' ');
renderAttribute(element, attr, appendable);
}
}
int childCount = element.getChildNodesCount();
if (element.selfClosed && childCount == 0) {
appendable.append("/>");
return;
}
appendable.append('>');
if (element.voidElement) {
return;
}
if (childCount != 0) {
elementBody(element);
}
appendable.append("");
appendable.append(nodeName);
appendable.append('>');
}
protected void elementBody(Element element) throws IOException {
int childCount = element.getChildNodesCount();
if (element.isRawTag()) {
for (int i = 0; i < childCount; i++) {
Node childNode = element.getChild(i);
if (childNode.getNodeType() == Node.NodeType.TEXT) {
appendable.append(childNode.getNodeValue());
} else {
childNode.visit(this);
}
}
} else {
element.visitChildren(this);
}
}
}
© 2015 - 2025 Weber Informatics LLC | Privacy Policy