org.jdom2.input.DOMBuilder Maven / Gradle / Ivy
Go to download
Show more of this group Show more artifacts with this name
Show all versions of jdom Show documentation
Show all versions of jdom Show documentation
A complete, Java-based solution for accessing, manipulating,
and outputting XML data
/*--
Copyright (C) 2000-2012 Jason Hunter & Brett McLaughlin.
All rights reserved.
Redistribution and use in source and binary forms, with or without
modification, are permitted provided that the following conditions
are met:
1. Redistributions of source code must retain the above copyright
notice, this list of conditions, and the following disclaimer.
2. Redistributions in binary form must reproduce the above copyright
notice, this list of conditions, and the disclaimer that follows
these conditions in the documentation and/or other materials
provided with the distribution.
3. The name "JDOM" must not be used to endorse or promote products
derived from this software without prior written permission. For
written permission, please contact <request_AT_jdom_DOT_org>.
4. Products derived from this software may not be called "JDOM", nor
may "JDOM" appear in their name, without prior written permission
from the JDOM Project Management <request_AT_jdom_DOT_org>.
In addition, we request (but do not require) that you include in the
end-user documentation provided with the redistribution and/or in the
software itself an acknowledgement equivalent to the following:
"This product includes software developed by the
JDOM Project (http://www.jdom.org/)."
Alternatively, the acknowledgment may be graphical using the logos
available at http://www.jdom.org/images/logos.
THIS SOFTWARE IS PROVIDED ``AS IS'' AND ANY EXPRESSED OR IMPLIED
WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES
OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
DISCLAIMED. IN NO EVENT SHALL THE JDOM AUTHORS OR THE PROJECT
CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF
USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND
ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY,
OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT
OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
SUCH DAMAGE.
This software consists of voluntary contributions made by many
individuals on behalf of the JDOM Project and was originally
created by Jason Hunter <jhunter_AT_jdom_DOT_org> and
Brett McLaughlin <brett_AT_jdom_DOT_org>. For more information
on the JDOM Project, please see <http://www.jdom.org/>.
*/
package org.jdom2.input;
/*
* To keep things simple, all DOM-based items are fully qualified in this code.
* As such, there are no import org.w3c.dom.* statements...
* This way there is less confusion about what a Document or Element is....
*/
import static org.jdom2.JDOMConstants.*;
import java.util.HashMap;
import org.jdom2.Attribute;
import org.jdom2.DefaultJDOMFactory;
import org.jdom2.DocType;
import org.jdom2.Document;
import org.jdom2.Element;
import org.jdom2.JDOMFactory;
import org.jdom2.Namespace;
/**
* Builds a JDOM Document from a pre-existing DOM {@link org.w3c.dom.Document
* org.w3c.dom.Document}.
*
* If you are building a document that has Namespace declarations, you should
* ensure that the Namespaces are correctly recorded in the DOM document before
* building the JDOM document from the DOM. By default, the native Java
* DOMBuilderFactory is configured to ignore Namespaces, and thus they are
* 'lost' in the DOM tree. JDOM expects Namespace-aware documents, so you
* should ensure that you change the default settings on the
* DOMBuilderFactory before parsing the DOM document. For example:
*
*
* DocumentBuilderFactory domfactory = DocumentBuilderFactory.newInstance();
* domfactory.setNamespaceAware(true);
* DocumentBuilder dombuilder = domfac.newDocumentBuilder();
* org.w3c.dom.Document doc = dombuilder.parse(....);
*
*
* @author Brett McLaughlin
* @author Jason Hunter
* @author Philip Nelson
* @author Kevin Regan
* @author Yusuf Goolamabbas
* @author Dan Schaffer
* @author Bradley S. Huffman
*/
public class DOMBuilder {
/** The factory for creating new JDOM objects */
private JDOMFactory factory = new DefaultJDOMFactory();
/**
* This creates a new DOMBuilder instance using the DefaultJDOMFactory
* to build the JDOM content.
*/
public DOMBuilder() {
}
/**
* This sets a custom JDOMFactory for the builder. Use this to build
* the tree with your own subclasses of the JDOM classes.
*
* @param factory JDOMFactory
to use
*/
public void setFactory(JDOMFactory factory) {
this.factory = factory;
}
/**
* Returns the current {@link org.jdom2.JDOMFactory} in use.
* @return the factory in use
*/
public JDOMFactory getFactory() {
return factory;
}
/**
* This will build a JDOM tree from an existing DOM tree.
*
* @param domDocument org.w3c.dom.Document
object
* @return Document
- JDOM document object.
*/
public Document build(org.w3c.dom.Document domDocument) {
Document doc = factory.document(null);
buildTree(domDocument, doc, null, true);
return doc;
}
/**
* This will build a JDOM Element from an existing DOM Element
*
* @param domElement org.w3c.dom.Element
object
* @return Element
- JDOM Element object
*/
public org.jdom2.Element build(org.w3c.dom.Element domElement) {
Document doc = factory.document(null);
buildTree(domElement, doc, null, true);
return doc.getRootElement();
}
/**
* This will build a JDOM CDATA from an existing DOM CDATASection
*
* @param cdata org.w3c.dom.CDATASection
object
* @return CDATA
- JDOM CDATA object
* @since JDOM2
*/
public org.jdom2.CDATA build(org.w3c.dom.CDATASection cdata) {
return factory.cdata(cdata.getTextContent());
}
/**
* This will build a JDOM Text from an existing DOM Text
*
* @param text org.w3c.dom.Text
object
* @return Text
- JDOM Text object
* @since JDOM2
*/
public org.jdom2.Text build(org.w3c.dom.Text text) {
return factory.text(text.getTextContent());
}
/**
* This will build a JDOM Comment from an existing DOM Comment
*
* @param comment org.w3c.dom.Comment
object
* @return Comment
- JDOM Comment object
* @since JDOM2
*/
public org.jdom2.Comment build(org.w3c.dom.Comment comment) {
return factory.comment(comment.getTextContent());
}
/**
* This will build a JDOM ProcessingInstruction from an existing DOM ProcessingInstruction
*
* @param pi org.w3c.dom.ProcessingInstruction
object
* @return ProcessingInstruction
- JDOM ProcessingInstruction object
* @since JDOM2
*/
public org.jdom2.ProcessingInstruction build(org.w3c.dom.ProcessingInstruction pi) {
return factory.processingInstruction(pi.getTarget(), pi.getData());
}
/**
* This will build a JDOM EntityRef from an existing DOM EntityReference
*
* @param er org.w3c.dom.EntityReference
object
* @return EnityRef
- JDOM EntityRef object
* @since JDOM2
*/
public org.jdom2.EntityRef build(org.w3c.dom.EntityReference er) {
return factory.entityRef(er.getNodeName());
}
/**
* This will build a JDOM Element from an existing DOM Element
*
* @param doctype org.w3c.dom.Element
object
* @return Element
- JDOM Element object
* @since JDOM2
*/
public org.jdom2.DocType build(org.w3c.dom.DocumentType doctype) {
String publicID = doctype.getPublicId();
String systemID = doctype.getSystemId();
String internalDTD = doctype.getInternalSubset();
DocType docType = factory.docType(doctype.getName());
docType.setPublicID(publicID);
docType.setSystemID(systemID);
docType.setInternalSubset(internalDTD);
return docType;
}
/**
* This takes a DOM Node
and builds up
* a JDOM tree, recursing until the DOM tree is exhausted
* and the JDOM tree results.
*
* @param node Code to examine.
* @param doc JDOM Document
being built.
* @param current Element
that is current parent.
* @param atRoot boolean
indicating whether at root level.
*/
private void buildTree(org.w3c.dom.Node node,
Document doc,
Element current,
boolean atRoot) {
// Recurse through the tree
switch (node.getNodeType()) {
case org.w3c.dom.Node.DOCUMENT_NODE:
org.w3c.dom.NodeList nodes = node.getChildNodes();
for (int i=0, size=nodes.getLength(); i= 0) {
prefix = nodeName.substring(0, colon);
localName = nodeName.substring(colon + 1);
}
// Get element's namespace
Namespace ns = null;
String uri = node.getNamespaceURI();
if (uri == null) {
ns = (current == null) ? Namespace.NO_NAMESPACE
: current.getNamespace(prefix);
}
else {
ns = Namespace.getNamespace(prefix, uri);
}
Element element = factory.element(localName, ns);
if (atRoot) {
// If at root, set as document root
factory.setRoot(doc, element);
} else {
// else add to parent element
factory.addContent(current, element);
}
// Add namespaces
org.w3c.dom.NamedNodeMap attributeList = node.getAttributes();
int attsize = attributeList.getLength();
for (int i = 0; i < attsize; i++) {
org.w3c.dom.Attr att = (org.w3c.dom.Attr) attributeList.item(i);
String attname = att.getName();
if (attname.startsWith(NS_PREFIX_XMLNS)) {
String attPrefix = NS_PREFIX_DEFAULT;
colon = attname.indexOf(':');
if (colon >= 0) {
attPrefix = attname.substring(colon + 1);
}
String attvalue = att.getValue();
Namespace declaredNS =
Namespace.getNamespace(attPrefix, attvalue);
// Add as additional namespaces if it's different
// to this element's namespace (perhaps we should
// also have logic not to mark them as additional if
// it's been done already, but it probably doesn't
// matter)
if (prefix.equals(attPrefix)) {
// RL: note, it should also be true that uri.equals(attvalue)
// if not, then the parser is boken.
// further, declaredNS should be exactly the same as ns
// so the following should in fact do nothing.
element.setNamespace(declaredNS);
}
else {
factory.addNamespaceDeclaration(element, declaredNS);
}
}
}
// Add attributes
for (int i = 0; i < attsize; i++) {
org.w3c.dom.Attr att = (org.w3c.dom.Attr) attributeList.item(i);
String attname = att.getName();
if ( !attname.startsWith(NS_PREFIX_XMLNS)) {
String attPrefix = NS_PREFIX_DEFAULT;
String attLocalName = attname;
colon = attname.indexOf(':');
if (colon >= 0) {
attPrefix = attname.substring(0, colon);
attLocalName = attname.substring(colon + 1);
}
String attvalue = att.getValue();
// Get attribute's namespace
Namespace attNS = null;
String attURI = att.getNamespaceURI();
if (attURI == null || NS_URI_DEFAULT.equals(attURI)) {
attNS = Namespace.NO_NAMESPACE;
} else {
// various conditions can lead here.
// the logical one is that we have a prefix for the
// attribute, and also a namespace URI.
// The alternative to that is in some conditions,
// the parser could have a 'default' or 'fixed'
// attribute that comes from an XSD used for
// validation. In that case there may not be a prefix
// There's also the possibility the DOM contains
// garbage.
if (attPrefix.length() > 0) {
// If the att has a prefix, we can assume that
// the DOM is valid, and we can just use the prefix.
// if this prefix conflicts with some other namespace
// then we re-declare it. If redeclaring it screws up
// other attributes in this Element, then the DOM
// was broken to start with.
attNS = Namespace.getNamespace(attPrefix, attURI);
} else {
// OK, no prefix.
// must be a defaulted value from an XSD.
// perhaps we can find the namespace in our
// element's ancestry, and use the prefix from that.
HashMap tmpmap = new HashMap();
for(Namespace nss : element.getNamespacesInScope()) {
if (nss.getPrefix().length() > 0 && nss.getURI().equals(attURI)) {
attNS = nss;
break;
}
tmpmap.put(nss.getPrefix(), nss);
}
if (attNS == null) {
// we cannot find a 'prevailing' namespace that has a prefix
// that is for this namespace.
// This basically means that there's an XMLSchema, for the
// DEFAULT namespace, and there's a defaulted/fixed
// attribute definition in the XMLSchema that's targeted
// for this namespace,... but, the user has either not
// declared a prefixed version of the namespace, or has
// re-declared the same prefix at a lower level with a
// different namespace.
// All of these things are possible.
// Create some sort of default prefix.
int cnt = 0;
String base = "attns";
String pfx = base + cnt;
while (tmpmap.containsKey(pfx)) {
cnt++;
pfx = base + cnt;
}
attNS = Namespace.getNamespace(pfx, attURI);
}
}
}
Attribute attribute =
factory.attribute(attLocalName, attvalue, attNS);
factory.setAttribute(element, attribute);
}
}
// Recurse on child nodes
// The list should never be null nor should it ever contain
// null nodes, but some DOM impls are broken
org.w3c.dom.NodeList children = node.getChildNodes();
if (children != null) {
int size = children.getLength();
for (int i = 0; i < size; i++) {
org.w3c.dom.Node item = children.item(i);
if (item != null) {
buildTree(item, doc, element, false);
}
}
}
break;
case org.w3c.dom.Node.TEXT_NODE:
factory.addContent(current, build((org.w3c.dom.Text)node));
break;
case org.w3c.dom.Node.CDATA_SECTION_NODE:
factory.addContent(current, build((org.w3c.dom.CDATASection)node));
break;
case org.w3c.dom.Node.PROCESSING_INSTRUCTION_NODE:
if (atRoot) {
factory.addContent(doc, build((org.w3c.dom.ProcessingInstruction)node));
} else {
factory.addContent(current, build((org.w3c.dom.ProcessingInstruction)node));
}
break;
case org.w3c.dom.Node.COMMENT_NODE:
if (atRoot) {
factory.addContent(doc, build((org.w3c.dom.Comment)node));
} else {
factory.addContent(current, build((org.w3c.dom.Comment)node));
}
break;
case org.w3c.dom.Node.ENTITY_REFERENCE_NODE:
factory.addContent(current, build((org.w3c.dom.EntityReference)node));
break;
case org.w3c.dom.Node.ENTITY_NODE:
// ??
break;
case org.w3c.dom.Node.DOCUMENT_TYPE_NODE:
factory.addContent(doc, build((org.w3c.dom.DocumentType)node));
break;
}
}
}
© 2015 - 2025 Weber Informatics LLC | Privacy Policy