org.jdom2.input.DOMBuilder Maven / Gradle / Ivy

Go to download
Show more of this group Show more artifacts with this name
Show all versions of jdom Show documentation
A complete, Java-based solution for accessing, manipulating, and outputting XML data
There is a newer version: 2.0.2
/*--

 Copyright (C) 2000-2012 Jason Hunter & Brett McLaughlin.
 All rights reserved.

 Redistribution and use in source and binary forms, with or without
 modification, are permitted provided that the following conditions
 are met:

 1. Redistributions of source code must retain the above copyright
    notice, this list of conditions, and the following disclaimer.

 2. Redistributions in binary form must reproduce the above copyright
    notice, this list of conditions, and the disclaimer that follows
    these conditions in the documentation and/or other materials
    provided with the distribution.

 3. The name "JDOM" must not be used to endorse or promote products
    derived from this software without prior written permission.  For
    written permission, please contact .

 4. Products derived from this software may not be called "JDOM", nor
    may "JDOM" appear in their name, without prior written permission
    from the JDOM Project Management .

 In addition, we request (but do not require) that you include in the
 end-user documentation provided with the redistribution and/or in the
 software itself an acknowledgement equivalent to the following:
     "This product includes software developed by the
      JDOM Project (http://www.jdom.org/)."
 Alternatively, the acknowledgment may be graphical using the logos
 available at http://www.jdom.org/images/logos.

 THIS SOFTWARE IS PROVIDED ``AS IS'' AND ANY EXPRESSED OR IMPLIED
 WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES
 OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
 DISCLAIMED.  IN NO EVENT SHALL THE JDOM AUTHORS OR THE PROJECT
 CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
 SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
 LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF
 USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND
 ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY,
 OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT
 OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
 SUCH DAMAGE.

 This software consists of voluntary contributions made by many
 individuals on behalf of the JDOM Project and was originally
 created by Jason Hunter  and
 Brett McLaughlin .  For more information
 on the JDOM Project, please see .

 */

package org.jdom2.input;

/*
 * To keep things simple, all DOM-based items are fully qualified in this code.
 * As such, there are no import org.w3c.dom.* statements...
 * This way there isless confusion about what a Document or Element is....
 */

import static org.jdom2.JDOMConstants.*;

import java.util.HashMap;

import org.jdom2.Attribute;
import org.jdom2.DefaultJDOMFactory;
import org.jdom2.DocType;
import org.jdom2.Document;
import org.jdom2.Element;
import org.jdom2.JDOMFactory;
import org.jdom2.Namespace;


/**
 * Builds a JDOM Document from a pre-existing DOM {@link org.w3c.dom.Document 
 * org.w3c.dom.Document}.
 * 
 * If you are building a document that has Namespace declarations, you should
 * ensure that the Namespaces are correctly recorded in the DOM document before
 * building the JDOM document from the DOM. By default, the native Java
 * DOMBuilderFactory is configured to ignore Namespaces, and thus they are
 * 'lost' in the DOM tree. JDOM expects Namespace-aware documents, so you
 * should ensure that you change the default settings on the
 * DOMBuilderFactory before parsing the DOM document. For example:
 * 

 * 
 *     DocumentBuilderFactory domfactory = DocumentBuilderFactory.newInstance();
 *     domfactory.setNamespaceAware(true);
 *     DocumentBuilder dombuilder = domfac.newDocumentBuilder();
 *     org.w3c.dom.Document doc = dombuilder.parse(....);
 * 
 * 
 * @author  Brett McLaughlin
 * @author  Jason Hunter
 * @author  Philip Nelson
 * @author  Kevin Regan
 * @author  Yusuf Goolamabbas
 * @author  Dan Schaffer
 * @author  Bradley S. Huffman
 */
public class DOMBuilder {

	/** The factory for creating new JDOM objects */
	private JDOMFactory factory = new DefaultJDOMFactory();

	/**
	 * This creates a new DOMBuilder instance using the DefaultJDOMFactory
	 * to build the JDOM content.
	 */
	public DOMBuilder() {
	}

	/**
	 * This sets a custom JDOMFactory for the builder.  Use this to build
	 * the tree with your own subclasses of the JDOM classes.
	 *
	 * @param factory JDOMFactory to use
	 */
	public void setFactory(JDOMFactory factory) {
		this.factory = factory;
	}

	/**
	 * Returns the current {@link org.jdom2.JDOMFactory} in use.
	 * @return the factory in use
	 */
	public JDOMFactory getFactory() {
		return factory;
	}

	/**
	 * This will build a JDOM tree from an existing DOM tree.
	 *
	 * @param domDocument org.w3c.dom.Document object
	 * @return Document - JDOM document object.
	 */
	public Document build(org.w3c.dom.Document domDocument) {
		Document doc = factory.document(null);
		buildTree(domDocument, doc, null, true);
		return doc;
	}

	/**
	 * This will build a JDOM Element from an existing DOM Element
	 *
	 * @param domElement  org.w3c.dom.Element object
	 * @return Element - JDOM Element object
	 */
	public org.jdom2.Element build(org.w3c.dom.Element domElement) {
		Document doc = factory.document(null);
		buildTree(domElement, doc, null, true);
		return doc.getRootElement();
	}
	
	/**
	 * This will build a JDOM CDATA from an existing DOM CDATASection
	 *
	 * @param cdata  org.w3c.dom.CDATASection object
	 * @return CDATA - JDOM CDATA object
	 * @since JDOM2
	 */
	public org.jdom2.CDATA build(org.w3c.dom.CDATASection cdata) {
		return factory.cdata(cdata.getTextContent());
	}
	
	/**
	 * This will build a JDOM Text from an existing DOM Text
	 *
	 * @param text  org.w3c.dom.Text object
	 * @return Text - JDOM Text object
	 * @since JDOM2
	 */
	public org.jdom2.Text build(org.w3c.dom.Text text) {
		return factory.text(text.getTextContent());
	}
	
	/**
	 * This will build a JDOM Comment from an existing DOM Comment
	 *
	 * @param comment  org.w3c.dom.Comment object
	 * @return Comment - JDOM Comment object
	 * @since JDOM2
	 */
	public org.jdom2.Comment build(org.w3c.dom.Comment comment) {
		return factory.comment(comment.getTextContent());
	}
	
	/**
	 * This will build a JDOM ProcessingInstruction from an existing DOM ProcessingInstruction
	 *
	 * @param pi  org.w3c.dom.ProcessingInstruction object
	 * @return ProcessingInstruction - JDOM ProcessingInstruction object
	 * @since JDOM2
	 */
	public org.jdom2.ProcessingInstruction build(org.w3c.dom.ProcessingInstruction pi) {
		return factory.processingInstruction(pi.getTarget(), pi.getData());
	}
	
	/**
	 * This will build a JDOM EntityRef from an existing DOM EntityReference
	 *
	 * @param er  org.w3c.dom.EntityReference object
	 * @return EnityRef - JDOM EntityRef object
	 * @since JDOM2
	 */
	public org.jdom2.EntityRef build(org.w3c.dom.EntityReference er) {
		return factory.entityRef(er.getNodeName());
	}
	
	/**
	 * This will build a JDOM Element from an existing DOM Element
	 *
	 * @param doctype  org.w3c.dom.Element object
	 * @return Element - JDOM Element object
	 * @since JDOM2
	 */
	public org.jdom2.DocType build(org.w3c.dom.DocumentType doctype) {
		String publicID = doctype.getPublicId();
		String systemID = doctype.getSystemId();
		String internalDTD = doctype.getInternalSubset();

		DocType docType = factory.docType(doctype.getName());
		docType.setPublicID(publicID);
		docType.setSystemID(systemID);
		docType.setInternalSubset(internalDTD);
		return docType;
	}
	
	

	/**
	 * This takes a DOM Node and builds up
	 * a JDOM tree, recursing until the DOM tree is exhausted
	 * and the JDOM tree results.
	 *
	 * @param node Code to examine.
	 * @param doc JDOM Document being built.
	 * @param current Element that is current parent.
	 * @param atRoot boolean indicating whether at root level.
	 */
	private void buildTree(org.w3c.dom.Node node,
			Document doc,
			Element current,
			boolean atRoot) {
		// Recurse through the tree
		switch (node.getNodeType()) {
			case org.w3c.dom.Node.DOCUMENT_NODE:
				org.w3c.dom.NodeList nodes = node.getChildNodes();
				for (int i=0, size=nodes.getLength(); i= 0) {
					prefix = nodeName.substring(0, colon);
					localName = nodeName.substring(colon + 1);
				}

				// Get element's namespace
				Namespace ns = null;
				String uri = node.getNamespaceURI();
				if (uri == null) {
					ns = (current == null) ? Namespace.NO_NAMESPACE
							: current.getNamespace(prefix);
				}
				else {
					ns = Namespace.getNamespace(prefix, uri);
				}

				Element element = factory.element(localName, ns);

				if (atRoot) {
					// If at root, set as document root
					factory.setRoot(doc, element);
				} else {
					// else add to parent element
					factory.addContent(current, element);
				}

				// Add namespaces
				org.w3c.dom.NamedNodeMap attributeList = node.getAttributes();
				int attsize = attributeList.getLength();

				for (int i = 0; i < attsize; i++) {
					org.w3c.dom.Attr att = (org.w3c.dom.Attr) attributeList.item(i);

					String attname = att.getName();
					if (attname.startsWith(NS_PREFIX_XMLNS)) {
						String attPrefix = NS_PREFIX_DEFAULT;
						colon = attname.indexOf(':');
						if (colon >= 0) {
							attPrefix = attname.substring(colon + 1);
						}

						String attvalue = att.getValue();

						Namespace declaredNS =
								Namespace.getNamespace(attPrefix, attvalue);

						// Add as additional namespaces if it's different
						// to this element's namespace (perhaps we should
						// also have logic not to mark them as additional if
						// it's been done already, but it probably doesn't
						// matter)
						if (prefix.equals(attPrefix)) {
							// RL: note, it should also be true that uri.equals(attvalue)
							// if not, then the parser is boken.
							// further, declaredNS should be exactly the same as ns
							// so the following should in fact do nothing.
							element.setNamespace(declaredNS);
						}
						else {
							factory.addNamespaceDeclaration(element, declaredNS);
						}
					}
				}

				// Add attributes
				for (int i = 0; i < attsize; i++) {
					org.w3c.dom.Attr att = (org.w3c.dom.Attr) attributeList.item(i);

					String attname = att.getName();

					if ( !attname.startsWith(NS_PREFIX_XMLNS)) {
						String attPrefix = NS_PREFIX_DEFAULT;
						String attLocalName = attname;
						colon = attname.indexOf(':');
						if (colon >= 0) {
							attPrefix = attname.substring(0, colon);
							attLocalName = attname.substring(colon + 1);
						}

						String attvalue = att.getValue();

						// Get attribute's namespace
						Namespace attNS = null;
						String attURI = att.getNamespaceURI(); 
						if (attURI == null || NS_URI_DEFAULT.equals(attURI)) {
							attNS = Namespace.NO_NAMESPACE;
						} else {
							// various conditions can lead here.
							// the logical one is that we have a prefix for the
							// attribute, and also a namespace URI.
							// The alternative to that is in some conditions,
							// the parser could have a 'default' or 'fixed'
							// attribute that comes from an XSD used for
							// validation. In that case there may not be a prefix
							// There's also the possibility the DOM contains
							// garbage.
							if (attPrefix.length() > 0) {
								// If the att has a prefix, we can assume that
								// the DOM is valid, and we can just use the prefix.
								// if this prefix conflicts with some other namespace
								// then we re-declare it. If redeclaring it screws up
								// other attributes in this Element, then the DOM
								// was broken to start with.
								attNS = Namespace.getNamespace(attPrefix, attURI);
							} else {
								// OK, no prefix.
								// must be a defaulted value from an XSD.
								// perhaps we can find the namespace in our
								// element's ancestry, and use the prefix from that.
								HashMap tmpmap = new HashMap();
								for(Namespace nss : element.getNamespacesInScope()) {
									if (nss.getPrefix().length() > 0 && nss.getURI().equals(attURI)) {
										attNS = nss;
										break;
									}
									tmpmap.put(nss.getPrefix(), nss);
								}
								if (attNS == null) {
									// we cannot find a 'prevailing' namespace that has a prefix
									// that is for this namespace.
									// This basically means that there's an XMLSchema, for the
									// DEFAULT namespace, and there's a defaulted/fixed
									// attribute definition in the XMLSchema that's targeted
									// for this namespace,... but, the user has either not
									// declared a prefixed version of the namespace, or has
									// re-declared the same prefix at a lower level with a
									// different namespace.
									// All of these things are possible.
									// Create some sort of default prefix.
									int cnt = 0;
									String base = "attns";
									String pfx = base + cnt;
									while (tmpmap.containsKey(pfx)) {
										cnt++;
										pfx = base + cnt;
									}
									attNS = Namespace.getNamespace(pfx, attURI);
								}
							}
						}

						Attribute attribute =
								factory.attribute(attLocalName, attvalue, attNS);
						factory.setAttribute(element, attribute);
					}
				}

				// Recurse on child nodes
				// The list should never be null nor should it ever contain
				// null nodes, but some DOM impls are broken
				org.w3c.dom.NodeList children = node.getChildNodes();
				if (children != null) {
					int size = children.getLength();
					for (int i = 0; i < size; i++) {
						org.w3c.dom.Node item = children.item(i);
						if (item != null) {
							buildTree(item, doc, element, false);
						}
					}
				}
				break;

			case org.w3c.dom.Node.TEXT_NODE:
				factory.addContent(current, build((org.w3c.dom.Text)node));
				break;

			case org.w3c.dom.Node.CDATA_SECTION_NODE:
				factory.addContent(current, build((org.w3c.dom.CDATASection)node));
				break;


			case org.w3c.dom.Node.PROCESSING_INSTRUCTION_NODE:
				if (atRoot) {
					factory.addContent(doc, build((org.w3c.dom.ProcessingInstruction)node));
				} else {
					factory.addContent(current, build((org.w3c.dom.ProcessingInstruction)node));
				}
				break;

			case org.w3c.dom.Node.COMMENT_NODE:
				if (atRoot) {
					factory.addContent(doc, build((org.w3c.dom.Comment)node));
				} else {
					factory.addContent(current, build((org.w3c.dom.Comment)node));
				}
				break;

			case org.w3c.dom.Node.ENTITY_REFERENCE_NODE:
				factory.addContent(current, build((org.w3c.dom.EntityReference)node));
				break;

			case org.w3c.dom.Node.ENTITY_NODE:
				// ??
						break;

			case org.w3c.dom.Node.DOCUMENT_TYPE_NODE:

				factory.addContent(doc, build((org.w3c.dom.DocumentType)node));
				break;
		}
	}
}