net.sf.saxon.om.NodeInfo Maven / Gradle / Ivy

Go to download
Show more of this group Show more artifacts with this name
Show all versions of saxon-he Show documentation
An OSGi bundle for Saxon-HE
There is a newer version: 10.5
////////////////////////////////////////////////////////////////////////////////////////////////////////////////////
// Copyright (c) 2013 Saxonica Limited.
// This Source Code Form is subject to the terms of the Mozilla Public License, v. 2.0.
// If a copy of the MPL was not distributed with this file, You can obtain one at http://mozilla.org/MPL/2.0/.
// This Source Code Form is "Incompatible With Secondary Licenses", as defined by the Mozilla Public License, v. 2.0.
////////////////////////////////////////////////////////////////////////////////////////////////////////////////////

package net.sf.saxon.om;

import net.sf.saxon.Configuration;
import net.sf.saxon.event.Receiver;
import net.sf.saxon.pattern.NodeTest;
import net.sf.saxon.trans.XPathException;
import net.sf.saxon.tree.iter.AxisIterator;
import net.sf.saxon.tree.util.FastStringBuffer;
import net.sf.saxon.type.SchemaType;

import javax.xml.transform.Source;

/**
 * The NodeInfo interface represents a node in Saxon's implementation of the XPath 2.0 data model.
 * 
 * Note that several NodeInfo objects may represent the same node. To test node identity, the
 * method {@link #isSameNodeInfo(NodeInfo)} should be used. An exception to this rule applies for
 * document nodes, where the correspondence between document nodes and DocumentInfo objects is one to
 * one. NodeInfo objects are never reused: a given NodeInfo object represents the same node for its entire
 * lifetime.
 * 

 * This is the primary interface for accessing trees in Saxon, and it forms part of the public
 * Saxon API. The only subclass of NodeInfo that applications should normally use is {@link DocumentInfo},
 * which represents a document node. Methods that form part of the public API are (since Saxon 8.4)
 * labelled with a JavaDoc "since" tag: classes and methods that have no such label should not be
 * regarded as stable interfaces.
 * 

 * The interface represented by this class is at a slightly higher level than the abstraction described
 * in the W3C data model specification, in that it includes support for the XPath axes, rather than exposing
 * the lower-level properties (such as "parent" and "children") directly. All navigation within trees,
 * except for a few convenience methods, is done by following the axes using the {@link #iterateAxis} method.
 * This allows different implementations of the XPath tree model to implement axis navigation in different ways.
 * Some implementations may choose to use the helper methods provided in class {@link net.sf.saxon.tree.util.Navigator}.
 * 

 * Note that the stability of this interface applies to classes that use the interface,
 * not to classes that implement it. The interface may be extended in future to add new methods.
 * 

 * New implementations of NodeInfo are advised also to implement the methods in interface
 * ExtendedNodeInfo, which will be moved into this interface at some time in the future.
 *
 * @author Michael H. Kay
 * @since 8.4. Extended with three extra methods, previously in ExtendedNodeInfo, in 9.1
 */

public interface NodeInfo extends Source, Item {

    /**
     * Get the kind of node. This will be a value such as {@link net.sf.saxon.type.Type#ELEMENT}
     * or {@link net.sf.saxon.type.Type#ATTRIBUTE}. There are seven kinds of node: documents, elements, attributes,
     * text, comments, processing-instructions, and namespaces.
     *
     * @return an integer identifying the kind of node. These integer values are the
     * same as those used in the DOM
     * @see net.sf.saxon.type.Type
     * @since 8.4
     */

    public int getNodeKind();

    /**
     * Determine whether this is the same node as another node.
     * 

     * Note that two different NodeInfo instances can represent the same conceptual node.
     * Therefore the "==" operator should not be used to test node identity. The equals()
     * method should give the same result as isSameNodeInfo(), but since this rule was introduced
     * late it might not apply to all implementations.
     * 

     * Note: a.isSameNodeInfo(b) if and only if generateId(a)==generateId(b).
     * 

     * This method has the same semantics as isSameNode() in DOM Level 3, but
     * works on Saxon NodeInfo objects rather than DOM Node objects.
     *
     * @param other the node to be compared with this node
     * @return true if this NodeInfo object and the supplied NodeInfo object represent
     *      the same node in the tree.
     */

    public boolean isSameNodeInfo(NodeInfo other);

    /**
     * The equals() method compares nodes for identity. It is defined to give the same result
     * as isSameNodeInfo().
     * @param other the node to be compared with this node
     * @return true if this NodeInfo object and the supplied NodeInfo object represent
     *      the same node in the tree.
     * @since 8.7 Previously, the effect of the equals() method was not defined. Callers
     * should therefore be aware that third party implementations of the NodeInfo interface may
     * not implement the correct semantics. It is safer to use isSameNodeInfo() for this reason.
     * The equals() method has been defined because it is useful in contexts such as a Java Set or HashMap.
     */

    public boolean equals(Object other);

    /**
     * The hashCode() method obeys the contract for hashCode(): that is, if two objects are equal
     * (represent the same node) then they must have the same hashCode()
     * @since 8.7 Previously, the effect of the equals() and hashCode() methods was not defined. Callers
     * should therefore be aware that third party implementations of the NodeInfo interface may
     * not implement the correct semantics.
     */

    public int hashCode();

    /**
     * Get the System ID for the node. Note this is not the
     * same as the base URI: the base URI can be modified by xml:base, but
     * the system ID cannot. The base URI is used primarily for resolving
     * relative URIs within the content of the document. The system ID is
     * used primarily in conjunction with a line number, for identifying the
     * location of elements within the source XML, in particular when errors
     * are found. For a document node, the System ID represents the value of
     * the document-uri property as defined in the XDM data model.
     *
     * @return the System Identifier of the entity in the source document
     * containing the node, or null if not known or not applicable.
     * @since 8.4
     */

    /*@Nullable*/ public String getSystemId();

    /**
     * Get the Base URI for the node, that is, the URI used for resolving a relative URI contained
     * in the node. This will be the same as the System ID unless xml:base has been used. Where the
     * node does not have a base URI of its own, the base URI of its parent node is returned.
     *
     * @return the base URI of the node. This may be null if the base URI is unknown, including the case
     * where the node has no parent.
     * @since 8.4
     */

    public String getBaseURI();

    /**
     * Get line number. Line numbers are not maintained by default, except for
     * stylesheets and schema documents. Line numbering can be requested using the
     * -l option on the command line, or by setting options on the TransformerFactory
     * or the Configuration before the source document is built.
     * 

     * The granularity of line numbering is normally the element level: for other nodes
     * such as text nodes and attributes, the line number of the parent element will normally be returned.
     * 

     * In the case of a tree constructed by taking input from a SAX parser, the line number will reflect the
     * SAX rules: that is, the line number of an element is the line number where the start tag ends. This
     * may be a little confusing where elements have many attributes spread over multiple lines, or where
     * single attributes (as can easily happen with XSLT 2.0 stylesheets) occupy several lines.
     * 

     * In the case of a tree constructed by a stylesheet or query, the line number may reflect the line in
     * the stylesheet or query that caused the node to be constructed.
     * 

     * The line number can be read from within an XPath expression using the Saxon extension function
     * saxon:line-number()
     *
     * @return the line number of the node in its original source document; or
     *      -1 if not available
     * @since 8.4
     */

    public int getLineNumber();

    /**
     * Get column number. Column numbers are not maintained by default. Column numbering
     * can be requested in the same way as line numbering; but a tree implementation can ignore
     * the request.
     * 

     * The granularity of column numbering is normally the element level: for other nodes
     * such as text nodes and attributes, the line number of the parent element will normally be returned.
     * 

     * In the case of a tree constructed by taking input from a SAX parser, the column number will reflect the
     * SAX rules: that is, the column number of an element is the column number where the start tag ends. This
     * may be a little confusing where elements have many attributes spread over multiple lines, or where
     * single attributes (as can easily happen with XSLT 2.0 stylesheets) occupy several lines.
     * 

     * In the case of a tree constructed by a stylesheet or query, the column number may reflect the line in
     * the stylesheet or query that caused the node to be constructed.
     * 

     * The column number can be read from within an XPath expression using the Saxon extension function
     * saxon:column-number()
     *
     * @return the column number of the node in its original source document; or
     *      -1 if not available
     * @since 9.1
     */

    public int getColumnNumber();

    /**
     * Determine the relative position of this node and another node, in document order.
     * 

     * The other node must always be in the same tree; the effect of calling this method
     * when the two nodes are in different trees is undefined. To obtain a global ordering
     * of nodes, the application should first compare the result of getDocumentNumber(),
     * and only if the document number is the same should compareOrder() be called.
     *
     * @param other The other node, whose position is to be compared with this
     *      node
     * @return -1 if this node precedes the other node, +1 if it follows the
     *     other node, or 0 if they are the same node. (In this case,
     *     isSameNode() will always return true, and the two nodes will
     *     produce the same result for generateId())
     * @since 8.4
     */

    public int compareOrder(NodeInfo other);

    /**
     * Determine the relative position of this node and another node, in document order,
     * distinguishing whether the first node is a preceding, following, descendant, ancestor,
     * or the same node as the second.
     * 

     * The other node must always be in the same tree; the effect of calling this method
     * when the two nodes are in different trees is undefined. If either node is a namespace
     * or attribute node, the method should throw UnsupportedOperationException.
     *
     * @param other The other node, whose position is to be compared with this
     *      node
     * @return {@link AxisInfo#PRECEDING} if this node is on the preceding axis of the other node;
     * {@link AxisInfo#FOLLOWING} if it is on the following axis; {@link AxisInfo#ANCESTOR} if the first node is an
     * ancestor of the second; {@link AxisInfo#DESCENDANT} if the first is a descendant of the second;
     * {@link AxisInfo#SELF} if they are the same node.
     * @throws UnsupportedOperationException if either node is an attribute or namespace
     * @since 9.5
     */

    public int comparePosition(NodeInfo other);

    /**
     * Return the string value of the node as defined in the XPath data model.
     * 

     * The interpretation of this depends on the type
     * of node. For an element it is the accumulated character content of the element,
     * including descendant elements.
     * 

     * This method returns the string value as if the node were untyped. Unlike the string value
     * accessor in the XPath 2.0 data model, it does not report an error if the element has a complex
     * type, instead it returns the concatenation of the descendant text nodes as it would if the element
     * were untyped.
     *
     * @return the string value of the node
     * @since 8.4
     */

    public String getStringValue();

	/**
	 * Get name code. The name code is a coded form of the node name: two nodes
	 * with the same name code have the same namespace URI, the same local name,
	 * and the same prefix. By masking the name code with {@link NamePool#FP_MASK}, you get a
	 * fingerprint: two nodes with the same fingerprint have the same local name
	 * and namespace URI.
	 *
	 * @return an integer name code, which may be used to obtain the actual node
	 *     name from the name pool. For unnamed nodes (text nodes, comments, document nodes,
     *     and namespace nodes for the default namespace), returns -1.
	 * @see net.sf.saxon.om.NamePool#allocate allocate
	 * @see net.sf.saxon.om.NamePool#getFingerprint getFingerprint
     * @since 8.4
	 */

	public int getNameCode();

	/**
	 * Get fingerprint. The fingerprint is a coded form of the expanded name
	 * of the node: two nodes
	 * with the same name code have the same namespace URI and the same local name.
     * The fingerprint contains no information about the namespace prefix. For a name
     * in the null namespace, the fingerprint is the same as the name code.
	 *
	 * @return an integer fingerprint; two nodes with the same fingerprint have
	 *     the same expanded QName. For unnamed nodes (text nodes, comments, document nodes,
     *     and namespace nodes for the default namespace), returns -1.
     * @since 8.4
	 */

	public int getFingerprint();

    /**
     * Get the local part of the name of this node. This is the name after the ":" if any.
     *
     * @return the local part of the name. For an unnamed node, returns "". Unlike the DOM
     * interface, this returns the full name in the case of a non-namespaced name.
     * @since 8.4
     */

    public String getLocalPart();

    /**
     * Get the URI part of the name of this node. This is the URI corresponding to the
     * prefix, or the URI of the default namespace if appropriate.
     *
     * @return The URI of the namespace of this node. For an unnamed node,
     *     or for an element or attribute that is not in a namespace, or for a processing
     *     instruction, returns an empty string.
     * @since 8.4
     */

    public String getURI();

    /**
     * Get the display name of this node, in the form of a lexical QName.
     * For elements and attributes this is [prefix:]localname.
     * For unnamed nodes, it is an empty string.
     *
     * @return The display name of this node. For a node with no name, returns
     *     an empty string.
     * @since 8.4
     */

    public String getDisplayName();

    /**
     * Get the prefix of the name of the node. This is defined only for elements and attributes.
     * If the node has no prefix, or for other kinds of node, returns a zero-length string.
     * @return The prefix of the name of the node.
     * @since 8.4
     */

    public String getPrefix();

    /**
     * Get the configuration used to build the tree containing this node.
     * @return the Configuration
     * @since 8.4
     */

    public Configuration getConfiguration();

   /**
    * Get the NamePool that holds the namecode for this node
    * @return the namepool
    * @since 8.4
    */

    public NamePool getNamePool();

    /**
     * Get the type annotation of this node, if any. The type annotation is represented as an integer;
     * this is the fingerprint of the name of the type, as defined in the name pool. Anonymous types
     * are given a system-defined name. The value of the type annotation can be used to retrieve the
     * actual schema type definition using the method {@link Configuration#getSchemaType}.
     * 

     * The bit IS_DTD_TYPE (1<<30) will be set in the case of an attribute node if the type annotation
     * is one of ID, IDREF, or IDREFS and this is derived from DTD rather than schema validation.
     *
     * @return the type annotation of the node, under the mask NamePool.FP_MASK, and optionally the
     * bit setting IS_DTD_TYPE in the case of a DTD-derived ID or IDREF/S type (which is treated
     * as untypedAtomic for the purposes of obtaining the typed value).
     *
     * 
For elements and attributes, this is the type annotation as defined in XDM. For document
     * nodes, it should be one of XS_UNTYPED if the document has not been validated, or XS_ANY_TYPE
     * if validation has taken place (that is, if any node in the document has an annotation other than
     * Untyped or UntypedAtomic).
     * @since 8.4. Refinement for document nodes introduced in 9.2
     */

    public int getTypeAnnotation();

    /**
     * Get the type annotation of this node, if any. The type annotation is represented as
     * SchemaType object.
     *
     * Types derived from a DTD are not reflected in the result of this method.
     *
     * @return For element and attribute nodes: the type annotation derived from schema
     * validation (defaulting to xs:untyped and xs:untypedAtomic in the absence of schema
     * validation). For comments, text nodes, processing instructions, and namespaces: null.
     * For document nodes, either xs:untyped if the document has not been validated, or
     * xs:anyType if it has.
     * @since 9.4
     */

    public SchemaType getSchemaType();


    /**
     * Bit setting in the returned type annotation indicating a DTD_derived type on an attribute node
     */

    public static int IS_DTD_TYPE = 1<<30;

    /**
     * Bit setting for use alongside a type annotation indicating that the is-nilled property is set
     */

    public static int IS_NILLED = 1<<29;


    /**
     * Get the typed value. This will either be a single AtomicValue or a value whose items are
     * atomic values.
     * @since 8.5. Changed in 9.5 to return the new type AtomicSequence.
     * @throws XPathException if the node has no typed value, for example if
     * it is an element node with element-only content
     */

    public AtomicSequence atomize() throws XPathException;

    /**
     * Get the NodeInfo object representing the parent of this node
     *
     * @return the parent of this node; null if this node has no parent
     * @since 8.4
     */

    /*@Nullable*/ public NodeInfo getParent();

    /**
     * Return an iteration over all the nodes reached by the given axis from this node
     *
     * @param axisNumber an integer identifying the axis; one of the constants
     *      defined in class {@link AxisInfo}
     * @return an AxisIterator that delivers the nodes reached by the axis in
     *     turn. The nodes are returned in axis order (document order for a forwards
     *     axis, reverse document order for a reverse axis).
     * @see AxisInfo
     * @throws UnsupportedOperationException if the namespace axis is
     *     requested and this axis is not supported for this implementation.
     * @since 8.4
     */

    public AxisIterator iterateAxis(byte axisNumber);


    /**
     * Return an iteration over all the nodes reached by the given axis from this node
     * that match a given NodeTest
     *
     * @exception UnsupportedOperationException if the namespace axis is
     *      requested and this axis is not supported for this implementation.
     * @param axisNumber an integer identifying the axis; one of the constants
     *      defined in class {@link AxisInfo}
     * @param nodeTest A condition to be satisfied by the returned nodes; nodes
     *      that do not satisfy this condition are not included in the result
     * @return an AxisIterator that delivers the nodes reached by the axis in
     *     turn.  The nodes are returned in axis order (document order for a forwards
     *     axis, reverse document order for a reverse axis).
     * @see AxisInfo
     * @since 8.4
     */

    public AxisIterator iterateAxis(byte axisNumber, NodeTest nodeTest);

    /**
     * Get the string value of a given attribute of this node
     *
     * @param uri the namespace URI of the attribute name. Supply the empty string for an attribute
     * that is in no namespace
     * @param local the local part of the attribute name.
     * @return the attribute value if it exists, or null if it does not exist. Always returns null
     * if this node is not an element.
     * @since 9.4
     */

    /*@Nullable*/ public String getAttributeValue(/*@NotNull*/ String uri, /*@NotNull*/ String local);

    /**
     * Get the root node of the tree containing this node
     *
     * @return the NodeInfo representing the top-level ancestor of this node.
     *     This will not necessarily be a document node. If this node has no parent,
     *     then the method returns this node.
     * @since 8.4
     */

    public NodeInfo getRoot();

    /**
     * Get the root node, if it is a document node.
     *
     * @return the DocumentInfo representing the containing document. If this
     *     node is part of a tree that does not have a document node as its
     *     root, returns null.
     * @since 8.4
     */

    /*@Nullable*/ public DocumentInfo getDocumentRoot();

    /**
     * Determine whether the node has any children.
     * 
     * Note: the result is equivalent to 

     * iterateAxis(Axis.CHILD).next() != null
     *
     * @return True if the node has one or more children
     * @since 8.4
     */

    public boolean hasChildNodes();

    /**
     * Construct a character string that uniquely identifies this node.
     * Note: a.isSameNode(b) if and only if generateId(a)==generateId(b)
     *
     * @param buffer a buffer which will be updated to hold a string
     *     that uniquely identifies this node, across all documents.
     * @since 8.7
     *     
Changed in Saxon 8.7 to generate the ID value in a client-supplied buffer
     */

    public void generateId(FastStringBuffer buffer);

    /**
     * Get the document number of the document containing this node. For a free-standing
     * orphan node, just return the hashcode.
     * @return the document number of the document containing this node
     * @since 8.4
     */

    public long getDocumentNumber();

    /**
     * Copy this node to a given Receiver.
     * 
     * This method is primarily for internal use. It should not be considered a stable
     * part of the Saxon API.
     *
     * @param out the Receiver to which the node should be copied. It is the caller's
     *     responsibility to ensure that this Receiver is open before the method is called
     *     (or that it is self-opening), and that it is closed after use.
     * @param copyOptions a selection of the options defined in {@link net.sf.saxon.om.CopyOptions}
     * @param locationId If non-zero, identifies the location of the instruction
*     that requested this copy. If zero, indicates that the location information
     * @throws XPathException if any downstream error occurs
     */

    public void copy(Receiver out, int copyOptions, int locationId) throws XPathException;

    /**
     * Don't copy any namespace nodes.
     */

    public static final int NO_NAMESPACES = 0;

    /**
     * Copy namespaces declared (or undeclared) on this element, but not namespaces inherited from a parent element
     */
    public static final int LOCAL_NAMESPACES = 1;

    /**
     * Copy all in-scope namespaces
     */
    public static final int ALL_NAMESPACES = 2;

    /**
     * Get all namespace declarations and undeclarations defined on this element.
     * 

     * This method is intended primarily for internal use. User applications needing
     * information about the namespace context of a node should use iterateAxis(Axis.NAMESPACE).
     * (However, not all implementations support the namespace axis, whereas all implementations are
     * required to support this method.)
     *
     * @param buffer If this is non-null, and the result array fits in this buffer, then the result
     * may overwrite the contents of this array, to avoid the cost of allocating a new array on the heap.
     * @return An array of integers representing the namespace declarations and undeclarations present on
     * this element. For a node other than an element, return null. Otherwise, the returned array is a
     * sequence of namespace codes, whose meaning may be interpreted by reference to the name pool. The
     * top half word of each namespace code represents the prefix, the bottom half represents the URI.
     * If the bottom half is zero, then this is a namespace undeclaration rather than a declaration.
     * The XML namespace is never included in the list. If the supplied array is larger than required,
     * then the first unused entry will be set to -1.
     * 

     * For a node other than an element, the method returns null.
     */

    public NamespaceBinding[] getDeclaredNamespaces(/*@Nullable*/ NamespaceBinding[] buffer);

    /**
     * Determine whether this node has the is-id property
     * @return true if the node is an ID
     */

    public boolean isId();

    /**
     * Determine whether this node has the is-idref property
     * @return true if the node is an IDREF or IDREFS element or attribute
     */

    public boolean isIdref();

    /**
     * Determine whether the node has the is-nilled property
     * @return true if the node has the is-nilled property
     */

    public boolean isNilled();

}