net.sf.saxon.om.NodeInfo Maven / Gradle / Ivy
Show all versions of saxon-he Show documentation
////////////////////////////////////////////////////////////////////////////////////////////////////////////////////
// Copyright (c) 2013 Saxonica Limited.
// This Source Code Form is subject to the terms of the Mozilla Public License, v. 2.0.
// If a copy of the MPL was not distributed with this file, You can obtain one at http://mozilla.org/MPL/2.0/.
// This Source Code Form is "Incompatible With Secondary Licenses", as defined by the Mozilla Public License, v. 2.0.
////////////////////////////////////////////////////////////////////////////////////////////////////////////////////
package net.sf.saxon.om;
import net.sf.saxon.Configuration;
import net.sf.saxon.event.Receiver;
import net.sf.saxon.pattern.NodeTest;
import net.sf.saxon.trans.XPathException;
import net.sf.saxon.tree.iter.AxisIterator;
import net.sf.saxon.tree.util.FastStringBuffer;
import net.sf.saxon.type.SchemaType;
import javax.xml.transform.Source;
/**
* The NodeInfo interface represents a node in Saxon's implementation of the XPath 2.0 data model.
*
* Note that several NodeInfo objects may represent the same node. To test node identity, the
* method {@link #isSameNodeInfo(NodeInfo)} should be used. An exception to this rule applies for
* document nodes, where the correspondence between document nodes and DocumentInfo objects is one to
* one. NodeInfo objects are never reused: a given NodeInfo object represents the same node for its entire
* lifetime.
*
* This is the primary interface for accessing trees in Saxon, and it forms part of the public
* Saxon API. The only subclass of NodeInfo that applications should normally use is {@link DocumentInfo},
* which represents a document node. Methods that form part of the public API are (since Saxon 8.4)
* labelled with a JavaDoc "since" tag: classes and methods that have no such label should not be
* regarded as stable interfaces.
*
* The interface represented by this class is at a slightly higher level than the abstraction described
* in the W3C data model specification, in that it includes support for the XPath axes, rather than exposing
* the lower-level properties (such as "parent" and "children") directly. All navigation within trees,
* except for a few convenience methods, is done by following the axes using the {@link #iterateAxis} method.
* This allows different implementations of the XPath tree model to implement axis navigation in different ways.
* Some implementations may choose to use the helper methods provided in class {@link net.sf.saxon.tree.util.Navigator}.
*
* Note that the stability of this interface applies to classes that use the interface,
* not to classes that implement it. The interface may be extended in future to add new methods.
*
* New implementations of NodeInfo are advised also to implement the methods in interface
* ExtendedNodeInfo, which will be moved into this interface at some time in the future.
*
* @author Michael H. Kay
* @since 8.4. Extended with three extra methods, previously in ExtendedNodeInfo, in 9.1
*/
public interface NodeInfo extends Source, Item {
/**
* Get the kind of node. This will be a value such as {@link net.sf.saxon.type.Type#ELEMENT}
* or {@link net.sf.saxon.type.Type#ATTRIBUTE}. There are seven kinds of node: documents, elements, attributes,
* text, comments, processing-instructions, and namespaces.
*
* @return an integer identifying the kind of node. These integer values are the
* same as those used in the DOM
* @see net.sf.saxon.type.Type
* @since 8.4
*/
public int getNodeKind();
/**
* Determine whether this is the same node as another node.
*
* Note that two different NodeInfo instances can represent the same conceptual node.
* Therefore the "==" operator should not be used to test node identity. The equals()
* method should give the same result as isSameNodeInfo(), but since this rule was introduced
* late it might not apply to all implementations.
*
* Note: a.isSameNodeInfo(b) if and only if generateId(a)==generateId(b).
*
* This method has the same semantics as isSameNode() in DOM Level 3, but
* works on Saxon NodeInfo objects rather than DOM Node objects.
*
* @param other the node to be compared with this node
* @return true if this NodeInfo object and the supplied NodeInfo object represent
* the same node in the tree.
*/
public boolean isSameNodeInfo(NodeInfo other);
/**
* The equals() method compares nodes for identity. It is defined to give the same result
* as isSameNodeInfo().
* @param other the node to be compared with this node
* @return true if this NodeInfo object and the supplied NodeInfo object represent
* the same node in the tree.
* @since 8.7 Previously, the effect of the equals() method was not defined. Callers
* should therefore be aware that third party implementations of the NodeInfo interface may
* not implement the correct semantics. It is safer to use isSameNodeInfo() for this reason.
* The equals() method has been defined because it is useful in contexts such as a Java Set or HashMap.
*/
public boolean equals(Object other);
/**
* The hashCode() method obeys the contract for hashCode(): that is, if two objects are equal
* (represent the same node) then they must have the same hashCode()
* @since 8.7 Previously, the effect of the equals() and hashCode() methods was not defined. Callers
* should therefore be aware that third party implementations of the NodeInfo interface may
* not implement the correct semantics.
*/
public int hashCode();
/**
* Get the System ID for the node. Note this is not the
* same as the base URI: the base URI can be modified by xml:base, but
* the system ID cannot. The base URI is used primarily for resolving
* relative URIs within the content of the document. The system ID is
* used primarily in conjunction with a line number, for identifying the
* location of elements within the source XML, in particular when errors
* are found. For a document node, the System ID represents the value of
* the document-uri property as defined in the XDM data model.
*
* @return the System Identifier of the entity in the source document
* containing the node, or null if not known or not applicable.
* @since 8.4
*/
/*@Nullable*/ public String getSystemId();
/**
* Get the Base URI for the node, that is, the URI used for resolving a relative URI contained
* in the node. This will be the same as the System ID unless xml:base has been used. Where the
* node does not have a base URI of its own, the base URI of its parent node is returned.
*
* @return the base URI of the node. This may be null if the base URI is unknown, including the case
* where the node has no parent.
* @since 8.4
*/
public String getBaseURI();
/**
* Get line number. Line numbers are not maintained by default, except for
* stylesheets and schema documents. Line numbering can be requested using the
* -l option on the command line, or by setting options on the TransformerFactory
* or the Configuration before the source document is built.
*
* The granularity of line numbering is normally the element level: for other nodes
* such as text nodes and attributes, the line number of the parent element will normally be returned.
*
* In the case of a tree constructed by taking input from a SAX parser, the line number will reflect the
* SAX rules: that is, the line number of an element is the line number where the start tag ends. This
* may be a little confusing where elements have many attributes spread over multiple lines, or where
* single attributes (as can easily happen with XSLT 2.0 stylesheets) occupy several lines.
*
* In the case of a tree constructed by a stylesheet or query, the line number may reflect the line in
* the stylesheet or query that caused the node to be constructed.
*
* The line number can be read from within an XPath expression using the Saxon extension function
* saxon:line-number()
*
* @return the line number of the node in its original source document; or
* -1 if not available
* @since 8.4
*/
public int getLineNumber();
/**
* Get column number. Column numbers are not maintained by default. Column numbering
* can be requested in the same way as line numbering; but a tree implementation can ignore
* the request.
*
* The granularity of column numbering is normally the element level: for other nodes
* such as text nodes and attributes, the line number of the parent element will normally be returned.
*
* In the case of a tree constructed by taking input from a SAX parser, the column number will reflect the
* SAX rules: that is, the column number of an element is the column number where the start tag ends. This
* may be a little confusing where elements have many attributes spread over multiple lines, or where
* single attributes (as can easily happen with XSLT 2.0 stylesheets) occupy several lines.
*
* In the case of a tree constructed by a stylesheet or query, the column number may reflect the line in
* the stylesheet or query that caused the node to be constructed.
*
* The column number can be read from within an XPath expression using the Saxon extension function
* saxon:column-number()
*
* @return the column number of the node in its original source document; or
* -1 if not available
* @since 9.1
*/
public int getColumnNumber();
/**
* Determine the relative position of this node and another node, in document order.
*
* The other node must always be in the same tree; the effect of calling this method
* when the two nodes are in different trees is undefined. To obtain a global ordering
* of nodes, the application should first compare the result of getDocumentNumber(),
* and only if the document number is the same should compareOrder() be called.
*
* @param other The other node, whose position is to be compared with this
* node
* @return -1 if this node precedes the other node, +1 if it follows the
* other node, or 0 if they are the same node. (In this case,
* isSameNode() will always return true, and the two nodes will
* produce the same result for generateId())
* @since 8.4
*/
public int compareOrder(NodeInfo other);
/**
* Determine the relative position of this node and another node, in document order,
* distinguishing whether the first node is a preceding, following, descendant, ancestor,
* or the same node as the second.
*
* The other node must always be in the same tree; the effect of calling this method
* when the two nodes are in different trees is undefined. If either node is a namespace
* or attribute node, the method should throw UnsupportedOperationException.
*
* @param other The other node, whose position is to be compared with this
* node
* @return {@link AxisInfo#PRECEDING} if this node is on the preceding axis of the other node;
* {@link AxisInfo#FOLLOWING} if it is on the following axis; {@link AxisInfo#ANCESTOR} if the first node is an
* ancestor of the second; {@link AxisInfo#DESCENDANT} if the first is a descendant of the second;
* {@link AxisInfo#SELF} if they are the same node.
* @throws UnsupportedOperationException if either node is an attribute or namespace
* @since 9.5
*/
public int comparePosition(NodeInfo other);
/**
* Return the string value of the node as defined in the XPath data model.
*
* The interpretation of this depends on the type
* of node. For an element it is the accumulated character content of the element,
* including descendant elements.
*
* This method returns the string value as if the node were untyped. Unlike the string value
* accessor in the XPath 2.0 data model, it does not report an error if the element has a complex
* type, instead it returns the concatenation of the descendant text nodes as it would if the element
* were untyped.
*
* @return the string value of the node
* @since 8.4
*/
public String getStringValue();
/**
* Get name code. The name code is a coded form of the node name: two nodes
* with the same name code have the same namespace URI, the same local name,
* and the same prefix. By masking the name code with {@link NamePool#FP_MASK}, you get a
* fingerprint: two nodes with the same fingerprint have the same local name
* and namespace URI.
*
* @return an integer name code, which may be used to obtain the actual node
* name from the name pool. For unnamed nodes (text nodes, comments, document nodes,
* and namespace nodes for the default namespace), returns -1.
* @see net.sf.saxon.om.NamePool#allocate allocate
* @see net.sf.saxon.om.NamePool#getFingerprint getFingerprint
* @since 8.4
*/
public int getNameCode();
/**
* Get fingerprint. The fingerprint is a coded form of the expanded name
* of the node: two nodes
* with the same name code have the same namespace URI and the same local name.
* The fingerprint contains no information about the namespace prefix. For a name
* in the null namespace, the fingerprint is the same as the name code.
*
* @return an integer fingerprint; two nodes with the same fingerprint have
* the same expanded QName. For unnamed nodes (text nodes, comments, document nodes,
* and namespace nodes for the default namespace), returns -1.
* @since 8.4
*/
public int getFingerprint();
/**
* Get the local part of the name of this node. This is the name after the ":" if any.
*
* @return the local part of the name. For an unnamed node, returns "". Unlike the DOM
* interface, this returns the full name in the case of a non-namespaced name.
* @since 8.4
*/
public String getLocalPart();
/**
* Get the URI part of the name of this node. This is the URI corresponding to the
* prefix, or the URI of the default namespace if appropriate.
*
* @return The URI of the namespace of this node. For an unnamed node,
* or for an element or attribute that is not in a namespace, or for a processing
* instruction, returns an empty string.
* @since 8.4
*/
public String getURI();
/**
* Get the display name of this node, in the form of a lexical QName.
* For elements and attributes this is [prefix:]localname.
* For unnamed nodes, it is an empty string.
*
* @return The display name of this node. For a node with no name, returns
* an empty string.
* @since 8.4
*/
public String getDisplayName();
/**
* Get the prefix of the name of the node. This is defined only for elements and attributes.
* If the node has no prefix, or for other kinds of node, returns a zero-length string.
* @return The prefix of the name of the node.
* @since 8.4
*/
public String getPrefix();
/**
* Get the configuration used to build the tree containing this node.
* @return the Configuration
* @since 8.4
*/
public Configuration getConfiguration();
/**
* Get the NamePool that holds the namecode for this node
* @return the namepool
* @since 8.4
*/
public NamePool getNamePool();
/**
* Get the type annotation of this node, if any. The type annotation is represented as an integer;
* this is the fingerprint of the name of the type, as defined in the name pool. Anonymous types
* are given a system-defined name. The value of the type annotation can be used to retrieve the
* actual schema type definition using the method {@link Configuration#getSchemaType}.
*
* The bit IS_DTD_TYPE (1<<30) will be set in the case of an attribute node if the type annotation
* is one of ID, IDREF, or IDREFS and this is derived from DTD rather than schema validation.
*
* @return the type annotation of the node, under the mask NamePool.FP_MASK, and optionally the
* bit setting IS_DTD_TYPE in the case of a DTD-derived ID or IDREF/S type (which is treated
* as untypedAtomic for the purposes of obtaining the typed value).
*
*
For elements and attributes, this is the type annotation as defined in XDM. For document
* nodes, it should be one of XS_UNTYPED if the document has not been validated, or XS_ANY_TYPE
* if validation has taken place (that is, if any node in the document has an annotation other than
* Untyped or UntypedAtomic).
* @since 8.4. Refinement for document nodes introduced in 9.2
*/
public int getTypeAnnotation();
/**
* Get the type annotation of this node, if any. The type annotation is represented as
* SchemaType object.
*
* Types derived from a DTD are not reflected in the result of this method.
*
* @return For element and attribute nodes: the type annotation derived from schema
* validation (defaulting to xs:untyped and xs:untypedAtomic in the absence of schema
* validation). For comments, text nodes, processing instructions, and namespaces: null.
* For document nodes, either xs:untyped if the document has not been validated, or
* xs:anyType if it has.
* @since 9.4
*/
public SchemaType getSchemaType();
/**
* Bit setting in the returned type annotation indicating a DTD_derived type on an attribute node
*/
public static int IS_DTD_TYPE = 1<<30;
/**
* Bit setting for use alongside a type annotation indicating that the is-nilled property is set
*/
public static int IS_NILLED = 1<<29;
/**
* Get the typed value. This will either be a single AtomicValue or a value whose items are
* atomic values.
* @since 8.5. Changed in 9.5 to return the new type AtomicSequence.
* @throws XPathException if the node has no typed value, for example if
* it is an element node with element-only content
*/
public AtomicSequence atomize() throws XPathException;
/**
* Get the NodeInfo object representing the parent of this node
*
* @return the parent of this node; null if this node has no parent
* @since 8.4
*/
/*@Nullable*/ public NodeInfo getParent();
/**
* Return an iteration over all the nodes reached by the given axis from this node
*
* @param axisNumber an integer identifying the axis; one of the constants
* defined in class {@link AxisInfo}
* @return an AxisIterator that delivers the nodes reached by the axis in
* turn. The nodes are returned in axis order (document order for a forwards
* axis, reverse document order for a reverse axis).
* @see AxisInfo
* @throws UnsupportedOperationException if the namespace axis is
* requested and this axis is not supported for this implementation.
* @since 8.4
*/
public AxisIterator iterateAxis(byte axisNumber);
/**
* Return an iteration over all the nodes reached by the given axis from this node
* that match a given NodeTest
*
* @exception UnsupportedOperationException if the namespace axis is
* requested and this axis is not supported for this implementation.
* @param axisNumber an integer identifying the axis; one of the constants
* defined in class {@link AxisInfo}
* @param nodeTest A condition to be satisfied by the returned nodes; nodes
* that do not satisfy this condition are not included in the result
* @return an AxisIterator that delivers the nodes reached by the axis in
* turn. The nodes are returned in axis order (document order for a forwards
* axis, reverse document order for a reverse axis).
* @see AxisInfo
* @since 8.4
*/
public AxisIterator iterateAxis(byte axisNumber, NodeTest nodeTest);
/**
* Get the string value of a given attribute of this node
*
* @param uri the namespace URI of the attribute name. Supply the empty string for an attribute
* that is in no namespace
* @param local the local part of the attribute name.
* @return the attribute value if it exists, or null if it does not exist. Always returns null
* if this node is not an element.
* @since 9.4
*/
/*@Nullable*/ public String getAttributeValue(/*@NotNull*/ String uri, /*@NotNull*/ String local);
/**
* Get the root node of the tree containing this node
*
* @return the NodeInfo representing the top-level ancestor of this node.
* This will not necessarily be a document node. If this node has no parent,
* then the method returns this node.
* @since 8.4
*/
public NodeInfo getRoot();
/**
* Get the root node, if it is a document node.
*
* @return the DocumentInfo representing the containing document. If this
* node is part of a tree that does not have a document node as its
* root, returns null.
* @since 8.4
*/
/*@Nullable*/ public DocumentInfo getDocumentRoot();
/**
* Determine whether the node has any children.
*
* Note: the result is equivalent to
* iterateAxis(Axis.CHILD).next() != null
*
* @return True if the node has one or more children
* @since 8.4
*/
public boolean hasChildNodes();
/**
* Construct a character string that uniquely identifies this node.
* Note: a.isSameNode(b) if and only if generateId(a)==generateId(b)
*
* @param buffer a buffer which will be updated to hold a string
* that uniquely identifies this node, across all documents.
* @since 8.7
*
Changed in Saxon 8.7 to generate the ID value in a client-supplied buffer
*/
public void generateId(FastStringBuffer buffer);
/**
* Get the document number of the document containing this node. For a free-standing
* orphan node, just return the hashcode.
* @return the document number of the document containing this node
* @since 8.4
*/
public long getDocumentNumber();
/**
* Copy this node to a given Receiver.
*
* This method is primarily for internal use. It should not be considered a stable
* part of the Saxon API.
*
* @param out the Receiver to which the node should be copied. It is the caller's
* responsibility to ensure that this Receiver is open before the method is called
* (or that it is self-opening), and that it is closed after use.
* @param copyOptions a selection of the options defined in {@link net.sf.saxon.om.CopyOptions}
* @param locationId If non-zero, identifies the location of the instruction
* that requested this copy. If zero, indicates that the location information
* @throws XPathException if any downstream error occurs
*/
public void copy(Receiver out, int copyOptions, int locationId) throws XPathException;
/**
* Don't copy any namespace nodes.
*/
public static final int NO_NAMESPACES = 0;
/**
* Copy namespaces declared (or undeclared) on this element, but not namespaces inherited from a parent element
*/
public static final int LOCAL_NAMESPACES = 1;
/**
* Copy all in-scope namespaces
*/
public static final int ALL_NAMESPACES = 2;
/**
* Get all namespace declarations and undeclarations defined on this element.
*
* This method is intended primarily for internal use. User applications needing
* information about the namespace context of a node should use iterateAxis(Axis.NAMESPACE)
.
* (However, not all implementations support the namespace axis, whereas all implementations are
* required to support this method.)
*
* @param buffer If this is non-null, and the result array fits in this buffer, then the result
* may overwrite the contents of this array, to avoid the cost of allocating a new array on the heap.
* @return An array of integers representing the namespace declarations and undeclarations present on
* this element. For a node other than an element, return null. Otherwise, the returned array is a
* sequence of namespace codes, whose meaning may be interpreted by reference to the name pool. The
* top half word of each namespace code represents the prefix, the bottom half represents the URI.
* If the bottom half is zero, then this is a namespace undeclaration rather than a declaration.
* The XML namespace is never included in the list. If the supplied array is larger than required,
* then the first unused entry will be set to -1.
*
* For a node other than an element, the method returns null.
*/
public NamespaceBinding[] getDeclaredNamespaces(/*@Nullable*/ NamespaceBinding[] buffer);
/**
* Determine whether this node has the is-id property
* @return true if the node is an ID
*/
public boolean isId();
/**
* Determine whether this node has the is-idref property
* @return true if the node is an IDREF or IDREFS element or attribute
*/
public boolean isIdref();
/**
* Determine whether the node has the is-nilled property
* @return true if the node has the is-nilled property
*/
public boolean isNilled();
}