net.sf.saxon.event.Outputter Maven / Gradle / Ivy

Go to download
Show more of this group Show more artifacts with this name
Show all versions of Saxon-HE Show documentation
The XSLT and XQuery Processor
There is a newer version: 12.5
////////////////////////////////////////////////////////////////////////////////////////////////////////////////////
// Copyright (c) 2018-2023 Saxonica Limited
// This Source Code Form is subject to the terms of the Mozilla Public License, v. 2.0.
// If a copy of the MPL was not distributed with this file, You can obtain one at http://mozilla.org/MPL/2.0/.
// This Source Code Form is "Incompatible With Secondary Licenses", as defined by the Mozilla Public License, v. 2.0.
////////////////////////////////////////////////////////////////////////////////////////////////////////////////////

package net.sf.saxon.event;

import net.sf.saxon.Configuration;
import net.sf.saxon.expr.parser.Loc;
import net.sf.saxon.om.*;
import net.sf.saxon.s9api.Location;
import net.sf.saxon.str.*;
import net.sf.saxon.trans.XPathException;
import net.sf.saxon.transpile.CSharpInnerClass;
import net.sf.saxon.transpile.CSharpModifiers;
import net.sf.saxon.type.SchemaType;
import net.sf.saxon.type.SimpleType;
import net.sf.saxon.value.StringValue;

/**
 * Outputter: This interface represents a recipient of XML tree-walking (push) events. It was
 * originally based on SAX2's ContentHandler, but adapted to handle additional events. Namespaces and
 * Attributes are handled by separate events following the startElement event. Schema types
 * can be defined for elements and attributes.
 *
 * The Outputter interface is an important internal interface within Saxon, and provides a powerful
 * mechanism for integrating Saxon with other applications. It has been designed with extensibility
 * and stability in mind. However, it should be considered as an interface designed primarily for
 * internal use, and not as a completely stable part of the public Saxon API.
 *
 * @since 10.0; derived from the original Outputter interface and SequenceReceiver class.
 * This interface is now used primarily for capturing the results of push-mode evaluation
 * of tree construction expressions in XSLT and XQuery.
 */

public abstract class Outputter implements Receiver {

    protected PipelineConfiguration pipelineConfiguration;
    protected String systemId = null;

    /**
     * Set the pipeline configuration
     *
     * @param pipe the pipeline configuration
     */

    @Override
    public void setPipelineConfiguration(/*@NotNull*/ PipelineConfiguration pipe) {
        this.pipelineConfiguration = pipe;
    }

    /**
     * Get the pipeline configuration
     *
     * @return the pipeline configuration
     */

    /*@NotNull*/
    @Override
    public PipelineConfiguration getPipelineConfiguration() {
        return pipelineConfiguration;
    }

    /**
     * Get the Saxon Configuration
     * @return the configuration
     */

    public final Configuration getConfiguration() {
        return pipelineConfiguration.getConfiguration();
    }

    /**
     * Set the System ID of the tree represented by this event stream
     *
     * @param systemId the system ID (which is used as the base URI of the nodes
     *                 if there is no xml:base attribute)
     */

    @Override
    public void setSystemId(String systemId) {
        this.systemId = systemId;
    }

    /**
     * Get the system ID
     *
     * @return the system ID that was supplied using the setSystemId() method
     */

    /*@Nullable*/
    @Override
    public String getSystemId() {
        return systemId;
    }


    /**
     * Notify the start of the event stream
     *
     * @throws XPathException if an error occurs
     */

    @Override
    public void open() throws XPathException {}

    /**
     * Notify the start of a document node
     *
     * @param properties bit-significant integer indicating properties of the document node.
     *                   The definitions of the bits are in class {@link ReceiverOption}
     * @throws XPathException if an error occurs
     */

    @Override
    abstract public void startDocument(int properties) throws XPathException;

    /**
     * Notify the end of a document node
     *
     * @throws XPathException if an error occurs
     */

    @Override
    abstract public void endDocument() throws XPathException;

    /**
     * Notify an unparsed entity URI.
     *
     * @param name     The name of the unparsed entity
     * @param systemID The system identifier of the unparsed entity
     * @param publicID The identifier of the unparsed entity
     * @throws XPathException if an error occurs
     */

    @Override
    public void setUnparsedEntity(String name, String systemID, String publicID) throws XPathException {}

    /**
     * Notify the start of an element. This version of startElement() must be followed
     * by calls on {@link #attribute(NodeName, SimpleType, String, Location, int)} and
     * {@link #namespace(String, NamespaceUri, int)} to supply the attributes and namespaces; these calls
     * may be terminated by a call on {@link #startContent()} but this is not mandatory.
     *
     * @param elemName   the name of the element.
     * @param typeCode   the type annotation of the element.
     * @param location   an object providing information about the module, line, and column where the node originated
     * @param properties bit-significant properties of the element node. If there are no relevant
     *                   properties, zero is supplied. The definitions of the bits are in class {@link ReceiverOption}
     * @throws XPathException if an error occurs
     */

    abstract public void startElement(NodeName elemName, SchemaType typeCode, Location location, int properties)
            throws XPathException;

    /**
     * Notify the start of an element, supplying all attributes and namespaces
     *
     * @param elemName   the name of the element.
     * @param type       the type annotation of the element.
     * @param attributes the attributes of this element
     * @param namespaces the in-scope namespaces of this element: generally this is all the in-scope
     *                   namespaces, without relying on inheriting namespaces from parent elements
     * @param location   an object providing information about the module, line, and column where the node originated
     * @param properties bit-significant properties of the element node. If there are no relevant
     *                   properties, zero is supplied. The definitions of the bits are in class {@link ReceiverOption}
     * @throws XPathException if an error occurs
     */
    @Override
    public void startElement(NodeName elemName, SchemaType type, AttributeMap attributes, NamespaceMap namespaces, Location location, int properties) throws XPathException {
        // This is a default implementation which is not particularly efficient. An Outputter that feeds
        // directly into a Receiver should try to avoid decomposing the attributes and namespaces.
        startElement(elemName, type, location, properties);
        for (NamespaceBinding ns : namespaces) {
            namespace(ns.getPrefix(), ns.getNamespaceUri(), properties);
        }
        for (AttributeInfo att : attributes) {
            attribute(att.getNodeName(), att.getType(), att.getValue(), att.getLocation(), att.getProperties());
        }
        startContent();
    }

    /**
     * Notify a namespace binding. This method is called at some point after startElement().
     * The semantics are similar to the xsl:namespace instruction in XSLT, or the namespace
     * node constructor in XQuery.
     * A namespace must not conflict with any namespaces already used for element or attribute names.
     *
     * @param prefix           The namespace prefix; zero-length string for the default namespace
     * @param namespaceUri     The namespace URI. In some cases a zero-length string may be used to
     *                         indicate a namespace undeclaration.
     * @param properties       The REJECT_DUPLICATES property: if set, the
     *                         namespace declaration will be rejected if it conflicts with a previous declaration of the same
     *                         prefix. If the property is not set, the namespace declaration will be ignored if it conflicts
     *                         with a previous declaration. This reflects the fact that when copying a tree, namespaces for child
     *                         elements are emitted before the namespaces of their parent element. Unfortunately this conflicts
     *                         with the XSLT rule for complex content construction, where the recovery action in the event of
     *                         conflicts is to take the namespace that comes last. XSLT therefore doesn't recover from this error:
     * @throws XPathException if an error occurs
     * @since changed in 10.0 to report all the in-scope namespaces for an element, and to do so
     * in a single call.
     */

    abstract public void namespace(String prefix, NamespaceUri namespaceUri, int properties) throws XPathException;

    /**
     * Output a set of namespace bindings. This should have the same effect as outputting the
     * namespace bindings individually using {@link #namespace(String, NamespaceUri, int)}, but it
     * may be more efficient. It is used only when copying an element node together with
     * all its namespaces, so less checking is needed that the namespaces form a consistent
     * and complete set
     * @param bindings the set of namespace bindings
     * @param properties any special properties. The property {@link ReceiverOption#NAMESPACE_OK}
     *                   means that no checking is needed.
     * @throws XPathException if any failure occurs
     */

    public void namespaces(NamespaceBindingSet bindings, int properties) throws XPathException {
        // Optimized in ComplexContentOutputter subclass
        for (NamespaceBinding nb: bindings) {
            namespace(nb.getPrefix(), nb.getNamespaceUri(), properties);
        }
    }

    /**
     * Notify an attribute. Attributes are notified after the startElement event, and before any
     * children. Namespaces and attributes may be intermingled.
     *
     * @param attName    The name of the attribute
     * @param typeCode   The type annotation of the attribute
     * @param value      the string value of the attribute
     * @param location  provides information such as line number and system ID.
     * @param properties Bit significant value. The following bits are defined:
     *                   
     *                   DISABLE_ESCAPING
    Disable escaping for this attribute
     *                   NO_SPECIAL_CHARACTERS
      Attribute value contains no special characters
     *                   
     * @throws IllegalStateException  attempt to output an attribute when there is no open element
     *                                start tag
     * @throws XPathException         if an error occurs
     */

    abstract public void attribute(NodeName attName, SimpleType typeCode, String value, Location location, int properties)
            throws XPathException;

    /**
     * Notify the start of the content, that is, the completion of all attributes and namespaces.
     * Note that the initial Outputter of output from XSLT instructions will not receive this event,
     * it has to detect it itself. Note that this event is reported for every element even if it has
     * no attributes, no namespaces, and no content.
     *
     * @throws XPathException if an error occurs
     */

    public void startContent() throws XPathException {}

    /**
     * Notify the end of an element. The Outputter must maintain a stack if it needs to know which
     * element is ending.
     *
     * @throws XPathException if an error occurs
     */

    @Override
    abstract public void endElement() throws XPathException;

    /**
     * Notify character data. Note that some receivers may require the character data to be
     * sent in a single event, but in general this is not a requirement.
     *
     * @param chars      The characters
     * @param location  provides information such as line number and system ID.
     * @param properties Bit significant value. The following bits are defined:
     *                   
     *                   DISABLE_ESCAPING
           Disable escaping for this text node
     *                   USE_CDATA
                  Output as a CDATA section
     *                   
     * @throws XPathException if an error occurs
     */

    @Override
    abstract public void characters(UnicodeString chars, Location location, int properties)
            throws XPathException;

    /**
     * Output a processing instruction
     *
     * @param name       The PI name. This must be a legal name (it will not be checked).
     * @param data       The data portion of the processing instruction
     * @param location   provides information such as line number and system ID.
     * @param properties Additional information about the PI.
     * @throws IllegalArgumentException the content is invalid for an XML processing instruction
     * @throws XPathException            if an error occurs
     */

    @Override
    abstract public void processingInstruction(String name, UnicodeString data, Location location, int properties)
            throws XPathException;

    /**
     * Notify a comment. Comments are only notified if they are outside the DTD.
     *
     * @param content    The content of the comment
     * @param location  provides information such as line number and system ID.
     * @param properties Additional information about the comment.
     * @throws IllegalArgumentException  the content is invalid for an XML comment
     * @throws XPathException            if an error occurs
     */

    @Override
    abstract public void comment(UnicodeString content, Location location, int properties) throws XPathException;

    /**
     * Append an arbitrary item (node, atomic value, or function) to the output. The default
     * implementation throws {@code UnsupportedOperationException}.
     * @param item           the item to be appended
     * @param locationId     the location of the calling instruction, for diagnostics
     * @param properties if the item is an element node, this indicates whether its namespaces
*                       need to be copied. Values are {@link ReceiverOption#ALL_NAMESPACES}; the default (0) means
     */

     @Override
     public void append(Item item, Location locationId, int properties) throws XPathException {
         throw new UnsupportedOperationException();
     }

    /**
     * Append an arbitrary item (node, atomic value, or function) to the output.
     * By default, if the item is an element node, it is copied with all namespaces.
     * The default implementation calls {@link #append(Item, Location, int)}, whose
     * default implementation throws {@code UnsupportedOperationException}
     *
     * @param item the item to be appended
     * @throws net.sf.saxon.trans.XPathException if the operation fails
     */

    @Override
    public void append(Item item) throws XPathException {
        append(item, Loc.NONE, ReceiverOption.ALL_NAMESPACES);
    }

    /**
     * Get a string-value consumer object that allows an item of type xs:string
     * to be appended one fragment at a time. This potentially allows operations that
     * output large strings to avoid building the entire string in memory. The default
     * implementation, however, simply assembles the string in a buffer and releases
     * the entire string on completion.
     * @return an object that accepts xs:string values via a sequence of append() calls
     * @param asTextNode set to true if the concatenated string values are to be treated
     *                   as a text node item rather than a string
     */

    @CSharpInnerClass(outer = true, extra = {"Saxon.Hej.s9api.Location loc"})
    public UniStringConsumer getStringReceiver(boolean asTextNode, Location loc) {
        if (asTextNode) {
            return new AbstractUniStringConsumer() {

                final UnicodeBuilder buffer = new UnicodeBuilder();

                @Override
                @CSharpModifiers(code={"public", "override"})
                public UniStringConsumer accept(UnicodeString chars) {
                    buffer.accept(chars);
                    return this;
                }

                @Override
                @CSharpModifiers(code = {"public", "override"})
                public void close() throws XPathException {
                    Outputter.this.characters(buffer.toUnicodeString(), loc, ReceiverOption.NONE);
                }
            };
        } else {
            return new AbstractUniStringConsumer() {

                final UnicodeBuilder buffer = new UnicodeBuilder();

                @Override
                @CSharpModifiers(code = {"public", "override"})
                public UniStringConsumer accept(UnicodeString chars) {
                    buffer.accept(chars);
                    return this;
                }

                @Override
                @CSharpModifiers(code = {"public", "override"})
                public void close() throws XPathException {
                    Outputter.this.append(new StringValue(buffer.toUnicodeString()));
                }
            };
        }
    }

    /**
     * Notify the end of the event stream
     *
     * @throws XPathException if an error occurs
     */

    @Override
    public void close() throws XPathException {}

    /**
     * Ask whether this Outputter (or the downstream pipeline) makes any use of the type annotations
     * supplied on element and attribute events. The default implementation of this method
     * returns false.
     *
     * @return true if the Outputter makes any use of this information. If false, the caller
     *         may supply untyped nodes instead of supplying the type annotation (or conversely, it may
     *         avoid stripping unwanted type annotations)
     */

    @Override
    public boolean usesTypeAnnotations() {
        return false;
    }


}