com.globalmentor.xml.XMLSerializer Maven / Gradle / Ivy

Go to download
Show more of this group Show more artifacts with this name
Show all versions of globalmentor-xml Show documentation
GlobalMentor Java XML utility library.
The newest version!
/*
 * Copyright © 1996-2008 GlobalMentor, Inc. 
 *
 * Licensed under the Apache License, Version 2.0 (the "License");
 * you may not use this file except in compliance with the License.
 * You may obtain a copy of the License at
 *
 *     https://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */

package com.globalmentor.xml;

import java.io.*;
import java.util.*;
import java.util.stream.Stream;

import javax.annotation.*;

import java.nio.charset.Charset;

import com.globalmentor.io.ByteOrderMark;

import static com.globalmentor.collections.comparators.ExplicitOrderComparator.*;
import static com.globalmentor.java.CharSequences.*;
import static com.globalmentor.java.Characters.SPACE_CHAR;
import static com.globalmentor.java.Conditions.*;
import static com.globalmentor.java.Objects.*;

import com.globalmentor.java.CharSequences;
import com.globalmentor.java.Characters;

import static com.globalmentor.xml.XmlDom.*;
import static com.globalmentor.xml.def.XML.*;
import static java.lang.String.CASE_INSENSITIVE_ORDER;
import static java.nio.charset.StandardCharsets.*;
import static java.util.Comparator.*;
import static java.util.Objects.*;

import com.globalmentor.xml.def.*;

import io.confound.config.Configuration;
import io.confound.config.properties.PropertiesConfiguration;

import org.w3c.dom.*;

/**
 * Serializes an XML document to a byte-oriented output stream. Has the option of automatically formatting the output in a hierarchical structure with tabs or
 * other strings.
 * @author Garret Wilson
 * @see DefaultXmlFormatProfile
 */
public class XMLSerializer {

	/**
	 * The option key indicating whether the output should be formatted.
	 * @see #setOptions(Properties)
	 * @see #OPTION_FORMAT_OUTPUT_DEFAULT
	 */
	public static final String OPTION_FORMAT_OUTPUT = "formatOutput";

	/** The default for {@link #OPTION_FORMAT_OUTPUT}: unformatted output. */
	public static final boolean OPTION_FORMAT_OUTPUT_DEFAULT = false;

	/**
	 * The option key indicating whether Unicode control characters should be XML-encoded.
	 * @see #setOptions(Properties)
	 * @see #OPTION_XML_ENCODE_CONTROL_DEFAULT
	 */
	public static final String OPTION_XML_ENCODE_CONTROL = "xmlEncodeControl";

	/** The default for {@link #OPTION_XML_ENCODE_CONTROL}: control characters are not XML-encoded. */
	public static final boolean OPTION_XML_ENCODE_CONTROL_DEFAULT = false;

	/**
	 * The option key indicating whether extended characters (above 127) should be XML-encoded.
	 * @see #setOptions(Properties)
	 * @see #OPTION_XML_ENCODE_NON_ASCII_DEFAULT
	 */
	public static final String OPTION_XML_ENCODE_NON_ASCII = "xmlEncodeNonASCII";

	/** The default for {@link #OPTION_XML_ENCODE_NON_ASCII}: extended characters are not XML-encoded. */
	public static final boolean OPTION_XML_ENCODE_NON_ASCII_DEFAULT = false;

	/**
	 * The option key indicating whether private use Unicode characters should be XML-encoded.
	 * @see #setOptions(Properties)
	 * @see #OPTION_XML_ENCODE_PRIVATE_USE_DEFAULT
	 */
	public static final String OPTION_XML_ENCODE_PRIVATE_USE = "xmlEncodePrivateUse";

	/** The default for {@link #OPTION_XML_ENCODE_PRIVATE_USE}: private use characters are not XML-encoded. */
	public static final boolean OPTION_XML_ENCODE_PRIVATE_USE_DEFAULT = false;

	/**
	 * The option key indicating whether characters that match a one-character defined entity should be encoded using that entity.
	 * @see #setOptions(Properties)
	 * @see #OPTION_USE_DEFINED_ENTITIES_DEFAULT
	 */
	public static final String OPTION_USE_DEFINED_ENTITIES = "useDefinedEntities";

	/** The default for {@link #OPTION_USE_DEFINED_ENTITIES}: one-character defined entities are used for encoding. */
	public static final boolean OPTION_USE_DEFINED_ENTITIES_DEFAULT = true;

	/**
	 * The policy governing when a character that matches a one-character predefined entity is encoded using that entity.
	 */
	public enum PredefinedEntitiesUse {
		/** A predefined entity is used whenever one is available. */
		ALWAYS,
		/** A predefined entity is used only when the character needs to be encoded. */
		AS_NEEDED,
		/** A predefined entity is never used; a character reference is used when the character needs to be encoded. */
		NEVER
	}

	/**
	 * The option key indicating when characters that match a one-character predefined entity should be encoded using that entity.
	 * @see #setOptions(Properties)
	 * @see PredefinedEntitiesUse
	 */
	public static final String OPTION_USE_PREDEFINED_ENTITIES = "usePredefinedEntities";

	/** The default for {@link #OPTION_USE_PREDEFINED_ENTITIES}: one-character predefined entities are used for encoding as needed. */
	public static final PredefinedEntitiesUse OPTION_USE_PREDEFINED_ENTITIES_DEFAULT = PredefinedEntitiesUse.AS_NEEDED;

	/** Whether a byte order mark (BOM) is written; disabled by default. */
	private boolean bomWritten = false;

	/**
	 * Indicates whether this serializer writes a byte order mark (BOM).
	 * @return {@code true} if a BOM is written.
	 * @see #setBomWritten(boolean)
	 */
	public boolean isBomWritten() {
		return this.bomWritten;
	}

	/**
	 * Sets whether a byte order mark (BOM) is written when serializing.
	 * @implSpec This option is disabled by default.
	 * @param bomWritten {@code true} if a BOM should be written, or {@code false} if not.
	 * @see #isBomWritten()
	 */
	public void setBomWritten(final boolean bomWritten) {
		this.bomWritten = bomWritten;
	}

	/** Whether an XML prolog is written; enabled by default. */
	private boolean prologWritten = true;

	/**
	 * Indicates whether this serializer writes an XML prolog.
	 * @return {@code true} if an XML prolog is written.
	 * @see #setPrologWritten(boolean)
	 */
	public boolean isPrologWritten() {
		return this.prologWritten;
	}

	/**
	 * Sets whether an XML prolog is written when serializing a document.
	 * @implSpec This option is enabled by default.
	 * @param prologWritten {@code true} if an XML prolog should be written, or {@code false} if not.
	 * @see #isPrologWritten()
	 */
	public void setPrologWritten(final boolean prologWritten) {
		this.prologWritten = prologWritten;
	}

	/** Whether the output should be formatted; initialized from {@link #OPTION_FORMAT_OUTPUT_DEFAULT}. */
	private boolean formatted = OPTION_FORMAT_OUTPUT_DEFAULT;

	/**
	 * Indicates whether the output should be formatted.
	 * @return {@code true} if the output should be formatted.
	 * @see #setFormatted(boolean)
	 */
	public boolean isFormatted() {
		return this.formatted;
	}

	/**
	 * Turns output formatting on or off.
	 * @implSpec This option defaults to {@value #OPTION_FORMAT_OUTPUT_DEFAULT}.
	 * @param newFormatted {@code true} if the output should be formatted, else {@code false}.
	 * @see #isFormatted()
	 */
	public void setFormatted(final boolean newFormatted) {
		this.formatted = newFormatted;
	}

	/** Whether Unicode control characters should be XML-encoded; initialized from {@link #OPTION_XML_ENCODE_CONTROL_DEFAULT}. */
	private boolean xmlEncodeControl = OPTION_XML_ENCODE_CONTROL_DEFAULT;

	/**
	 * Indicates whether Unicode control characters should be XML-encoded.
	 * @return {@code true} if control characters should be XML-encoded.
	 * @see #setXMLEncodeControl(boolean)
	 * @see #isUseDefinedEntities()
	 */
	public boolean isXMLEncodeControl() {
		return this.xmlEncodeControl;
	}

	/**
	 * Specifies whether Unicode control characters should be XML-encoded.
	 * @implSpec This option defaults to {@value #OPTION_XML_ENCODE_CONTROL_DEFAULT}.
	 * @param newXMLEncodeControl {@code true} if control characters should be XML-encoded, else {@code false}.
	 * @see #isXMLEncodeControl()
	 * @see #setUseDefinedEntities(boolean)
	 */
	public void setXMLEncodeControl(final boolean newXMLEncodeControl) {
		this.xmlEncodeControl = newXMLEncodeControl;
	}

	/** Whether extended characters (above 127) should be XML-encoded; initialized from {@link #OPTION_XML_ENCODE_NON_ASCII_DEFAULT}. */
	private boolean xmlEncodeNonASCII = OPTION_XML_ENCODE_NON_ASCII_DEFAULT;

	/**
	 * Indicates whether extended characters (above 127) should be XML-encoded.
	 * @return {@code true} if extended characters should be XML-encoded.
	 * @see #setXMLEncodeNonASCII(boolean)
	 * @see #isUseDefinedEntities()
	 */
	public boolean isXmlEncodeNonAscii() {
		return this.xmlEncodeNonASCII;
	}

	/**
	 * Specifies whether extended characters (above 127) should be XML-encoded.
	 * @implSpec This option defaults to {@value #OPTION_XML_ENCODE_NON_ASCII_DEFAULT}.
	 * @param newXmlEncodeNonAscii {@code true} if extended characters should be XML-encoded, else {@code false}.
	 * @see #isXmlEncodeNonAscii()
	 * @see #setUseDefinedEntities(boolean)
	 */
	public void setXMLEncodeNonASCII(final boolean newXmlEncodeNonAscii) {
		this.xmlEncodeNonASCII = newXmlEncodeNonAscii;
	}

	/** Whether private use Unicode characters should be XML-encoded; initialized from {@link #OPTION_XML_ENCODE_PRIVATE_USE_DEFAULT}. */
	private boolean xmlEncodePrivateUse = OPTION_XML_ENCODE_PRIVATE_USE_DEFAULT;

	/**
	 * Indicates whether private use Unicode characters should be XML-encoded.
	 * @return {@code true} if private use characters should be XML-encoded.
	 * @see #setXMLEncodePrivateUse(boolean)
	 * @see #isUseDefinedEntities()
	 */
	public boolean isXMLEncodePrivateUse() {
		return this.xmlEncodePrivateUse;
	}

	/**
	 * Specifies whether private use Unicode characters should be XML-encoded.
	 * @implSpec This option defaults to {@value #OPTION_XML_ENCODE_PRIVATE_USE_DEFAULT}.
	 * @param newXmlEncodePrivateUse {@code true} if private use characters should be XML-encoded, else {@code false}.
	 * @see #isXMLEncodePrivateUse()
	 * @see #setUseDefinedEntities(boolean)
	 */
	public void setXMLEncodePrivateUse(final boolean newXmlEncodePrivateUse) {
		this.xmlEncodePrivateUse = newXmlEncodePrivateUse;
	}

	/** Whether one-character defined entities are used when possible; initialized from {@link #OPTION_USE_DEFINED_ENTITIES_DEFAULT}. */
	private boolean useDefinedEntities = OPTION_USE_DEFINED_ENTITIES_DEFAULT;

	/**
	 * Indicates whether one-character entities will be used when possible.
	 * @return {@code true} if one-character entities will be used when possible.
	 * @see #setUseDefinedEntities(boolean)
	 * @see #isXMLEncodeControl()
	 */
	public boolean isUseDefinedEntities() {
		return this.useDefinedEntities;
	}

	/**
	 * Specifies whether characters that match a one-character entity should be encoded using that entity. This will override the XML-encoding settings when
	 * applicable.
	 * @implSpec This option defaults to {@value #OPTION_USE_DEFINED_ENTITIES_DEFAULT}.
	 * @param newUseDefinedEntities {@code true} if available entities should be used to encode characters.
	 * @see #isUseDefinedEntities()
	 * @see #setXMLEncodeControl(boolean)
	 */
	public void setUseDefinedEntities(final boolean newUseDefinedEntities) {
		this.useDefinedEntities = newUseDefinedEntities;
	}

	/** The policy for using one-character predefined entities; initialized from {@link #OPTION_USE_PREDEFINED_ENTITIES_DEFAULT}. */
	private PredefinedEntitiesUse usePredefinedEntities = OPTION_USE_PREDEFINED_ENTITIES_DEFAULT;

	/**
	 * Returns the policy indicating when one-character predefined entities will be used.
	 * @return The current predefined entities use policy.
	 * @see #setUsePredefinedEntities(PredefinedEntitiesUse)
	 * @see #isXMLEncodeControl()
	 */
	public PredefinedEntitiesUse getUsePredefinedEntities() {
		return this.usePredefinedEntities;
	}

	/**
	 * Specifies when characters that match a one-character predefined entity should be encoded using that entity. This will override the XML-encoding settings
	 * when applicable.
	 * @implSpec This option defaults to {@link #OPTION_USE_PREDEFINED_ENTITIES_DEFAULT}.
	 * @param newUsePredefinedEntities The policy indicating when predefined entities should be used to encode characters.
	 * @throws NullPointerException if the given policy is {@code null}.
	 * @see #getUsePredefinedEntities()
	 * @see #setXMLEncodeControl(boolean)
	 */
	public void setUsePredefinedEntities(@Nonnull final PredefinedEntitiesUse newUsePredefinedEntities) {
		this.usePredefinedEntities = requireNonNull(newUsePredefinedEntities);
	}

	/** Whether missing namespaces declarations should be added; enabled by default. */
	private boolean namespacesDeclarationsEnsured = true;

	/**
	 * Indicates whether missing namespaces declarations should be added.
	 * @return {@code true} if missing namespaces declarations should be added.
	 * @see #setNamespacesDeclarationsEnsured(boolean)
	 */
	public boolean isNamespacesDeclarationsEnsured() {
		return this.namespacesDeclarationsEnsured;
	}

	/**
	 * Sets whether missing namespace declarations are added.
	 * @implSpec This option is enabled by default.
	 * @param namespacesDeclarationsEnsured {@code true} if missing namespaces declarations should be added, or {@code false} if not.
	 * @see #isNamespacesDeclarationsEnsured()
	 */
	public void setNamespacesDeclarationsEnsured(final boolean namespacesDeclarationsEnsured) {
		this.namespacesDeclarationsEnsured = namespacesDeclarationsEnsured;
	}

	/**
	 * Whether missing namespaces declarations should be added to the document element if possible, rather than the top-level element needing the declaration;
	 * enabled by default.
	 */
	private boolean namespacesDocumentElementDeclarations = true;

	/**
	 * Indicates where missing namespaces declarations should be added.
	 * @return {@code true} if missing namespaces declarations should be added to the document element if possible, rather than the top-level element needing
	 *         the declaration.
	 * @see #setNamespacesDocumentElementDeclarations(boolean)
	 */
	public boolean isNamespacesDocumentElementDeclarations() {
		return this.namespacesDocumentElementDeclarations;
	}

	/**
	 * Sets whether missing namespace declarations are added to the document element if possible, or to the top-level element needing the declaration.
	 * @implSpec This option is enabled by default.
	 * @param namespacesDocumentElementDeclarations {@code true} if missing namespaces declarations should be added to the document element if possible, rather
	 *          than the top-level element needing the declaration.
	 * @see #isNamespacesDocumentElementDeclarations()
	 */
	public void setNamespacesDocumentElementDeclarations(final boolean namespacesDocumentElementDeclarations) {
		this.namespacesDocumentElementDeclarations = namespacesDocumentElementDeclarations;
	}

	/**
	 * Configures this serializer from the given option properties. Each recognized option is looked up by its <code>OPTION_*</code> key; an option that is not
	 * found is set to its corresponding <code>OPTION_*_DEFAULT</code> value.
	 * @param options The properties which contain the options.
	 * @see #OPTION_FORMAT_OUTPUT
	 * @see #OPTION_USE_DEFINED_ENTITIES
	 * @see #OPTION_USE_PREDEFINED_ENTITIES
	 * @see #OPTION_XML_ENCODE_CONTROL
	 * @see #OPTION_XML_ENCODE_NON_ASCII
	 * @see #OPTION_XML_ENCODE_PRIVATE_USE
	 */
	public void setOptions(@Nonnull final Properties options) {
		final Configuration configuration = new PropertiesConfiguration(options); //TODO switch to passing Configuration

		final boolean formatOutput = configuration.findBoolean(OPTION_FORMAT_OUTPUT).orElse(OPTION_FORMAT_OUTPUT_DEFAULT);
		setFormatted(formatOutput);

		final boolean definedEntitiesUsed = configuration.findBoolean(OPTION_USE_DEFINED_ENTITIES).orElse(OPTION_USE_DEFINED_ENTITIES_DEFAULT);
		setUseDefinedEntities(definedEntitiesUsed);

		//the predefined entities policy is only recognized if the option value is already an instance of the enum
		final PredefinedEntitiesUse predefinedEntitiesUse = configuration.findObject(OPTION_USE_PREDEFINED_ENTITIES)
				.flatMap(asInstance(PredefinedEntitiesUse.class)).orElse(OPTION_USE_PREDEFINED_ENTITIES_DEFAULT);
		setUsePredefinedEntities(predefinedEntitiesUse);

		final boolean controlEncoded = configuration.findBoolean(OPTION_XML_ENCODE_CONTROL).orElse(OPTION_XML_ENCODE_CONTROL_DEFAULT);
		setXMLEncodeControl(controlEncoded);

		final boolean nonAsciiEncoded = configuration.findBoolean(OPTION_XML_ENCODE_NON_ASCII).orElse(OPTION_XML_ENCODE_NON_ASCII_DEFAULT);
		setXMLEncodeNonASCII(nonAsciiEncoded);

		final boolean privateUseEncoded = configuration.findBoolean(OPTION_XML_ENCODE_PRIVATE_USE).orElse(OPTION_XML_ENCODE_PRIVATE_USE_DEFAULT);
		setXMLEncodePrivateUse(privateUseEncoded);
	}

	/** The character sequence used for horizontal alignment when formatting; a single tab by default. */
	private CharSequence horizontalAligner = "\t";

	/**
	 * Returns the character sequence to use for horizontally aligning the elements if formatting is turned on.
	 * @return The horizontal alignment character sequence.
	 * @see #isFormatted()
	 */
	public CharSequence getHorizontalAligner() {
		return this.horizontalAligner;
	}

	/**
	 * Sets a single character to use for horizontally aligning the elements if formatting is turned on.
	 * @implSpec The default is a single tab character.
	 * @implSpec This method converts the character to a string and delegates to {@link #setHorizontalAligner(CharSequence)}.
	 * @param horizontalAligner The horizontal alignment character.
	 * @see #setFormatted(boolean)
	 */
	public void setHorizontalAligner(final char horizontalAligner) {
		setHorizontalAligner(Character.toString(horizontalAligner));
	}

	/**
	 * Sets the character sequence to use for horizontally aligning the elements if formatting is turned on.
	 * @implSpec The default is a single tab character.
	 * @implNote The value is checked for <code>null</code> when it is set, consistent with {@link #setLineSeparator(CharSequence)}, so that an invalid aligner is
	 *           reported immediately rather than being stored.
	 * @param horizontalAligner The horizontal alignment character sequence.
	 * @throws NullPointerException if the given horizontal aligner is <code>null</code>.
	 * @see #setFormatted(boolean)
	 */
	public void setHorizontalAligner(@Nonnull final CharSequence horizontalAligner) {
		this.horizontalAligner = requireNonNull(horizontalAligner);
	}

	/** The character sequence used to separate lines; the system line separator by default. */
	private CharSequence lineSeparator = System.lineSeparator();

	/**
	 * Returns the character sequence used to separate lines; that is, for newlines or line breaks.
	 * @return The newline delimiter to use.
	 * @see #setLineSeparator(CharSequence)
	 * @see System#lineSeparator()
	 */
	public CharSequence getLineSeparator() {
		return this.lineSeparator;
	}

	/**
	 * Sets the character sequence to use to separate lines; that is, for newlines or line breaks.
	 * @implSpec The default is the system line separator {@link System#lineSeparator()}.
	 * @param lineSeparator The newline delimiter to use.
	 * @throws NullPointerException if the given line separator is <code>null</code>.
	 * @see #getLineSeparator()
	 * @see System#lineSeparator()
	 */
	public void setLineSeparator(@Nonnull final CharSequence lineSeparator) {
		this.lineSeparator = requireNonNull(lineSeparator);
	}

	/** Whether an ending newline is added when formatting is enabled; enabled by default. */
	private boolean formatEndNewline = true;

	/**
	 * Indicates whether an ending newline will be added if formatting is enabled.
	 * @return {@code true} if the formatted XML will end with a newline.
	 * @see #setFormatEndNewline(boolean)
	 * @see #isFormatted()
	 * @see #getLineSeparator()
	 */
	public boolean isFormatEndNewline() {
		return this.formatEndNewline;
	}

	/**
	 * Sets whether a final newline will be appended if formatting is enabled.
	 * @implSpec This option is enabled by default.
	 * @param formatEndNewline {@code true} if a newline should be added at the end, or {@code false} if not.
	 * @see #isFormatEndNewline()
	 * @see #isFormatted()
	 * @see #getLineSeparator()
	 */
	public void setFormatEndNewline(final boolean formatEndNewline) {
		this.formatEndNewline = formatEndNewline;
	}

	/**
	 * The current level of indenting during document serialization if output is formatted. The level starts at <code>-1</code> until it is changed by
	 * {@link #indent()} or {@link #resetIndent()}.
	 */
	private int indent = -1;

	/**
	 * Returns the current indent level.
	 * @return The current indent level, with 0 indicating no indention.
	 * @see #indent()
	 * @see #unindent()
	 * @see #resetIndent()
	 */
	protected int getIndent() {
		return this.indent;
	}

	/**
	 * Increases the indent level by one.
	 * @return The new indent level.
	 * @see #unindent()
	 */
	protected int indent() {
		indent += 1;
		return indent;
	}

	/**
	 * Decreases the indent level by one.
	 * @return The new indent level.
	 * @throws IllegalStateException If the indent level is not greater than zero, as it cannot be reduced further.
	 * @see #indent()
	 */
	protected int unindent() {
		checkState(indent > 0, "Attempted to negatively indent."); //refuse to go below zero
		indent -= 1;
		return indent;
	}

	/**
	 * Sets the indent level back to zero, indicating no indention.
	 * @see #getIndent()
	 */
	protected void resetIndent() {
		this.indent = 0;
	}

	/**
	 * The string representing one-character entity values defined in the document. The {@link #entityNames} array will contain the names of the corresponding
	 * entities, each at the same index as the corresponding character value.
	 * @see #entityNames
	 */
	private String entityCharacterValues;

	/**
	 * An array of entity names, each corresponding to the character value at the same index in the {@link #entityCharacterValues} string.
	 * @see #entityCharacterValues
	 */
	private String[] entityNames;

	/**
	 * Default constructor for unformatted output.
	 * @implSpec This constructor delegates to {@link #XMLSerializer(boolean)} with <code>false</code>.
	 */
	public XMLSerializer() {
		this(false);
	}

	/**
	 * Constructor that specifies serialization options.
	 * @implSpec This constructor first performs the default unformatted construction and then applies the given options using {@link #setOptions(Properties)}.
	 * @param options The options to use for serialization.
	 */
	public XMLSerializer(final Properties options) {
		this(false); //start from the default, unformatted configuration
		setOptions(options); //then override the configuration from the given properties
	}

	/**
	 * Constructor for an optionally formatted serializer using the {@link DefaultXmlFormatProfile#INSTANCE} format profile.
	 * @implSpec This constructor delegates to {@link #XMLSerializer(boolean, XmlFormatProfile)}.
	 * @param formatted Whether the serializer should be formatted.
	 */
	public XMLSerializer(final boolean formatted) {
		this(formatted, DefaultXmlFormatProfile.INSTANCE);
	}

	/** The profile used to guide formatting; never <code>null</code> once construction completes. */
	private final XmlFormatProfile formatProfile;

	/**
	 * Returns the profile characterizing the content for formatting purposes.
	 * @return The format profile given at construction.
	 */
	protected XmlFormatProfile getFormatProfile() {
		return this.formatProfile;
	}

	/**
	 * Constructor for an optionally formatted serializer.
	 * @implNote The entity lookup is initialized and the formatted flag is set before the format profile is checked for <code>null</code>.
	 * @param formatted Whether the serializer should be formatted.
	 * @param formatProfile The profile to use to guide formatting.
	 * @throws NullPointerException if the given format profile is <code>null</code>.
	 */
	public XMLSerializer(final boolean formatted, @Nonnull final XmlFormatProfile formatProfile) {
		//Always initialize the entity lookup, so that at least the five XML entities will be included in the table in case only part of a document is serialized.
		//TODO fix better so that serializing part of the document somehow initializes these
		initializeEntityLookup(null);
		setFormatted(formatted); //set whether the output should be formatted
		this.formatProfile = requireNonNull(formatProfile);
	}

	/**
	 * Serializes the specified document, along with its own document type if any, to a string using the UTF-8 encoding.
	 * @apiNote Whether a byte order mark is written depends on the setting of {@link #isBomWritten()}; normally this should be set to false when writing to a
	 *          string.
	 * @implSpec This method delegates to {@link #serialize(Document, DocumentType)} using the document type returned by {@link Document#getDoctype()}.
	 * @param document The XML document to serialize.
	 * @return A string containing the serialized XML data.
	 * @throws IllegalArgumentException if the document type has a public ID with no system ID.
	 * @throws IOException Thrown if an I/O error occurred.
	 * @throws UnsupportedEncodingException Thrown if the UTF-8 encoding not recognized.
	 * @see #setBomWritten(boolean)
	 */
	public String serialize(@Nonnull final Document document) throws UnsupportedEncodingException, IOException {
		final DocumentType documentType = document.getDoctype(); //may be null if the document has no doctype
		return serialize(document, documentType);
	}

	/**
	 * Serializes the specified document to a string using the UTF-8 encoding, substituting a document type built from the given identifiers.
	 * @apiNote This method replaces the given document's doctype altogether, even if null is indicated for both public and system identifiers.
	 * @apiNote Whether a byte order mark is written depends on the setting of {@link #isBomWritten()}; normally this should be set to false when writing to a
	 *          string.
	 * @implSpec The replacement document type is created using the node name of the document element as its name.
	 * @param document The XML document to serialize.
	 * @param publicId The external subset public identifier to use instead of that specified by the document, or null if none should be included.
	 * @param systemId The external subset system identifier to use instead of that specified by the document, or null if none should be included.
	 * @return A string containing the serialized XML data.
	 * @throws IllegalArgumentException if a public ID was given with no system ID.
	 * @throws IOException Thrown if an I/O error occurred.
	 * @throws UnsupportedEncodingException Thrown if the UTF-8 encoding not recognized.
	 * @see #setBomWritten(boolean)
	 */
	public String serialize(@Nonnull final Document document, @Nullable final String publicId, @Nullable final String systemId)
			throws UnsupportedEncodingException, IOException {
		//a public ID is only allowed if it is accompanied by a system ID
		checkArgument(publicId == null || systemId != null, "A system ID must be given with public ID `%s`.", publicId);
		final DOMImplementation domImplementation = document.getImplementation();
		final String documentElementName = document.getDocumentElement().getNodeName();
		final DocumentType replacementDocumentType = domImplementation.createDocumentType(documentElementName, publicId, systemId);
		return serialize(document, replacementDocumentType);
	}

	/**
	 * Serializes the specified document to a string using the UTF-8 encoding, using the given document type in place of the document's own.
	 * @apiNote Whether a byte order mark is written depends on the setting of {@link #isBomWritten()}; normally this should be set to false when writing to a
	 *          string.
	 * @implNote The document is serialized to an in-memory byte array; any {@link IOException} raised while doing so (including
	 *           {@link UnsupportedEncodingException}) is considered impossible and is rethrown wrapped in an {@link AssertionError}.
	 * @param document The XML document to serialize.
	 * @param documentType The document type to use for the document, or null if no document type should be used.
	 * @return A string containing the serialized XML data.
	 * @throws IllegalArgumentException if the document type has a public ID with no system ID.
	 * @throws IOException Thrown if an I/O error occurred.
	 * @throws UnsupportedEncodingException Thrown if the UTF-8 encoding not recognized.
	 * @see #setBomWritten(boolean)
	 */
	public String serialize(@Nonnull final Document document, @Nullable final DocumentType documentType) throws UnsupportedEncodingException, IOException {
		final ByteArrayOutputStream xmlBytes = new ByteArrayOutputStream(); //in-memory destination for the serialized XML
		try {
			serialize(document, documentType, xmlBytes, UTF_8);
		} catch(final IOException ioException) { //UTF-8 is always supported, and a byte array output stream never fails
			throw new AssertionError(ioException);
		}
		return xmlBytes.toString(UTF_8); //decode the collected bytes using the same encoding
	}

	/**
	 * Serializes the specified document fragment to a string using the UTF-8 encoding.
	 * @apiNote Whether a byte order mark is written depends on the setting of {@link #isBomWritten()}; normally this should be set to false when writing to a
	 *          string.
	 * @implNote The fragment is serialized to an in-memory byte array; any {@link IOException} raised while doing so (including
	 *           {@link UnsupportedEncodingException}) is considered impossible and is rethrown wrapped in an {@link AssertionError}.
	 * @param documentFragment The XML document fragment to serialize.
	 * @return A string containing the serialized XML data.
	 * @see #setBomWritten(boolean)
	 */
	public String serialize(@Nonnull final DocumentFragment documentFragment) {
		final ByteArrayOutputStream xmlBytes = new ByteArrayOutputStream(); //in-memory destination for the serialized XML
		try {
			serialize(documentFragment, xmlBytes, UTF_8);
		} catch(final IOException ioException) { //UTF-8 is always supported, and a byte array output stream never fails
			throw new AssertionError(ioException);
		}
		return xmlBytes.toString(UTF_8); //decode the collected bytes using the same encoding
	}

	/**
	 * Serializes the specified element to a string using the UTF-8 encoding.
	 * @apiNote Whether a byte order mark is written depends on the setting of {@link #isBomWritten()}; normally this should be set to false when writing to a
	 *          string.
	 * @implNote The element is serialized to an in-memory byte array; any {@link IOException} raised while doing so (including
	 *           {@link UnsupportedEncodingException}) is considered impossible and is rethrown wrapped in an {@link AssertionError}.
	 * @param element The XML element to serialize.
	 * @return A string containing the serialized XML data.
	 * @see #setBomWritten(boolean)
	 */
	public String serialize(@Nonnull final Element element) {
		final ByteArrayOutputStream xmlBytes = new ByteArrayOutputStream(); //in-memory destination for the serialized XML
		try {
			serialize(element, xmlBytes, UTF_8);
		} catch(final IOException ioException) { //UTF-8 is always supported, and a byte array output stream never fails
			throw new AssertionError(ioException);
		}
		return xmlBytes.toString(UTF_8); //decode the collected bytes using the same encoding
	}

	/**
	 * Serializes the content (all child nodes and their descendants) of a specified node to a string using the UTF-8 encoding. A newline will be appended at the
	 * end if {@link #isFormatted()} is turned on and {@link #isFormatEndNewline()} is enabled.
	 * @apiNote Whether a byte order mark is written depends on the setting of {@link #isBomWritten()}; normally this should be set to false when writing to a
	 *          string.
	 * @implNote The content is serialized to an in-memory byte array; any {@link IOException} raised while doing so (including
	 *           {@link UnsupportedEncodingException}) is considered impossible and is rethrown wrapped in an {@link AssertionError}.
	 * @param node The XML node the content of which to serialize—usually an element or document fragment.
	 * @return A string containing the serialized XML data.
	 * @see #setBomWritten(boolean)
	 */
	public String serializeContent(@Nonnull final Node node) {
		final ByteArrayOutputStream xmlBytes = new ByteArrayOutputStream(); //in-memory destination for the serialized XML
		try {
			serializeContent(node, xmlBytes, UTF_8);
		} catch(final IOException ioException) { //UTF-8 is always supported, and a byte array output stream never fails
			throw new AssertionError(ioException);
		}
		return xmlBytes.toString(UTF_8); //decode the collected bytes using the same encoding
	}

	/**
	 * Serializes the specified document, along with its own document type if any, to the given output stream using the UTF-8 encoding.
	 * @implSpec This method delegates to {@link #serialize(Document, DocumentType, OutputStream)} using the document type returned by
	 *           {@link Document#getDoctype()}.
	 * @param document The XML document to serialize.
	 * @param outputStream The stream into which the document should be serialized.
	 * @throws IllegalArgumentException if the document type has a public ID with no system ID.
	 * @throws IOException Thrown if an I/O error occurred.
	 */
	public void serialize(@Nonnull final Document document, @Nonnull final OutputStream outputStream) throws IOException {
		final DocumentType documentType = document.getDoctype(); //may be null if the document has no doctype
		serialize(document, documentType, outputStream);
	}

	/**
	 * Serializes the specified document to the given output stream using the UTF-8 encoding, substituting a document type built from the given identifiers.
	 * @implSpec The replacement document type is created using the node name of the document element as its name.
	 * @param document The XML document to serialize.
	 * @param publicId The external subset public identifier to use instead of that specified by the document, or null if none should be included.
	 * @param systemId The external subset system identifier to use instead of that specified by the document, or null if none should be included.
	 * @param outputStream The stream into which the document should be serialized.
	 * @throws IllegalArgumentException if a public ID was given with no system ID.
	 * @throws IOException Thrown if an I/O error occurred.
	 */
	public void serialize(@Nonnull final Document document, @Nullable final String publicId, @Nullable final String systemId,
			@Nonnull final OutputStream outputStream) throws IOException {
		//a public ID is only allowed if it is accompanied by a system ID
		checkArgument(publicId == null || systemId != null, "A system ID must be given with public ID `%s`.", publicId);
		final DOMImplementation domImplementation = document.getImplementation();
		final String documentElementName = document.getDocumentElement().getNodeName();
		final DocumentType replacementDocumentType = domImplementation.createDocumentType(documentElementName, publicId, systemId);
		serialize(document, replacementDocumentType, outputStream);
	}

	/**
	 * Serializes the specified document to the given output stream using the UTF-8 encoding.
	 * @implSpec This method delegates to {@link #serialize(Document, DocumentType, OutputStream, Charset)} with the UTF-8 charset.
	 * @param document The XML document to serialize.
	 * @param documentType The document type to use for the document, or null if no document type should be used.
	 * @param outputStream The stream into which the document should be serialized.
	 * @throws IllegalArgumentException if the document type has a public ID with no system ID.
	 * @throws IOException Thrown if an I/O error occurred.
	 */
	public void serialize(@Nonnull final Document document, @Nullable final DocumentType documentType, @Nonnull final OutputStream outputStream)
			throws IOException {
		serialize(document, documentType, outputStream, UTF_8); //serialize the document, defaulting to UTF-8
	}

	/**
	 * Serializes the specified document, along with its own document type if any, to the given output stream using the specified encoding. Any byte order mark
	 * specified in the character encoding will be written to the stream based upon {@link #isBomWritten()}. A newline will be appended at the end if
	 * {@link #isFormatted()} is turned on and {@link #isFormatEndNewline()} is enabled.
	 * @implSpec This method delegates to {@link #serialize(Document, DocumentType, OutputStream, Charset)} using the document type returned by
	 *           {@link Document#getDoctype()}.
	 * @param document The XML document to serialize.
	 * @param outputStream The stream into which the document should be serialized.
	 * @param charset The character set to use when serializing.
	 * @throws IllegalArgumentException if the document type has a public ID with no system ID.
	 * @throws IOException Thrown if an I/O error occurred.
	 * @throws UnsupportedEncodingException Thrown if the specified encoding is not recognized.
	 */
	public void serialize(@Nonnull final Document document, @Nonnull final OutputStream outputStream, @Nonnull final Charset charset)
			throws IOException, UnsupportedEncodingException {
		final DocumentType documentType = document.getDoctype(); //may be null if the document has no doctype
		serialize(document, documentType, outputStream, charset);
	}

	/**
	 * Serializes the specified document to the given output stream using the specified encoding, substituting a document type built from the given identifiers.
	 * Any byte order mark specified in the character encoding will be written to the stream based upon {@link #isBomWritten()}. A newline will be appended at
	 * the end if {@link #isFormatted()} is turned on and {@link #isFormatEndNewline()} is enabled.
	 * @apiNote This method replaces the given document's doctype altogether, even if null is indicated for both public and system identifiers.
	 * @implSpec The replacement document type is created using the node name of the document element as its name.
	 * @param document The XML document to serialize.
	 * @param publicId The external subset public identifier to use instead of that specified by the document, or null if none should be included.
	 * @param systemId The external subset system identifier to use instead of that specified by the document, or null if none should be included.
	 * @param outputStream The stream into which the document should be serialized.
	 * @param charset The character set to use when serializing.
	 * @throws IllegalArgumentException if a public ID was given with no system ID.
	 * @throws IOException Thrown if an I/O error occurred.
	 * @throws UnsupportedEncodingException Thrown if the specified encoding is not recognized.
	 */
	public void serialize(@Nonnull final Document document, @Nullable final String publicId, @Nullable final String systemId,
			@Nonnull final OutputStream outputStream, @Nonnull final Charset charset) throws IOException, UnsupportedEncodingException {
		//a public ID is only allowed if it is accompanied by a system ID
		checkArgument(publicId == null || systemId != null, "A system ID must be given with public ID `%s`.", publicId);
		final DOMImplementation domImplementation = document.getImplementation();
		final String documentElementName = document.getDocumentElement().getNodeName();
		final DocumentType replacementDocumentType = domImplementation.createDocumentType(documentElementName, publicId, systemId);
		serialize(document, replacementDocumentType, outputStream, charset);
	}

	/**
	 * Serializes the specified document to the given output stream using the specified encoding. Any byte order mark specified in the character encoding will be
	 * written to the stream based upon {@link #isBomWritten()}. A newline will be appended at the end if {@link #isFormatted()} is turned on and
	 * {@link #isFormatEndNewline()} is enabled.
	 * @implSpec This implementation performs the following steps in order: resets the indent level; writes any byte order mark; writes the prolog if
	 *           {@link #isPrologWritten()} is enabled; initializes the entity lookup and writes the document type, if any; writes processing instructions;
	 *           ensures namespace declarations on the document element if both {@link #isNamespacesDeclarationsEnsured()} and
	 *           {@link #isNamespacesDocumentElementDeclarations()} are enabled; writes the document element; and finally flushes the writer. The output stream is
	 *           not closed.
	 * @param document The XML document to serialize.
	 * @param documentType The document type to use for the document, or null if no document type should be used.
	 * @param outputStream The stream into which the document should be serialized.
	 * @param charset The character set to use when serializing.
	 * @throws IllegalArgumentException if the document type has a public ID with no system ID.
	 * @throws IOException Thrown if an I/O error occurred.
	 * @throws UnsupportedEncodingException Thrown if the specified encoding is not recognized.
	 */
	public void serialize(@Nonnull final Document document, @Nullable final DocumentType documentType, @Nonnull final OutputStream outputStream,
			@Nonnull final Charset charset) throws IOException, UnsupportedEncodingException {
		resetIndent();
		if(isBomWritten()) { //a BOM is written directly to the stream as raw bytes, before any character data
			final ByteOrderMark byteOrderMark = ByteOrderMark.forCharset(charset);
			if(byteOrderMark != null) { //not every charset has a byte order mark
				outputStream.write(byteOrderMark.getBytes());
			}
		}
		//TODO see if the writer automatically writes the byte order mark already for non-UTF-8
		final BufferedWriter xmlWriter = new BufferedWriter(new OutputStreamWriter(outputStream, charset));
		if(isPrologWritten()) {
			serializeProlog(xmlWriter, document, charset);
		}
		//the entity lookup is always initialized, so that at least the five XML entities will be included in the table
		if(documentType == null) {
			initializeEntityLookup(null);
		} else {
			initializeEntityLookup(documentType.getEntities()); //base the entity lookup on the entities of the document type
			serialize(xmlWriter, documentType);
		}
		serializeProcessingInstructions(xmlWriter, document);
		final Element rootElement = document.getDocumentElement();
		//if missing namespaces should be declared on the document element, process the entire document (i.e. deep) before writing anything
		if(isNamespacesDeclarationsEnsured() && isNamespacesDocumentElementDeclarations()) {
			ensureNamespaceDeclarations(rootElement, rootElement, true);
		}
		serialize(xmlWriter, rootElement); //write the document element and all elements below it
		if(isFormatted() && isFormatEndNewline()) {
			xmlWriter.append(getLineSeparator());
		}
		xmlWriter.flush(); //push buffered data through to the underlying stream without closing it
	}

	/**
	 * Serializes the specified document fragment to the given output stream using the UTF-8 encoding.
	 * @implSpec This implementation delegates to {@link #serialize(DocumentFragment, OutputStream, Charset)}.
	 * @param documentFragment The XML document fragment to serialize.
	 * @param outputStream The stream into which the document fragment should be serialized.
	 * @throws IOException Thrown if an I/O error occurred.
	 * @throws UnsupportedEncodingException Thrown if the UTF-8 encoding is not recognized.
	 */
	public void serialize(@Nonnull final DocumentFragment documentFragment, @Nonnull final OutputStream outputStream)
			throws UnsupportedEncodingException, IOException {
		final Charset defaultCharset = UTF_8; //UTF-8 is the default when no charset is requested
		serialize(documentFragment, outputStream, defaultCharset);
	}

	/**
	 * Serializes the child content of the specified document fragment to the given output stream using the specified encoding.
	 * @implSpec This implementation delegates to {@link #serializeContent(Node, OutputStream, Charset)}, which determines whether a byte order mark and a
	 *           trailing newline are written.
	 * @param documentFragment The XML document fragment to serialize.
	 * @param outputStream The stream into which the document fragment should be serialized.
	 * @param charset The charset to use when serializing.
	 * @throws IOException Thrown if an I/O error occurred.
	 * @throws UnsupportedEncodingException Thrown if the specified encoding is not recognized.
	 */
	public void serialize(@Nonnull final DocumentFragment documentFragment, @Nonnull final OutputStream outputStream, @Nonnull final Charset charset)
			throws IOException, UnsupportedEncodingException {
		//a fragment has no markup of its own, so only its children are written
		serializeContent(documentFragment, outputStream, charset);
	}

	/**
	 * Serializes the specified element and its children to the given output stream using the UTF-8 encoding.
	 * @implSpec This implementation delegates to {@link #serialize(Element, OutputStream, Charset)}.
	 * @param element The XML element to serialize.
	 * @param outputStream The stream into which the element should be serialized.
	 * @throws IOException Thrown if an I/O error occurred.
	 * @throws UnsupportedEncodingException Thrown if the UTF-8 encoding is not recognized.
	 */
	public void serialize(@Nonnull final Element element, @Nonnull final OutputStream outputStream) throws IOException, UnsupportedEncodingException {
		final Charset defaultCharset = UTF_8; //UTF-8 is the default when no charset is requested
		serialize(element, outputStream, defaultCharset);
	}

	/**
	 * Serializes the specified element and its children to the given output stream using the specified encoding. The byte order mark of the charset, if it has
	 * one, is written first if {@link #isBomWritten()} is enabled. A newline will be appended at the end if {@link #isFormatted()} is turned on and
	 * {@link #isFormatEndNewline()} is enabled. The output stream is flushed through the internal writer but is not closed.
	 * @param element The XML element to serialize.
	 * @param outputStream The stream into which the element should be serialized.
	 * @param charset The charset to use when serializing.
	 * @throws IOException Thrown if an I/O error occurred.
	 * @throws UnsupportedEncodingException Thrown if the specified encoding is not recognized.
	 */
	public void serialize(@Nonnull final Element element, @Nonnull final OutputStream outputStream, @Nonnull final Charset charset)
			throws IOException, UnsupportedEncodingException {
		resetIndent();
		//the BOM is looked up only if requested, and not every charset has one
		final ByteOrderMark byteOrderMark = isBomWritten() ? ByteOrderMark.forCharset(charset) : null;
		if(byteOrderMark != null) {
			outputStream.write(byteOrderMark.getBytes()); //the BOM goes to the stream as raw bytes, ahead of any encoded characters
		}
		final BufferedWriter bufferedWriter = new BufferedWriter(new OutputStreamWriter(outputStream, charset)); //TODO see if the writer automatically writes the byte order mark already for non-UTF-8
		serialize(bufferedWriter, element);
		if(isFormatted() && isFormatEndNewline()) {
			bufferedWriter.append(getLineSeparator());
		}
		bufferedWriter.flush(); //push out anything still buffered
	}

	/**
	 * Serializes the content (all child nodes and their descendants) of a specified node to the given output stream using the UTF-8 encoding.
	 * @implSpec This implementation delegates to {@link #serializeContent(Node, OutputStream, Charset)}.
	 * @param node The XML node the content of which to serialize—usually an element or document fragment.
	 * @param outputStream The stream into which the element content should be serialized.
	 * @throws IOException Thrown if an I/O error occurred.
	 * @throws UnsupportedEncodingException Thrown if the UTF-8 encoding is not recognized.
	 */
	protected void serializeContent(@Nonnull final Node node, @Nonnull final OutputStream outputStream) throws IOException, UnsupportedEncodingException {
		final Charset defaultCharset = UTF_8; //UTF-8 is the default when no charset is requested
		serializeContent(node, outputStream, defaultCharset);
	}

	/**
	 * Serializes the content (all child nodes and their descendants) of a specified node to the given output stream using the specified encoding. The byte order
	 * mark of the charset, if it has one, is written first if {@link #isBomWritten()} is enabled. A newline will be appended at the end if
	 * {@link #isFormatted()} is turned on and {@link #isFormatEndNewline()} is enabled. The output stream is flushed through the internal writer but is not
	 * closed.
	 * @param node The XML node the content of which to serialize—usually an element or document fragment.
	 * @param outputStream The stream into which the element content should be serialized.
	 * @param charset The charset to use when serializing.
	 * @throws IOException Thrown if an I/O error occurred.
	 * @throws UnsupportedEncodingException Thrown if the specified encoding is not recognized.
	 */
	protected void serializeContent(@Nonnull final Node node, @Nonnull final OutputStream outputStream, @Nonnull final Charset charset)
			throws IOException, UnsupportedEncodingException {
		resetIndent();
		//the BOM is looked up only if requested, and not every charset has one
		final ByteOrderMark byteOrderMark = isBomWritten() ? ByteOrderMark.forCharset(charset) : null;
		if(byteOrderMark != null) {
			outputStream.write(byteOrderMark.getBytes()); //the BOM goes to the stream as raw bytes, ahead of any encoded characters
		}
		final BufferedWriter bufferedWriter = new BufferedWriter(new OutputStreamWriter(outputStream, charset)); //TODO see if the writer automatically writes the byte order mark already for non-UTF-8
		serializeContent(bufferedWriter, node); //only the children are written, not the node itself
		if(isFormatted() && isFormatEndNewline()) {
			bufferedWriter.append(getLineSeparator());
		}
		bufferedWriter.flush(); //push out anything still buffered
	}

	/**
	 * Initializes the internal entity lookup with the entities defined in the specified map. The given entities will only be placed in the lookup table if the
	 * "useDefinedEntities" option is turned on, and then only entities whose replacement value is a single text node holding exactly one character will be
	 * used. Any previous contents of the lookup are replaced.
	 * @param entityMap The entity map which contains the entities to be placed in the internal lookup table, or <code>null</code> if entities are not
	 *          available, in which case no defined entities are placed in the lookup table.
	 * @throws IllegalArgumentException if a predefined entity was overridden using a different value.
	 * @see #isUseDefinedEntities()
	 * @see #setUseDefinedEntities(boolean)
	 */
	protected void initializeEntityLookup(@Nullable final NamedNodeMap entityMap) {
		final List<String> entityNameList = new ArrayList<>(); //the names of the entities we use, parallel to the character values
		final StringBuilder entityCharacterValueStringBuilder = new StringBuilder(); //one character per entity, at the same index as its name
		if(isUseDefinedEntities() && entityMap != null) { //if we were asked to use their entities and were given some
			final int entityCount = entityMap.getLength();
			for(int i = 0; i < entityCount; ++i) {
				final Entity entity = (Entity)entityMap.item(i);
				//entities store text content in child text nodes, not in the entity value; only a lone text child is usable
				if(entity.getChildNodes().getLength() != 1) {
					continue;
				}
				final Node entityChildNode = entity.getFirstChild();
				if(entityChildNode.getNodeType() != Node.TEXT_NODE) {
					continue;
				}
				final String entityValue = ((Text)entityChildNode).getData(); //the replacement value of the entity
				if(entityValue.length() != 1) { //the lookup only supports entities representing exactly one character
					continue;
				}
				final char c = entityValue.charAt(0);
				final String entityName = entity.getNodeName();
				//if they defined a predefined entity, make sure they didn't redefine it to something else
				checkArgument(!PREDEFINED_ENTITY_CHARACTERS.contains(c) || getPredefinedEntityName(c).equals(entityName),
						"Predefined entity character `%s` must not be redefined using entity name `%s`.", c, entityName);
				entityNameList.add(entityName);
				entityCharacterValueStringBuilder.append(c);
			}
		}
		entityNames = entityNameList.toArray(new String[entityNameList.size()]); //convert the entities in the list to an array
		entityCharacterValues = entityCharacterValueStringBuilder.toString(); //convert the values into one searchable string
	}

	/**
	 * Serializes the XML prolog (the XML declaration, with version and encoding) to the given appendable. The encoding written is the name of the given
	 * charset. If {@link #isFormatted()} is enabled, a line separator follows the declaration.
	 * @param appendable The destination into which the prolog should be written.
	 * @param document The XML document the prolog of which to serialize.
	 * @param charset The charset in use.
	 * @return The given appendable.
	 * @throws IOException Thrown if an I/O error occurred.
	 */
	protected Appendable serializeProlog(@Nonnull final Appendable appendable, @Nonnull final Document document, @Nonnull final Charset charset)
			throws IOException {
		//start of the XML declaration
		appendable.append(XML_DECL_START).append(SPACE_CHAR);
		//version information, quoted
		appendable.append(VERSIONINFO_NAME).append(EQUAL_CHAR).append(DOUBLE_QUOTE_CHAR).append(XML_VERSION).append(DOUBLE_QUOTE_CHAR);
		//encoding declaration, quoted
		appendable.append(SPACE_CHAR).append(ENCODINGDECL_NAME).append(EQUAL_CHAR).append(DOUBLE_QUOTE_CHAR).append(charset.name()).append(DOUBLE_QUOTE_CHAR);
		//end of the XML declaration
		appendable.append(XML_DECL_END);
		if(isFormatted()) {
			appendable.append(getLineSeparator());
		}
		return appendable;
	}

	/**
	 * Serializes the processing instructions that are direct children of the document to the given appendable, in document order. Other kinds of document
	 * child nodes are skipped.
	 * @param appendable The destination into which the processing instructions should be written.
	 * @param document The XML document the processing instructions of which to serialize.
	 * @return The given appendable.
	 * @throws IOException Thrown if an I/O error occurred.
	 */
	protected Appendable serializeProcessingInstructions(@Nonnull final Appendable appendable, @Nonnull final Document document) throws IOException {
		final NodeList documentChildren = document.getChildNodes();
		final int documentChildCount = documentChildren.getLength();
		for(int index = 0; index < documentChildCount; index++) {
			final Node documentChild = documentChildren.item(index);
			if(documentChild.getNodeType() != Node.PROCESSING_INSTRUCTION_NODE) { //only processing instructions are of interest here
				continue;
			}
			serialize(appendable, (ProcessingInstruction)documentChild);
		}
		return appendable;
	}

	/**
	 * Serializes the document type declaration to the given appendable. The declaration contains the document type name, followed by the external identifier if
	 * there is one: a public ID together with the system ID, or the system ID alone. If {@link #isFormatted()} is enabled, a line separator follows the
	 * declaration.
	 * @param appendable The destination into which the document type should be written.
	 * @param documentType The XML document type to serialize.
	 * @return The given appendable.
	 * @throws IllegalArgumentException if the document type has a public ID with no system ID.
	 * @throws IOException Thrown if an I/O error occurred.
	 */
	protected Appendable serialize(@Nonnull final Appendable appendable, @Nonnull final DocumentType documentType) throws IOException {
		final String publicId = documentType.getPublicId(); //may be null
		final String systemId = documentType.getSystemId(); //may be null
		checkArgument(publicId == null || systemId != null, "A system ID must be given with public ID `%s`.", publicId);
		appendable.append(DOCTYPE_DECL_START).append(SPACE_CHAR).append(documentType.getName());
		final boolean hasExternalId = publicId != null || systemId != null;
		if(hasExternalId) {
			appendable.append(SPACE_CHAR); //separate the identifiers from the doctype introduction
			if(publicId == null) { //system ID only
				appendable.append(SYSTEM_ID_NAME).append(SPACE_CHAR);
			} else { //public ID name and its public literal; the system literal follows without any keyword
				appendable.append(PUBLIC_ID_NAME).append(SPACE_CHAR).append(DOUBLE_QUOTE_CHAR).append(publicId).append(DOUBLE_QUOTE_CHAR).append(SPACE_CHAR);
			}
			//the check above guarantees there is a system ID whenever any identifier is present
			appendable.append(DOUBLE_QUOTE_CHAR).append(systemId).append(DOUBLE_QUOTE_CHAR);
		}
		appendable.append(DOCTYPE_DECL_END);
		if(isFormatted()) {
			appendable.append(getLineSeparator());
		}
		return appendable;
	}

	/**
	 * Serializes the given processing instruction to the given appendable.
	 * @param appendable The destination into which the processing instruction should be written.
	 * @param processingInstruction The XML processing instruction to serialize.
	 * @return The given appendable.
	 * @throws IOException Thrown if an I/O error occurred.
	 */
	protected Appendable serialize(@Nonnull final Appendable appendable, @Nonnull final ProcessingInstruction processingInstruction) throws IOException {
		//write the beginning of the processing instruction: "isContentFormatted.
	 * @param appendable The destination into which the element should be written.
	 * @param element The XML element to serialize.
	 * @param isContentFormatted Whether this element's contents, including any child nodes, should be formatted.
	 * @return The given appendable.
	 * @throws IOException Thrown if an I/O error occurred.
	 */
	protected Appendable serialize(@Nonnull final Appendable appendable, @Nonnull final Element element, @Nonnull boolean isContentFormatted) throws IOException {
		appendable.append(TAG_START).append(element.getNodeName()); //write the beginning of the start tag
		if(isNamespacesDeclarationsEnsured()) { //if we should ensure namespaces
			ensureNamespaceDeclarations(element, null, false); //make sure all namespaces are declared that just this element needs; if any are missing, we can't declare up the tree, as those nodes have already been serialized
		}
		/*TODO fix; this correctly doesn't add namespaces, to the tree itself, but not doing so means that the namespaces will just get added again lower down in the hierarchy
					//get the undeclared namespaces for this element and write them before the normal attributes are written
				final NameValuePair[] prefixNamespacePairs=XMLNamespaceProcessor.getUndeclaredNamespaces(element);
				for(int i=0; i
			appendable.append(SPACE_CHAR).append(END_TAG_IDENTIFIER_CHAR).append(TAG_END); //write the end of the empty element tag, with an extra space for HTML browser compatibility
		} else {
			appendable.append(TAG_END); //write the end of the start tag
			final boolean isChildContentFormatted = isContentFormatted && !getFormatProfile().isPreserved(element); //override formatting for preserved elements
			serializeContent(appendable, element, isChildContentFormatted);
			appendable.append(TAG_START).append(END_TAG_IDENTIFIER_CHAR).append(element.getNodeName()).append(TAG_END); //write the ending tag
		}
		return appendable;
	}

	/**
	 * A comparator for ordering namespace-declaring attributes specially.
	 * <ul>
	 * <li>The {@link XML#ATTRIBUTE_XMLNS} attribute is sorted first.</li>
	 * <li>Any attribute with the {@value XML#XMLNS_NAMESPACE_PREFIX} prefix is sorted based upon the case-insensitive local name (e.g. {@code xmlns:first},
	 * {@code xmlns:second}) and placed before any other prefixed attributes, but not before non-prefixed attributes.</li>
	 * </ul>
	 * <p>
	 * All other combinations compare as equal, so this comparator is intended to be combined with further comparators to produce a complete order.
	 * </p>
	 * @implNote {@link String#CASE_INSENSITIVE_ORDER} is used for comparison, which may not properly sort all languages but will produce desirable results for
	 *           virtually all attributes in use in the real world.
	 */
	private final static Comparator<Attr> XMLNS_ATTR_NAME_COMPARATOR = new Comparator<Attr>() {

		@Override
		public int compare(final Attr attr1, final Attr attr2) {
			//`xmlns`
			final String xmlnsName = ATTRIBUTE_XMLNS.getLocalName();
			final boolean isAttr1Xmlns = xmlnsName.equals(attr1.getName());
			final boolean isAttr2Xmlns = xmlnsName.equals(attr2.getName());
			if(isAttr1Xmlns && isAttr2Xmlns) {
				return 0; //both are `xmlns`
			} else if(isAttr1Xmlns) {
				return -1; //only the first is `xmlns`
			} else if(isAttr2Xmlns) {
				return 1; //only the second is `xmlns`
			}

			//`xmlns:foo`
			final String attr1Prefix = attr1.getPrefix();
			final String attr2Prefix = attr2.getPrefix();
			if(attr1Prefix != null && attr2Prefix != null) { //sort the namespace declarations but do _not_ place them before non-prefixed attributes
				final boolean isAttr1XmlnsPrefixed = XMLNS_NAMESPACE_PREFIX.equals(attr1Prefix);
				final boolean isAttr2XmlnsPrefixed = XMLNS_NAMESPACE_PREFIX.equals(attr2Prefix);
				if(isAttr1XmlnsPrefixed && isAttr2XmlnsPrefixed) {
					return CASE_INSENSITIVE_ORDER.compare(attr1.getLocalName(), attr2.getLocalName()); //both are `xmlns:foo`; sort by local name
				} else if(isAttr1XmlnsPrefixed) {
					return -1; //only the first is `xmlns:foo`
				} else if(isAttr2XmlnsPrefixed) {
					return 1; //only the second is `xmlns:foo`
				}
			}

			return 0; //any other combination is "equal" for the purposes of this comparator
		}
	};

	/**
	 * A general comparator for ordering attributes by name.
	 * <ol>
	 * <li>Names with no prefix are sorted first (e.g. {@code bar}, {@code foo:bar}).</li>
	 * <li>Names are then sorted by prefix in a case-insensitive order (e.g. {@code foo:bar}, {@code other:att}).</li>
	 * <li>Names are then sorted by local name in a case-insensitive order (e.g. {@code foo:first}, {@code foo:second}).</li>
	 * </ol>
	 * <p>
	 * An attribute that reports no local name (as the DOM specifies for attributes created with non-namespace-aware DOM Level 1 methods) is compared by its
	 * full name instead, so that sorting such attributes does not result in a {@link NullPointerException}.
	 * </p>
	 * @implNote {@link String#CASE_INSENSITIVE_ORDER} is used for comparison, which may not properly sort all languages but will produce desirable results for
	 *           virtually all attributes in use in the real world.
	 */
	private final static Comparator<Attr> ATTR_NAME_COMPARATOR = comparing(Attr::getPrefix, nullsFirst(CASE_INSENSITIVE_ORDER))
			.thenComparing(attr -> attr.getLocalName() != null ? attr.getLocalName() : attr.getName(), CASE_INSENSITIVE_ORDER);

	/**
	 * Serializes the attributes of the specified element to the given appendable.
	 * @apiNote The given attributes may not necessarily be exactly the attributes that would be retrieved directly from the element.
	 * @implSpec This implementation sorts attributes in the following order:
	 *           <ol>
	 *           <li>The {@link XML#ATTRIBUTE_XMLNS} attribute is sorted first.</li>
	 *           <li>Any attribute with the {@value XML#XMLNS_NAMESPACE_PREFIX} prefix is sorted based upon the case-insensitive local name (e.g.
	 *           {@code xmlns:first}, {@code xmlns:second}) and placed before any other prefixed attributes, but not before non-prefixed attributes.</li>
	 *           <li>Attributes are then ordered by {@link XmlFormatProfile#getAttributeOrder(Element)}, if that order is not empty.</li>
	 *           <li>Names with no prefix are sorted next (e.g. {@code bar}, {@code foo:bar}).</li>
	 *           <li>Names are then sorted by prefix in a case-insensitive order (e.g. {@code foo:bar}, {@code other:att}).</li>
	 *           <li>Names are then sorted by local name in a case-insensitive order (e.g. {@code foo:first}, {@code foo:second}).</li>
	 *           </ol>
	 * @param appendable The destination into which the attributes should be written.
	 * @param element The XML element the attributes of which to serialize.
	 * @param attributes The actual attributes to serialize; the stream is consumed by this method.
	 * @return The given appendable.
	 * @throws IOException Thrown if an I/O error occurred.
	 * @see #XMLNS_ATTR_NAME_COMPARATOR
	 * @see #ATTR_NAME_COMPARATOR
	 */
	protected Appendable serializeAttributes(@Nonnull final Appendable appendable, @Nonnull final Element element, @Nonnull Stream<Attr> attributes)
			throws IOException {
		//1. `xmlns` related attributes come first.
		Comparator<Attr> comparator = XMLNS_ATTR_NAME_COMPARATOR;
		//2. Explicitly ordered attributes come next.
		final List<NsName> order = getFormatProfile().getAttributeOrder(element);
		if(!order.isEmpty()) { //if we have a preferred order, use that order, placing explicitly ordered attributes first
			comparator = comparator.thenComparing(NsName::ofNode, explicitOrderFirst(order));
		}
		//3. Finally order the rest of the attributes in alphabetical order.
		comparator = comparator.thenComparing(ATTR_NAME_COMPARATOR);
		//iterate explicitly rather than using `forEach()` so that any `IOException` propagates directly to the caller
		final Iterator<Attr> sortedAttributes = attributes.sorted(comparator).iterator();
		while(sortedAttributes.hasNext()) {
			serializeAttribute(appendable, element, sortedAttributes.next()); //write this attribute
		}
		return appendable;
	}

	/**
	 * Determines whether the given element should be written using the XML empty-element tag form.
	 * @implSpec The default implementation returns <code>true</code> only if the given element has no child nodes.
	 * @param element The element being serialized.
	 * @return <code>true</code> if the XML empty-element tag form should be used to serialize the tag.
	 * @see <a href="https://www.w3.org/TR/xml/#sec-starttags">Extensible Markup Language (XML) 1.0 (Fifth Edition) § 3.1 Start-Tags, End-Tags, and
	 *      Empty-Element Tags</a>
	 */
	protected boolean isEmptyElementTag(@Nonnull final Element element) {
		final NodeList children = element.getChildNodes();
		final int childCount = children.getLength();
		return childCount == 0;
	}

	/**
	 * Serializes a single attribute of the specified element to the given appendable.
	 * @implSpec This implementation extracts the attribute name and value and delegates to {@link #serializeAttribute(Appendable, String, String)}.
	 * @implNote A subclass that overrides this method should normally call this version or manually delegate to
	 *           {@link #serializeAttribute(Appendable, String, String)} as appropriate.
	 * @param appendable The destination into which the attribute should be written.
	 * @param element The XML element the attribute of which to serialize.
	 * @param attribute The attribute to serialize.
	 * @return The given appendable.
	 * @throws IOException Thrown if an I/O error occurred.
	 */
	protected Appendable serializeAttribute(@Nonnull final Appendable appendable, @Nonnull final Element element, @Nonnull final Attr attribute)
			throws IOException {
		final String attributeName = attribute.getName();
		final String attributeValue = attribute.getValue();
		return serializeAttribute(appendable, attributeName, attributeValue);
	}

	/**
	 * Serializes the specified attribute name and value to the given appendable, preceded by a space. The value is delimited by double quotes unless it
	 * contains a double quote, in which case single quotes are used.
	 * @param appendable The destination into which the attribute should be written.
	 * @param attributeName The name of the XML attribute to serialize.
	 * @param attributeValue The value of the XML attribute to serialize.
	 * @return The given appendable.
	 * @throws IOException Thrown if an I/O error occurred.
	 */
	protected Appendable serializeAttribute(@Nonnull final Appendable appendable, @Nonnull final String attributeName, @Nonnull final String attributeValue)
			throws IOException {
		//prefer a double quote delimiter, switching to a single quote only if the value itself contains a double quote
		//TODO fix escaping---what if both double and single quotes are used?
		final boolean containsDoubleQuote = attributeValue.indexOf(DOUBLE_QUOTE_CHAR) >= 0;
		final char valueDelimiter = containsDoubleQuote ? SINGLE_QUOTE_CHAR : DOUBLE_QUOTE_CHAR;
		appendable.append(SPACE_CHAR).append(attributeName);
		appendable.append(EQUAL_CHAR).append(valueDelimiter);
		//the delimiter is passed along with the value in case the value has both a single and a double quote
		encodeContent(appendable, attributeValue, valueDelimiter);
		appendable.append(valueDelimiter);
		return appendable;
	}

	/**
	 * Serializes the content of the specified node to the given appendable, formatting the content if and only if {@link #isFormatted()} is enabled.
	 * @implSpec This implementation delegates to {@link #serializeContent(Appendable, Node, boolean)}.
	 * @param appendable The destination into which the element content should be written.
	 * @param node The XML node the content of which to serialize—usually an element or document fragment.
	 * @return The given appendable.
	 * @throws IOException Thrown if an I/O error occurred.
	 */
	protected Appendable serializeContent(@Nonnull final Appendable appendable, @Nonnull final Node node) throws IOException {
		final boolean isContentFormatted = isFormatted(); //the serializer-wide setting is the default
		return serializeContent(appendable, node, isContentFormatted);
	}

	/**
	 * The string form of the character to which any line break sequence is normalized during XML processing, produced by converting
	 * {@link XML#NORMALIZED_LINE_BREAK_CHAR} to a string.
	 * @see <a href="https://www.w3.org/TR/xml/#sec-line-ends">Extensible Markup Language (XML) 1.0 (Fifth Edition), § 2.11 End-of-Line Handling</a>
	 * @see XML#NORMALIZED_LINE_BREAK_CHAR
	 */
	private static final String NORMALIZED_LINE_BREAK_STRING = String.valueOf(NORMALIZED_LINE_BREAK_CHAR);

	/**
	 * Serializes the content of the specified node to the given appendable.
	 * 
	 * If formatting is enabled, child text content is normalized in the following manner:
	 * 
	 * 
	 * Subsequent text nodes are combined.
	 * Text space runs of {@link XmlFormatProfile#getSpaceNormalizationCharacters()} are normalized to a single space.
	 * Text is left trimmed if it is the first child of block content, or if it appears directly after a block element sibling or a break element
	 * sibling.
	 * Text is right trimmed if it is the last child of block content, or if it appears directly before a block element sibling.
	 * Any resulting empty string text nodes are ignored.
	 * 
	 * 
	 * If formatting is enabled, child nodes are formatted in the following way:
	 * 
	 * 
	 * A child element marked as {@link XmlFormatProfile#isBlock(Element)} have a line break appended before and after, and be indented.
	 * If a child node comes after a child causing a line break, it will be indented as well, whether it is a block element or not.
	 * 
If any child element was indented, the last child will have a line break appended after it.
	 * 
	 * @apiNote Attributes will always be formatted independent of the isContentFormatted.
	 * @apiNote End of line sequences will always be normalized to {@link #getLineSeparator()} even if isContentFormatted is disabled.
	 * @implNote The current implementation assumes that all newlines in preserved content have been normalized to {@link XML#NORMALIZED_LINE_BREAK_CHAR} as if
	 *           parsed using an XML processor. If a DOM tree is constructed manually with different non-normalized line endings, they may not get converted to
	 *           the currently set line separated.
	 * @param appendable The destination into which the element content should be written.
	 * @param node The XML node the content of which to serialize—usually an element or document fragment.
	 * @param isContentFormatted Whether the contents of this node, including any child nodes, should be formatted.
	 * @return The given appendable.
	 * @throws IOException Thrown if an I/O error occurred.
	 */
	protected Appendable serializeContent(@Nonnull final Appendable appendable, @Nonnull final Node node, final boolean isContentFormatted) throws IOException {
		final XmlFormatProfile formatProfile = getFormatProfile();

		/*
		 * Whether content will always begin with a newline if there are any child block elements.
		 * This is a possible future configurable setting.
		 */
		//TODO enable in future: final boolean settingAlwaysBeginningNewlineIfAnyBlockChildren = false;

		/*
		 * Whether content will always end with a newline before closing tag if there were any block children.
		 * Put another way, this setting determines whether ending tags are always aligned with beginning tags, unless the only lines breaks are from break elements.
		 * This is a possible future configurable setting.
		 */
		final boolean settingAlwaysEndingNewlineIfAnyBlockChildren = true;

		//gather information about the parent node
		final boolean isBlockElement = node instanceof Element && formatProfile.isBlock(((Element)node));
		final boolean isFlushElement = node instanceof Element && formatProfile.isFlush(((Element)node));

		//1. preprocess children

		//1a. dereference text and combine text runs, using strings; use an array list for faster lookup later; all text will be of type `String`
		final List