org.apache.jackrabbit.commons.xml.ToXmlContentHandler Maven / Gradle / Ivy
/*
* Licensed to the Apache Software Foundation (ASF) under one or more
* contributor license agreements. See the NOTICE file distributed with
* this work for additional information regarding copyright ownership.
* The ASF licenses this file to You under the Apache License, Version 2.0
* (the "License"); you may not use this file except in compliance with
* the License. You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
package org.apache.jackrabbit.commons.xml;
import java.io.IOException;
import java.io.OutputStream;
import java.io.OutputStreamWriter;
import java.io.StringWriter;
import java.io.UnsupportedEncodingException;
import java.io.Writer;
import org.xml.sax.Attributes;
import org.xml.sax.ContentHandler;
import org.xml.sax.SAXException;
import org.xml.sax.helpers.DefaultHandler;
/**
* Simple XML serializer. This content handler serializes the received
* SAX events as XML to a given {@link Writer} or {@link OutputStream}.
* The serialization assumes that the incoming SAX events are well-formed,
* i.e. that all elements are properly nested, that element and attribute
* names are valid and that no invalid XML characters are included. Assuming
* these preconditions are met, the result will be a well-formed XML stream.
*
* This serializer does not have any special support for namespaces. For
* example, namespace prefixes are declared in the resulting XML stream
* if and only if the corresponding "xmlns" attributes are explicitly
* included in the {@link Attributes} instances passed in
* {@link #startElement(String, String, String, Attributes)} calls.
*
* As a convenience this class inherits the {@link DefaultHandler} class
* instead of just the {@link ContentHandler} interface. This makes it
* easier to pass instances of this class to methods like
* {@link javax.xml.parsers.SAXParser#parse(String, DefaultHandler)} that
* expect a DefaultHandler instance instead of a ContentHandler.
*/
public class ToXmlContentHandler extends DefaultHandler {
/**
* The XML stream.
*/
private final Writer writer;
/**
* The data part of the <?xml?> processing instruction included
* at the beginning of the XML stream.
*/
private final String declaration;
/**
* Flag variable that is used to track whether a start tag has had it's
* closing ">" appended. Set to true
by the
* {@link #startElement(String, String, String, Attributes)} method that
* does not output the closing ">". If this flag is still set
* when the {#link {@link #endElement(String, String, String)}} method
* is called, then the method knows that the element is empty and can
* close it with "/>". Any other SAX event will cause the open start tag
* to be closed with a normal ">".
*
* @see #closeStartTagIfOpen()
*/
private boolean startTagIsOpen = false;
//--------------------------------------------------------< constructors >
/**
* Creates an XML serializer that writes the serialized XML stream
* to the given output stream using the given character encoding.
*
* @param stream XML output stream
* @param encoding character encoding
* @throws UnsupportedEncodingException if the encoding is not supported
*/
public ToXmlContentHandler(OutputStream stream, String encoding)
throws UnsupportedEncodingException {
this.writer = new OutputStreamWriter(stream, encoding);
this.declaration = "version=\"1.0\" encoding=\"" + encoding + "\"";
}
/**
* Creates an XML serializer that writes the serialized XML stream
* to the given output stream using the UTF-8 character encoding.
*
* @param stream XML output stream
*/
public ToXmlContentHandler(OutputStream stream) {
try {
this.writer = new OutputStreamWriter(stream, "UTF-8");
this.declaration = "version=\"1.0\" encoding=\"UTF-8\"";
} catch (UnsupportedEncodingException e) {
// should never happen
throw new IllegalStateException("UTF-8 is not supported!");
}
}
/**
* Creates an XML serializer that writes the serialized XML stream
* to the given writer.
*
* @param writer XML output stream
*/
public ToXmlContentHandler(Writer writer) {
this.writer = writer;
this.declaration = "version=\"1.0\"";
}
/**
* Creates an XML serializer that writes the serialized XML stream
* to an internal buffer. Use the {@link #toString()} method to access
* the serialized XML document.
*/
public ToXmlContentHandler() {
this(new StringWriter());
}
//-------------------------------------------------------------< private >
private void write(char[] ch, int start, int length, boolean attribute)
throws SAXException {
for (int i = start; i < start + length; i++) {
try {
if (ch[i] == '>') {
writer.write(">");
} else if (ch[i] == '<') {
writer.write("<");
} else if (ch[i] == '&') {
writer.write("&");
} else if (attribute && ch[i] == '"') {
writer.write(""");
} else if (attribute && ch[i] == '\'') {
writer.write("'");
} else {
writer.write(ch[i]);
}
} catch (IOException e) {
throw new SAXException(
"Failed to output XML character: " + ch[i], e);
}
}
}
private void closeStartTagIfOpen() throws SAXException {
if (startTagIsOpen) {
try {
writer.write(">");
} catch (IOException e) {
throw new SAXException(
"Failed to output XML bracket: >", e);
}
startTagIsOpen = false;
}
}
//------------------------------------------------------< ContentHandler >
/**
* Starts the XML serialization by outputting the <?xml?> header.
*/
public void startDocument() throws SAXException {
processingInstruction("xml", declaration);
}
/**
* Ends the XML serialization by flushing the output stream.
*/
public void endDocument() throws SAXException {
try {
writer.flush();
} catch (IOException e) {
throw new SAXException("Failed to flush XML output", e);
}
}
/**
* Serializes a processing instruction.
*/
public void processingInstruction(String target, String data)
throws SAXException {
closeStartTagIfOpen();
try {
writer.write("");
writer.write(target);
if (data != null) {
writer.write(" ");
writer.write(data);
}
writer.write("?>");
} catch (IOException e) {
throw new SAXException(
"Failed to output XML processing instruction: " + target, e);
}
}
/**
* Outputs the specified start tag with the given attributes.
*/
public void startElement(
String namespaceURI, String localName, String qName,
Attributes atts) throws SAXException {
closeStartTagIfOpen();
try {
writer.write("<");
writer.write(qName);
for (int i = 0; i < atts.getLength(); i++) {
writer.write(" ");
writer.write(atts.getQName(i));
writer.write("=\"");
char[] ch = atts.getValue(i).toCharArray();
write(ch, 0, ch.length, true);
writer.write("\"");
}
startTagIsOpen = true;
} catch (IOException e) {
throw new SAXException(
"Failed to output XML end tag: " + qName, e);
}
}
/**
* Escapes and outputs the given characters.
*/
public void characters(char[] ch, int start, int length)
throws SAXException {
closeStartTagIfOpen();
write(ch, start, length, false);
}
/**
* Escapes and outputs the given characters.
*/
public void ignorableWhitespace(char[] ch, int start, int length)
throws SAXException {
characters(ch, start, length);
}
/**
* Outputs the specified end tag.
*/
public void endElement(
String namespaceURI, String localName, String qName)
throws SAXException {
try {
if (startTagIsOpen) {
writer.write("/>");
startTagIsOpen = false;
} else {
writer.write("");
writer.write(qName);
writer.write(">");
}
} catch (IOException e) {
throw new SAXException(
"Failed to output XML end tag: " + qName, e);
}
}
//--------------------------------------------------------------< Object >
/**
* Returns the serialized XML document (assuming the default no-argument
* constructor was used).
*
* @return serialized XML document
*/
public String toString() {
return writer.toString();
}
}