net.sf.saxon.event.CommentStripper Maven / Gradle / Ivy
Go to download
Show more of this group Show more artifacts with this name
Show all versions of saxon-he Show documentation
Show all versions of saxon-he Show documentation
An OSGi bundle for Saxon-HE
////////////////////////////////////////////////////////////////////////////////////////////////////////////////////
// Copyright (c) 2013 Saxonica Limited.
// This Source Code Form is subject to the terms of the Mozilla Public License, v. 2.0.
// If a copy of the MPL was not distributed with this file, You can obtain one at http://mozilla.org/MPL/2.0/.
// This Source Code Form is "Incompatible With Secondary Licenses", as defined by the Mozilla Public License, v. 2.0.
////////////////////////////////////////////////////////////////////////////////////////////////////////////////////
package net.sf.saxon.event;
import net.sf.saxon.om.NodeName;
import net.sf.saxon.trans.XPathException;
import net.sf.saxon.tree.tiny.CompressedWhitespace;
import net.sf.saxon.tree.util.FastStringBuffer;
import net.sf.saxon.type.SchemaType;
/**
* The CommentStripper class is a filter that removes all comments and processing instructions.
* It also concatenates text nodes that are split by comments and PIs. This follows the rules for
* processing stylesheets; it is also used for removing comments and PIs from the tree seen
* by XPath expressions used to process XSD 1.1 assertions
* @author Michael H. Kay
*/
public class CommentStripper extends ProxyReceiver {
/*@Nullable*/ private CompressedWhitespace savedWhitespace = null;
private FastStringBuffer buffer = new FastStringBuffer(FastStringBuffer.MEDIUM);
/**
* Default constructor for use in subclasses
* @param next the next receiver in the pipeline
*/
public CommentStripper(Receiver next) {
super(next);
}
public void startElement (NodeName nameCode, SchemaType typeCode, int locationId, int properties)
throws XPathException {
flush();
nextReceiver.startElement(nameCode, typeCode, locationId, properties);
}
/**
* Callback interface for SAX: not for application use
*/
public void endElement () throws XPathException {
flush();
nextReceiver.endElement();
}
/**
* Handle a text node. Because we're often handling stylesheets on this path, whitespace text
* nodes will often be stripped but we can't strip them immediately because of the case
* [element] [!-- comment --]text[/element], where the space before the comment is considered
* significant. But it's worth going to some effort to avoid uncompressing the whitespace in the
* more common case, so that it can easily be detected and stripped downstream.
*/
public void characters (CharSequence chars, int locationId, int properties) throws XPathException {
if (chars instanceof CompressedWhitespace) {
if (buffer.length() == 0 && savedWhitespace == null) {
savedWhitespace = (CompressedWhitespace)chars;
} else {
((CompressedWhitespace)chars).uncompress(buffer);
}
} else {
if (savedWhitespace != null) {
savedWhitespace.uncompress(buffer);
savedWhitespace = null;
}
buffer.append(chars);
}
}
/**
* Remove comments
*/
public void comment (CharSequence chars, int locationId, int properties) {}
/**
* Remove processing instructions
*/
public void processingInstruction(String name, CharSequence data, int locationId, int properties) {}
/**
* Flush the character buffer
* @throws net.sf.saxon.trans.XPathException if a failure occurs writing the output
*/
private void flush() throws XPathException {
if (buffer.length() > 0) {
nextReceiver.characters(buffer, 0, 0);
} else if (savedWhitespace != null) {
nextReceiver.characters(savedWhitespace, 0, 0);
}
savedWhitespace = null;
buffer.setLength(0);
}
}