net.sf.saxon.resource.ActiveSAXSource Maven / Gradle / Ivy
Go to download
Show more of this group Show more artifacts with this name
Show all versions of Saxon-HE Show documentation
Show all versions of Saxon-HE Show documentation
The XSLT and XQuery Processor
////////////////////////////////////////////////////////////////////////////////////////////////////////////////////
// Copyright (c) 2018-2022 Saxonica Limited
// This Source Code Form is subject to the terms of the Mozilla Public License, v. 2.0.
// If a copy of the MPL was not distributed with this file, You can obtain one at http://mozilla.org/MPL/2.0/.
// This Source Code Form is "Incompatible With Secondary Licenses", as defined by the Mozilla Public License, v. 2.0.
////////////////////////////////////////////////////////////////////////////////////////////////////////////////////
package net.sf.saxon.resource;
import net.sf.saxon.Configuration;
import net.sf.saxon.event.Receiver;
import net.sf.saxon.event.ReceivingContentHandler;
import net.sf.saxon.expr.number.Numberer_en;
import net.sf.saxon.lib.*;
import net.sf.saxon.trans.SaxonErrorCode;
import net.sf.saxon.trans.UncheckedXPathException;
import net.sf.saxon.trans.XPathException;
import org.xml.sax.*;
import javax.xml.transform.sax.SAXSource;
import java.util.Map;
import java.util.function.Consumer;
/**
* This class extends the standard SAXSource class by providing a {@link #deliver(Receiver, ParseOptions)}
* method, meaning that Saxon can treat it just like any other {@link ActiveSource} implementation.
*
* This makes it easier to extract code from the product that's specific to the Java platform
* (in particular, support for SAX APIs).
*/
public class ActiveSAXSource extends SAXSource implements ActiveSource {
Consumer parserPool;
public ActiveSAXSource(XMLReader parser, InputSource source) {
super(parser, source);
}
/**
* Construct an ActiveSAXSource from a SAXSource
* @param source the input source object, whose properties are copied. The source must
* include a non-null XMLReader.
*/
public ActiveSAXSource(SAXSource source) throws IllegalArgumentException, XPathException {
if (source.getXMLReader() == null) {
throw new IllegalArgumentException("Supplied SAXSource contains no XMLReader");
}
setInputSource(source.getInputSource());
setXMLReader((source.getXMLReader()));
setSystemId(source.getSystemId());
}
public ActiveSAXSource(InputSource inputSource, Configuration config) {
setInputSource(inputSource);
setXMLReader(config.getSourceParser());
setSystemId(inputSource.getSystemId());
}
/**
* Supply a mechanism to recycle the XMLReader after use
* @param parserPool a place to return the parser after parsing is complete
*/
public void setParserPool(Consumer parserPool) {
this.parserPool = parserPool;
}
@Override
public void deliver(Receiver receiver, ParseOptions options) throws XPathException {
try {
Logger logger = receiver.getPipelineConfiguration().getConfiguration().getLogger();
XMLReader parser = getXMLReader();
//System.err.println("Using parser " + parser.getClass());
configureParser(parser); // Bug 5276
ReceivingContentHandler rch = new ReceivingContentHandler();
rch.setReceiver(receiver);
rch.setPipelineConfiguration(receiver.getPipelineConfiguration());
parser.setContentHandler(rch);
parser.setDTDHandler(rch);
parser.setProperty("http://xml.org/sax/properties/lexical-handler", rch);
ErrorHandler errorHandler = parser.getErrorHandler();
if (errorHandler == null) {
errorHandler = options.getErrorHandler();
if (errorHandler == null) {
if (options.getErrorReporter() != null) {
errorHandler = new StandardErrorHandler(options.getErrorReporter());
} else {
errorHandler = new StandardErrorHandler(receiver.getPipelineConfiguration().getConfiguration().makeErrorReporter());
}
}
parser.setErrorHandler(errorHandler);
}
if (!options.isExpandAttributeDefaults()) {
try {
parser.setFeature("http://xml.org/sax/features/use-attributes2", true);
} catch (SAXNotRecognizedException | SAXNotSupportedException err) {
// ignore the failure, we did our best (Xerces gives us an Attribute2 even though it
// doesn't recognize this request!)
}
}
boolean dtdRecover = options.getDTDValidationMode() == Validation.LAX;
Map parserFeatures = options.getParserFeatures();
Map parserProperties = options.getParserProperties();
if (parserFeatures != null) {
for (Map.Entry entry : parserFeatures.entrySet()) {
try {
String name = entry.getKey();
boolean value = entry.getValue();
if (name.equals("http://apache.org/xml/features/xinclude")) {
boolean tryAgain = false;
try {
// This feature name is supported in Xerces 2.9.0
parser.setFeature(name, value);
} catch (SAXNotRecognizedException | SAXNotSupportedException err) {
tryAgain = true;
}
if (tryAgain) {
try {
// This feature name is supported in the version of Xerces bundled with JDK 1.5
parser.setFeature(name + "-aware", value);
} catch (SAXNotRecognizedException err) {
throw new XPathException(namedParser(parser) +
" does not recognize request for XInclude processing", err);
} catch (SAXNotSupportedException err) {
throw new XPathException(namedParser(parser) +
" does not support XInclude processing", err);
}
}
} else {
parser.setFeature(name, value);
}
} catch (SAXNotRecognizedException err) {
// No warning if switching a feature off doesn't work: bugs 2540 and 2551
if (entry.getValue()) {
logger.warning(namedParser(parser) + " does not recognize the feature " + entry.getKey());
}
} catch (SAXNotSupportedException err) {
if (entry.getValue()) {
logger.warning(namedParser(parser) + " does not support the feature " + entry.getKey());
}
}
}
}
if (parserProperties != null) {
for (Map.Entry entry : parserProperties.entrySet()) {
try {
parser.setProperty(entry.getKey(), entry.getValue());
} catch (SAXNotRecognizedException err) {
logger.warning(namedParser(parser) + " does not recognize the property " + entry.getKey());
} catch (SAXNotSupportedException err) {
logger.warning(namedParser(parser) + " does not support the property " + entry.getKey());
}
}
}
boolean xInclude = options.isXIncludeAware();
if (xInclude) {
boolean tryAgain = false;
try {
// This feature name is supported in the version of Xerces bundled with JDK 1.5
parser.setFeature("http://apache.org/xml/features/xinclude-aware", true);
} catch (SAXNotRecognizedException | SAXNotSupportedException err) {
tryAgain = true;
}
if (tryAgain) {
try {
// This feature name is supported in Xerces 2.9.0
parser.setFeature("http://apache.org/xml/features/xinclude", true);
} catch (SAXNotRecognizedException err) {
throw new XPathException(namedParser(parser) +
" does not recognize request for XInclude processing", err);
} catch (SAXNotSupportedException err) {
throw new XPathException(namedParser(parser) +
" does not support XInclude processing", err);
}
}
}
//System.err.println("Parse " + getSystemId());
///////////////////////////////
parser.parse(getInputSource());
///////////////////////////////
if (errorHandler instanceof StandardErrorHandler) {
int errs = ((StandardErrorHandler) errorHandler).getFatalErrorCount();
if (errs > 0) {
throw new XPathException("The XML parser reported " + errs + (errs == 1 ? " error" : " errors"));
}
errs = ((StandardErrorHandler) errorHandler).getErrorCount();
if (errs > 0) {
String message = "The XML parser reported " + new Numberer_en().toWords(errs).toLowerCase() +
" validation error" + (errs == 1 ? "" : "s");
if (dtdRecover) {
message += ". Processing continues, because recovery from validation errors was requested";
logger.warning(message);
} else {
throw new XPathException(message);
}
}
}
if (parserPool != null) {
parserPool.accept(getXMLReader());
}
} catch (XPathException xpe) {
throw xpe;
} catch (UncheckedXPathException uxpe) {
throw new XPathException(uxpe);
} catch (SAXException err) {
Exception nested = err.getException();
if (nested instanceof XPathException) {
throw (XPathException) nested;
} else if (nested instanceof RuntimeException) {
throw (RuntimeException) nested;
} else {
XPathException de = new XPathException(err);
de.setErrorCode(SaxonErrorCode.SXXP0003);
de.setHasBeenReported(true);
throw de;
}
} catch (java.io.IOException err) {
throw new XPathException("I/O error reported by XML parser processing " +
getSystemId() + ": " + err.getMessage(), err);
} catch (Exception x) {
x.printStackTrace();
throw new IllegalStateException();
}
}
// Commented out code is the old code from Sender.java. Perhaps we need to retain more of this
// logic in the deliver() method?
// /**
// * Send the contents of a SAXSource to a given Receiver
// *
// * @param source the SAXSource
// * @param receiver the destination Receiver
// * @param options options for parsing the SAXSource
// * @throws XPathException if any failure occurs processing the Source object
// */
//
// private static void sendSAXSource(SAXSource source, Receiver receiver, ParseOptions options)
// throws XPathException {
// PipelineConfiguration pipe = receiver.getPipelineConfiguration();
// XMLReader parser = source.getXMLReader();
// boolean reuseParser = false;
// final Configuration config = pipe.getConfiguration();
// ErrorReporter listener = options.getErrorReporter();
// if (listener == null) {
// listener = pipe.getErrorReporter();
// }
// ErrorHandler errorHandler = options.getErrorHandler();
// if (errorHandler == null) {
// errorHandler = new StandardErrorHandler(listener);
// }
// if (parser == null) {
// parser = options.obtainXMLReader();
// }
// if (parser == null) {
// SAXSource ss = new SAXSource();
// ss.setInputSource(source.getInputSource());
// ss.setSystemId(source.getSystemId());
// parser = config.getSourceParser();
// parser.setErrorHandler(errorHandler);
// if (options.getEntityResolver() != null && parser.getEntityResolver() == null) {
// parser.setEntityResolver(options.getEntityResolver());
// }
// ss.setXMLReader(parser);
// source = ss;
// reuseParser = true;
// } else {
// // user-supplied parser: ensure that it meets the namespace requirements
// configureParser(parser);
// if (parser.getErrorHandler() == null) {
// parser.setErrorHandler(errorHandler);
// }
// }
//
// if (!pipe.getParseOptions().isExpandAttributeDefaults()) {
// try {
// parser.setFeature("http://xml.org/sax/features/use-attributes2", true);
// } catch (SAXNotRecognizedException | SAXNotSupportedException err) {
// // ignore the failure, we did our best (Xerces gives us an Attribute2 even though it
// // doesn't recognize this request!)
// }
// }
//
// boolean dtdRecover = options.getDTDValidationMode() == Validation.LAX;
//
// Map parserFeatures = options.getParserFeatures();
// Map parserProperties = options.getParserProperties();
//
// if (parserFeatures != null) {
// for (Map.Entry entry : parserFeatures.entrySet()) {
// try {
// String name = entry.getKey();
// boolean value = entry.getValue();
// if (name.equals("http://apache.org/xml/features/xinclude")) {
// boolean tryAgain = false;
// try {
// // This feature name is supported in Xerces 2.9.0
// parser.setFeature(name, value);
// } catch (SAXNotRecognizedException | SAXNotSupportedException err) {
// tryAgain = true;
// }
// if (tryAgain) {
// try {
// // This feature name is supported in the version of Xerces bundled with JDK 1.5
// parser.setFeature(name + "-aware", value);
// } catch (SAXNotRecognizedException err) {
// throw new XPathException(namedParser(parser) +
// " does not recognize request for XInclude processing", err);
// } catch (SAXNotSupportedException err) {
// throw new XPathException(namedParser(parser) +
// " does not support XInclude processing", err);
// }
// }
// } else {
// parser.setFeature(entry.getKey(), entry.getValue());
// }
// } catch (SAXNotRecognizedException err) {
// // No warning if switching a feature off doesn't work: bugs 2540 and 2551
// if (entry.getValue()) {
// config.getLogger().warning(namedParser(parser) + " does not recognize the feature " + entry.getKey());
// }
// } catch (SAXNotSupportedException err) {
// if (entry.getValue()) {
// config.getLogger().warning(namedParser(parser) + " does not support the feature " + entry.getKey());
// }
// }
// }
// }
//
// if (parserProperties != null) {
// for (Map.Entry entry : parserProperties.entrySet()) {
// try {
// parser.setProperty(entry.getKey(), entry.getValue());
// } catch (SAXNotRecognizedException err) {
// config.getLogger().warning(namedParser(parser) + " does not recognize the property " + entry.getKey());
// } catch (SAXNotSupportedException err) {
// config.getLogger().warning(namedParser(parser) + " does not support the property " + entry.getKey());
// }
//
// }
// }
//
// boolean xInclude = options.isXIncludeAware();
// if (xInclude) {
// boolean tryAgain = false;
// try {
// // This feature name is supported in the version of Xerces bundled with JDK 1.5
// parser.setFeature("http://apache.org/xml/features/xinclude-aware", true);
// } catch (SAXNotRecognizedException | SAXNotSupportedException err) {
// tryAgain = true;
// }
// if (tryAgain) {
// try {
// // This feature name is supported in Xerces 2.9.0
// parser.setFeature("http://apache.org/xml/features/xinclude", true);
// } catch (SAXNotRecognizedException err) {
// throw new XPathException(namedParser(parser) +
// " does not recognize request for XInclude processing", err);
// } catch (SAXNotSupportedException err) {
// throw new XPathException(namedParser(parser) +
// " does not support XInclude processing", err);
// }
// }
// }
//// if (config.isTiming()) {
//// System.err.println("Using SAX parser " + parser);
//// }
//
//
// receiver = Sender.makeValidator(receiver, source.getSystemId(), options);
//
// // Reuse the previous ReceivingContentHandler if possible (it contains a useful cache of names)
//
// ReceivingContentHandler ce;
// final ContentHandler ch = parser.getContentHandler();
// if (ch instanceof ReceivingContentHandler && config.isCompatible(((ReceivingContentHandler) ch).getConfiguration())) {
// ce = (ReceivingContentHandler) ch;
// ce.reset();
// } else {
// ce = new ReceivingContentHandler();
// parser.setContentHandler(ce);
// parser.setDTDHandler(ce);
// try {
// parser.setProperty("http://xml.org/sax/properties/lexical-handler", ce);
// } catch (SAXNotSupportedException | SAXNotRecognizedException err) {
// // this just means we won't see the comments
// // ignore the error
// }
// }
//// TracingFilter tf = new TracingFilter();
//// tf.setUnderlyingReceiver(receiver);
//// tf.setPipelineConfiguration(pipe);
//// receiver = tf;
//
// ce.setReceiver(receiver);
// ce.setPipelineConfiguration(pipe);
//
// try {
// parser.parse(source.getInputSource());
// } catch (SAXException err) {
// Exception nested = err.getException();
// if (nested instanceof XPathException) {
// throw (XPathException) nested;
// } else if (nested instanceof RuntimeException) {
// throw (RuntimeException) nested;
// } else {
// // Check for a couple of conditions where the error reporting needs to be improved.
// // (a) The built-in parser for JDK 1.6 has a nasty habit of not notifying errors to the ErrorHandler
// // (b) Sometimes (e.g. when given an empty file), the SAXException has no location information
// if ((errorHandler instanceof StandardErrorHandler && ((StandardErrorHandler) errorHandler).getFatalErrorCount() == 0) ||
// (err instanceof SAXParseException && ((SAXParseException) err).getSystemId() == null && source.getSystemId() != null)) {
// //
// XPathException de = new XPathException("Error reported by XML parser processing " +
// source.getSystemId() + ": " + err.getMessage(), err);
// listener.report(new XmlProcessingException(de));
// de.setHasBeenReported(true);
// throw de;
// } else {
// XPathException de = new XPathException(err);
// de.setErrorCode(SaxonErrorCode.SXXP0003);
// de.setHasBeenReported(true);
// throw de;
// }
// }
// } catch (java.io.IOException err) {
// throw new XPathException("I/O error reported by XML parser processing " +
// source.getSystemId() + ": " + err.getMessage(), err);
// }
// if (errorHandler instanceof StandardErrorHandler) {
// int errs = ((StandardErrorHandler) errorHandler).getFatalErrorCount();
// if (errs > 0) {
// throw new XPathException("The XML parser reported " + errs + (errs == 1 ? " error" : " errors"));
// }
// errs = ((StandardErrorHandler) errorHandler).getErrorCount();
// if (errs > 0) {
// String message = "The XML parser reported " + new Numberer_en().toWords(errs).toLowerCase() +
// " validation error" + (errs == 1 ? "" : "s");
// if (dtdRecover) {
// message += ". Processing continues, because recovery from validation errors was requested";
// XmlProcessingIncident warning = new XmlProcessingIncident(message).asWarning();
// listener.report(warning);
// } else {
// throw new XPathException(message);
// }
// }
// }
// if (reuseParser) {
// config.reuseSourceParser(parser);
// }
// }
private static String namedParser(XMLReader parser) {
return "Selected XML parser " + parser.getClass().getName();
}
/**
* Configure a SAX parser to ensure it has the correct namespace properties set
*
* @param parser the parser to be configured
* @throws XPathException if the parser cannot be configured to the
* required settings (namespaces=true, namespace-prefixes=false). Note that the SAX
* specification requires every XMLReader to support these settings, so this error implies
* that the XMLReader is non-conformant; this is not uncommon in cases where the XMLReader
* is user-written.
*/
public static void configureParser(XMLReader parser) throws XPathException {
try {
parser.setFeature("http://xml.org/sax/features/namespaces", true);
} catch (SAXNotSupportedException err) { // SAX2 parsers MUST support this feature!
throw new XPathException(
"The SAX2 parser " + parser.getClass().getName() +
" does not recognize the 'namespaces' feature", err);
} catch (SAXNotRecognizedException err) {
throw new XPathException(
"The SAX2 parser " + parser.getClass().getName() +
" does not support setting the 'namespaces' feature to true", err);
}
try {
parser.setFeature("http://xml.org/sax/features/namespace-prefixes", false);
} catch (SAXNotSupportedException err) { // SAX2 parsers MUST support this feature!
throw new XPathException(
"The SAX2 parser " + parser.getClass().getName() +
" does not recognize the 'namespace-prefixes' feature", err);
} catch (SAXNotRecognizedException err) {
throw new XPathException(
"The SAX2 parser " + parser.getClass().getName() +
" does not support setting the 'namespace-prefixes' feature to false", err);
}
}
}