All Downloads are FREE. Search and download functionalities are using the official Maven repository.

net.shibboleth.utilities.java.support.xml.BasicParserPool Maven / Gradle / Ivy

There is a newer version: 8.0.0
Show newest version
/*
 * Licensed to the University Corporation for Advanced Internet Development,
 * Inc. (UCAID) under one or more contributor license agreements.  See the
 * NOTICE file distributed with this work for additional information regarding
 * copyright ownership. The UCAID licenses this file to You under the Apache
 * License, Version 2.0 (the "License"); you may not use this file except in
 * compliance with the License.  You may obtain a copy of the License at
 *
 *    http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */

package net.shibboleth.utilities.java.support.xml;

import java.io.File;
import java.io.IOException;
import java.io.InputStream;
import java.io.Reader;
import java.lang.ref.SoftReference;
import java.util.Collections;
import java.util.HashMap;
import java.util.Map;
import java.util.Stack;

import javax.annotation.Nonnull;
import javax.annotation.Nullable;
import javax.annotation.concurrent.ThreadSafe;
import javax.xml.XMLConstants;
import javax.xml.parsers.DocumentBuilder;
import javax.xml.parsers.DocumentBuilderFactory;
import javax.xml.parsers.ParserConfigurationException;
import javax.xml.validation.Schema;

import net.shibboleth.utilities.java.support.annotation.constraint.NonnullElements;
import net.shibboleth.utilities.java.support.annotation.constraint.NotEmpty;
import net.shibboleth.utilities.java.support.annotation.constraint.NullableElements;
import net.shibboleth.utilities.java.support.annotation.constraint.Unmodifiable;
import net.shibboleth.utilities.java.support.component.AbstractInitializableComponent;
import net.shibboleth.utilities.java.support.component.ComponentInitializationException;
import net.shibboleth.utilities.java.support.component.ComponentSupport;
import net.shibboleth.utilities.java.support.logic.Constraint;
import net.shibboleth.utilities.java.support.primitive.StringSupport;

import org.slf4j.Logger;
import org.slf4j.LoggerFactory;
import org.w3c.dom.DOMImplementation;
import org.w3c.dom.Document;
import org.xml.sax.EntityResolver;
import org.xml.sax.ErrorHandler;
import org.xml.sax.InputSource;
import org.xml.sax.SAXException;

import com.google.common.base.Predicates;
import com.google.common.collect.ImmutableMap;
import com.google.common.collect.Maps;

//TODO(lajoie) see if we can use either java.util.concurrent or Guava 
// classes for the pool so we don't have to manage synchronicity

/**
 * A pool of JAXP 1.3 {@link DocumentBuilder}s.
 * 
 * This is a pool implementation of the caching factory variety, and as such imposes no upper bound on the number of
 * DocumentBuilders allowed to be concurrently checked out and in use. It does however impose a limit on the size of the
 * internal cache of idle builder instances via the value configured via {@link #setMaxPoolSize(int)}.
 * 
 * Builders retrieved from this pool may (but are not required to) be returned to the pool with the method
 * {@link #returnBuilder(DocumentBuilder)}.
 * 
 * References to builders are kept by way of {@link SoftReference} so that the garbage collector may reap the builders
 * if the system is running out of memory.
 * 
 * This implementation of {@link ParserPool} does not allow its properties to be modified once it has been initialized.
 */
@ThreadSafe
public class BasicParserPool extends AbstractInitializableComponent implements ParserPool {

    /** Class logger. */
    @Nonnull private final Logger log = LoggerFactory.getLogger(BasicParserPool.class);
    
    /** Name of security manager attribute, if any. */
    @Nullable private String securityManagerAttributeName;

    /** Factory used to create new builders. */
    private DocumentBuilderFactory builderFactory;

    /** Cache of document builders. */
    @Nonnull @NotEmpty private final Stack> builderPool;

    /** Max number of builders allowed in the pool. Default value: 5 */
    private int maxPoolSize;

    /** Builder attributes. */
    @Nonnull private Map builderAttributes;

    /** Whether the builders are coalescing. Default value: true */
    private boolean coalescing;

    /** Whether the builders expand entity references. Default value: false */
    private boolean expandEntityReferences;

    /** Builder features. */
    @Nonnull private Map builderFeatures;

    /** Whether the builders ignore comments. Default value: true */
    private boolean ignoreComments;

    /** Whether the builders ignore element content whitespace. Default value: true */
    private boolean ignoreElementContentWhitespace;

    /** Whether the builders are namespace aware. Default value: true */
    private boolean namespaceAware;

    /** Schema used to validate parsed content. */
    private Schema schema;

    /** Whether the builder should validate. Default value: false */
    private boolean dtdValidating;

    /** Whether the builders are XInclude aware. Default value: false */
    private boolean xincludeAware;

    /** Entity resolver used by builders. */
    private EntityResolver entityResolver;

    /** Error handler used by builders. */
    private ErrorHandler errorHandler;

    /** Constructor. */
    public BasicParserPool() {
        maxPoolSize = 5;
        builderPool = new Stack<>();
        builderAttributes = Collections.emptyMap();
        coalescing = true;
        expandEntityReferences = false;
        builderFeatures = buildDefaultFeatures();
        ignoreComments = true;
        ignoreElementContentWhitespace = true;
        namespaceAware = true;
        schema = null;
        dtdValidating = false;
        xincludeAware = false;
        errorHandler = new LoggingErrorHandler(log);
    }

    /** {@inheritDoc} */
    @Override
    @Nonnull public DocumentBuilder getBuilder() throws XMLParserException {
        checkInitializedNotDestroyed();

        DocumentBuilder builder = null;

        synchronized (builderPool) {
            while (builder == null && !builderPool.isEmpty()) {
                builder = builderPool.pop().get();
            }
        }

        // Will be null if either the stack was empty, or the SoftReference
        // has been garbage-collected
        if (builder == null) {
            builder = createBuilder();
        }

        if (builder != null) {
            prepareBuilder(builder);
            return new DocumentBuilderProxy(builder, this);
        }

        throw new XMLParserException("Unable to obtain a DocumentBuilder");
    }

//CheckStyle: ReturnCount OFF
    /** {@inheritDoc} */
    @Override public void returnBuilder(@Nullable final DocumentBuilder builder) {
        checkInitializedNotDestroyed();

        if (builder == null || !(builder instanceof DocumentBuilderProxy)) {
            return;
        }

        final DocumentBuilderProxy proxiedBuilder = (DocumentBuilderProxy) builder;
        if (proxiedBuilder.getOwningPool() != this) {
            return;
        }

        synchronized (proxiedBuilder) {
            if (proxiedBuilder.isReturned()) {
                return;
            }
            // Not strictly true in that it may not actually be pushed back
            // into the cache, depending on builderPool.size() below. But
            // that's ok. returnBuilder() shouldn't normally be called twice
            // on the same builder instance anyway, and it also doesn't matter
            // whether a builder is ever logically returned to the pool.
            proxiedBuilder.setReturned(true);
        }

        final DocumentBuilder unwrappedBuilder = proxiedBuilder.getProxiedBuilder();
        unwrappedBuilder.reset();
        final SoftReference builderReference = new SoftReference<>(unwrappedBuilder);

        synchronized (builderPool) {
            if (builderPool.size() < maxPoolSize) {
                builderPool.push(builderReference);
            }
        }
    }
  //CheckStyle: ReturnCount ON

    /** {@inheritDoc} */
    @Override
    @Nonnull public Document newDocument() throws XMLParserException {
        checkInitializedNotDestroyed();

        DocumentBuilder builder = null;
        final Document document;

        try {
            builder = getBuilder();
            document = builder.newDocument();
        } finally {
            returnBuilder(builder);
        }
        
        if (document == null) {
            throw new XMLParserException("DocumentBuilder returned a null Document");
        }

        return document;
    }

    /** {@inheritDoc} */
    @Override
    @Nonnull public Document parse(@Nonnull final InputStream input) throws XMLParserException {
        checkInitializedNotDestroyed();

        Constraint.isNotNull(input, "Input stream can not be null");

        final DocumentBuilder builder = getBuilder();
        try {
            final Document document = builder.parse(input);
            if (document == null) {
                throw new XMLParserException("DocumentBuilder parsed a null Document");
            }
            return document;
        } catch (final SAXException e) {
            throw new XMLParserException("Unable to parse inputstream, it contained invalid XML", e);
        } catch (final IOException e) {
            throw new XMLParserException("Unable to read data from input stream", e);
        } finally {
            returnBuilder(builder);
        }
    }

    /** {@inheritDoc} */
    @Override
    @Nonnull public Document parse(@Nonnull final Reader input) throws XMLParserException {
        checkInitializedNotDestroyed();

        Constraint.isNotNull(input, "Input reader can not be null");

        final DocumentBuilder builder = getBuilder();
        try {
            final Document document = builder.parse(new InputSource(input));
            if (document == null) {
                throw new XMLParserException("DocumentBuilder parsed a null Document");
            }
            return document;
        } catch (final SAXException e) {
            throw new XMLParserException("Invalid XML", e);
        } catch (final IOException e) {
            throw new XMLParserException("Unable to read XML from input stream", e);
        } finally {
            returnBuilder(builder);
        }
    }
    
    /**
     * Set the name of the builder attribute that controls the use of an XMLSecurityManager.
     * 
     * 

If set, this allows the pool to interrogate the factory to determine whether a * security manager is installed and log its class.<.p> * * @param name name of attribute */ public void setSecurityManagerAttributeName(@Nullable final String name) { checkNotInitializedNotDestroyed(); securityManagerAttributeName = StringSupport.trimOrNull(name); } /** * Gets the max number of builders the pool will hold. * * @return max number of builders the pool will hold */ public int getMaxPoolSize() { return maxPoolSize; } /** * Sets the max number of builders the pool will hold. * * @param newSize max number of builders the pool will hold */ public void setMaxPoolSize(final int newSize) { checkNotInitializedNotDestroyed(); maxPoolSize = (int) Constraint.isGreaterThan(0, newSize, "New maximum pool size must be greater than 0"); } /** * Gets the builder attributes used when creating builders. This collection is unmodifiable. * * @return builder attributes used when creating builders */ @Nonnull @NonnullElements public Map getBuilderAttributes() { return Collections.unmodifiableMap(builderAttributes); } /** * Sets the builder attributes used when creating builders. * * @param newAttributes builder attributes used when creating builders */ public void setBuilderAttributes(@Nullable @NullableElements final Map newAttributes) { checkNotInitializedNotDestroyed(); if (newAttributes == null) { builderAttributes = Collections.emptyMap(); } else { builderAttributes = new HashMap<>(Maps.filterKeys(newAttributes, Predicates.notNull())); } } /** * Gets whether the builders are coalescing. * * @return whether the builders are coalescing */ public boolean isCoalescing() { return coalescing; } /** * Sets whether the builders are coalescing. * * @param isCoalescing whether the builders are coalescing */ public void setCoalescing(final boolean isCoalescing) { checkNotInitializedNotDestroyed(); coalescing = isCoalescing; } /** * Gets whether builders expand entity references. * * @return whether builders expand entity references */ public boolean isExpandEntityReferences() { return expandEntityReferences; } /** * Sets whether builders expand entity references. * * @param expand whether builders expand entity references */ public void setExpandEntityReferences(final boolean expand) { checkNotInitializedNotDestroyed(); expandEntityReferences = expand; } /** * Gets the builders' features. This collection is unmodifiable. * * @return the builders' features */ @Nonnull @NonnullElements @Unmodifiable public Map getBuilderFeatures() { return builderFeatures; } /** * Sets the the builders' features. * * @param newFeatures the builders' features */ public void setBuilderFeatures(@Nullable @NullableElements final Map newFeatures) { checkNotInitializedNotDestroyed(); if (newFeatures == null) { builderFeatures = Collections.emptyMap(); } else { builderFeatures = ImmutableMap.copyOf(Maps.filterKeys(newFeatures, Predicates.notNull())); } } /** * Gets whether the builders ignore comments. * * @return whether the builders ignore comments */ public boolean isIgnoreComments() { return ignoreComments; } /** * Sets whether the builders ignore comments. * * @param ignore The ignoreComments to set. */ public void setIgnoreComments(final boolean ignore) { checkNotInitializedNotDestroyed(); ignoreComments = ignore; } /** * Get whether the builders ignore element content whitespace. * * @return whether the builders ignore element content whitespace */ public boolean isIgnoreElementContentWhitespace() { return ignoreElementContentWhitespace; } /** * Sets whether the builders ignore element content whitespace. * * @param ignore whether the builders ignore element content whitespace */ public void setIgnoreElementContentWhitespace(final boolean ignore) { checkNotInitializedNotDestroyed(); ignoreElementContentWhitespace = ignore; } /** * Gets whether the builders are namespace aware. * * @return whether the builders are namespace aware */ public boolean isNamespaceAware() { return namespaceAware; } /** * Sets whether the builders are namespace aware. * * @param isNamespaceAware whether the builders are namespace aware */ public void setNamespaceAware(final boolean isNamespaceAware) { checkNotInitializedNotDestroyed(); namespaceAware = isNamespaceAware; } /** * Gets the schema used to validate the XML document during the parsing process. * * @return schema used to validate the XML document during the parsing process */ @Nullable public Schema getSchema() { return schema; } /** * Sets the schema used to validate the XML document during the parsing process. * * @param newSchema schema used to validate the XML document during the parsing process */ public void setSchema(@Nullable final Schema newSchema) { checkNotInitializedNotDestroyed(); schema = newSchema; if (schema != null) { setNamespaceAware(true); builderAttributes.remove("http://java.sun.com/xml/jaxp/properties/schemaSource"); builderAttributes.remove("http://java.sun.com/xml/jaxp/properties/schemaLanguage"); } } /** * Gets the {@link EntityResolver}. * * @return the configured entity resolver, may be null */ @Nullable public EntityResolver getEntityResolver() { return entityResolver; } /** * Sets the {@link EntityResolver}. * * @param resolver the new entity resolver, may be null */ public void setEntityResolver(@Nullable final EntityResolver resolver) { checkNotInitializedNotDestroyed(); entityResolver = resolver; } /** * Gets the {@link ErrorHandler}. * * @return the configured error handler */ @Nonnull public ErrorHandler getErrorHandler() { return errorHandler; } /** * Sets the {@link ErrorHandler}. * * @param handler the new error handler */ public void setErrorHandler(@Nonnull final ErrorHandler handler) { checkNotInitializedNotDestroyed(); errorHandler = Constraint.isNotNull(handler, "ErrorHandler may not be null"); } /** * Gets whether the builders are validating. * * @return whether the builders are validating */ public boolean isDTDValidating() { return dtdValidating; } /** * Sets whether the builders are validating. * * @param isValidating whether the builders are validating */ public void setDTDValidating(final boolean isValidating) { checkNotInitializedNotDestroyed(); dtdValidating = isValidating; } /** * Gets whether the builders are XInclude aware. * * @return whether the builders are XInclude aware */ public boolean isXincludeAware() { return xincludeAware; } /** * Sets whether the builders are XInclude aware. * * @param isXIncludeAware whether the builders are XInclude aware */ public void setXincludeAware(final boolean isXIncludeAware) { checkNotInitializedNotDestroyed(); xincludeAware = isXIncludeAware; } /** * Gets the size of the current pool storage. * * @return current pool storage size */ protected int getPoolSize() { return builderPool.size(); } /** * Creates a new document builder. * * @return newly created document builder * * @throws XMLParserException thrown if their is a configuration error with the builder factory */ @Nonnull protected DocumentBuilder createBuilder() throws XMLParserException { checkInitializedNotDestroyed(); try { final DocumentBuilder builder = builderFactory.newDocumentBuilder(); return builder; } catch (final ParserConfigurationException e) { log.debug("Unable to create new document builder", e); throw new XMLParserException("Unable to create new document builder", e); } } /** * Prepare a document builder instance for use, before returning it from a checkout call. * * @param builder the document builder to prepare */ private void prepareBuilder(@Nonnull final DocumentBuilder builder) { if (entityResolver != null) { builder.setEntityResolver(entityResolver); } builder.setErrorHandler(errorHandler); } /** * Initialize the pool. * * @throws ComponentInitializationException thrown if pool can not be initialized, or if it is already initialized * {@inheritDoc} */ @Override protected void doInitialize() throws ComponentInitializationException { super.doInitialize(); try { final DocumentBuilderFactory newFactory = DocumentBuilderFactory.newInstance(); for (final Map.Entry attribute : builderAttributes.entrySet()) { newFactory.setAttribute(attribute.getKey(), attribute.getValue()); } for (final Map.Entry feature : builderFeatures.entrySet()) { if (feature.getKey() != null) { newFactory.setFeature(feature.getKey(), feature.getValue().booleanValue()); } } newFactory.setCoalescing(coalescing); newFactory.setExpandEntityReferences(expandEntityReferences); newFactory.setIgnoringComments(ignoreComments); newFactory.setIgnoringElementContentWhitespace(ignoreElementContentWhitespace); newFactory.setNamespaceAware(namespaceAware); newFactory.setSchema(schema); newFactory.setValidating(dtdValidating); newFactory.setXIncludeAware(xincludeAware); builderFactory = newFactory; if (securityManagerAttributeName != null) { final Object securityManager = builderFactory.getAttribute(securityManagerAttributeName); if (securityManager != null) { log.info("XMLSecurityManager of type '{}' is installed", securityManager.getClass().getName()); } else { log.warn( "No XMLSecurityManager installed, system may be vulnerable to XML processing vulnerabilities"); } } } catch (final ParserConfigurationException e) { throw new ComponentInitializationException("Unable to configure builder factory", e); } } /** {@inheritDoc} */ @Override protected void doDestroy() { builderPool.clear(); super.doDestroy(); } /** Helper method to test class state. */ private void checkInitializedNotDestroyed() { ComponentSupport.ifNotInitializedThrowUninitializedComponentException(this); ComponentSupport.ifDestroyedThrowDestroyedComponentException(this); } /** Helper method to test class state. */ private void checkNotInitializedNotDestroyed() { ComponentSupport.ifInitializedThrowUnmodifiabledComponentException(this); ComponentSupport.ifDestroyedThrowDestroyedComponentException(this); } /** * Build the default set of parser features to use. * *

These will be overriden by a call to {@link #setBuilderFeatures(Map)}.

* *

* The default features set are: *

    *
  • {@link javax.xml.XMLConstants#FEATURE_SECURE_PROCESSING} = true
  • *
  • http://apache.org/xml/features/disallow-doctype-decl = true
  • *
*

* * @return the default features map */ protected Map buildDefaultFeatures() { final HashMap features = new HashMap<>(); features.put(XMLConstants.FEATURE_SECURE_PROCESSING, true); features.put("http://apache.org/xml/features/disallow-doctype-decl", true); return features; } /** A proxy that prevents the manages document builders retrieved from the parser pool. */ protected class DocumentBuilderProxy extends DocumentBuilder { /** Builder being proxied. */ private final DocumentBuilder builder; /** Pool that owns this parser. */ private final ParserPool owningPool; /** Track accounting state of whether this builder has been returned to the owning pool. */ private boolean returned; /** * Constructor. * * @param target document builder to proxy * @param owner the owning pool */ public DocumentBuilderProxy(final DocumentBuilder target, final BasicParserPool owner) { owningPool = owner; builder = target; returned = false; } /** {@inheritDoc} */ @Override public DOMImplementation getDOMImplementation() { checkValidState(); return builder.getDOMImplementation(); } /** {@inheritDoc} */ @Override public Schema getSchema() { checkValidState(); return builder.getSchema(); } /** {@inheritDoc} */ @Override public boolean isNamespaceAware() { checkValidState(); return builder.isNamespaceAware(); } /** {@inheritDoc} */ @Override public boolean isValidating() { checkValidState(); return builder.isValidating(); } /** {@inheritDoc} */ @Override public boolean isXIncludeAware() { checkValidState(); return builder.isXIncludeAware(); } /** {@inheritDoc} */ @Override public Document newDocument() { checkValidState(); return builder.newDocument(); } /** {@inheritDoc} */ @Override public Document parse(final File f) throws SAXException, IOException { checkValidState(); return builder.parse(f); } /** {@inheritDoc} */ @Override public Document parse(final InputSource is) throws SAXException, IOException { checkValidState(); return builder.parse(is); } /** {@inheritDoc} */ @Override public Document parse(final InputStream is) throws SAXException, IOException { checkValidState(); return builder.parse(is); } /** {@inheritDoc} */ @Override public Document parse(final InputStream is, final String systemId) throws SAXException, IOException { checkValidState(); return builder.parse(is, systemId); } /** {@inheritDoc} */ @Override public Document parse(final String uri) throws SAXException, IOException { checkValidState(); return builder.parse(uri); } /** {@inheritDoc} */ @Override public void reset() { // ignore, entity resolver and error handler can't be changed } /** {@inheritDoc} */ @Override public void setEntityResolver(final EntityResolver er) { checkValidState(); return; } /** {@inheritDoc} */ @Override public void setErrorHandler(final ErrorHandler eh) { checkValidState(); return; } /** * Gets the pool that owns this parser. * * @return pool that owns this parser */ protected ParserPool getOwningPool() { return owningPool; } /** * Gets the proxied document builder. * * @return proxied document builder */ protected DocumentBuilder getProxiedBuilder() { return builder; } /** * Check accounting state as to whether this parser has been returned to the owning pool. * * @return true if parser has been returned to the owning pool, otherwise false */ protected boolean isReturned() { return returned; } /** * Set accounting state as to whether this parser has been returned to the owning pool. * * @param isReturned set true to indicate that parser has been returned to the owning pool */ protected void setReturned(final boolean isReturned) { returned = isReturned; } /** * Check whether the parser is in a valid and usable state, and if not, throw a runtime exception. */ protected void checkValidState() { if (isReturned()) { throw new IllegalStateException("DocumentBuilderProxy has already been returned to its owning pool"); } } /** {@inheritDoc} */ @Override protected void finalize() throws Throwable { super.finalize(); owningPool.returnBuilder(this); } } }




© 2015 - 2024 Weber Informatics LLC | Privacy Policy