 
                        
        
                        
        com.ctc.wstx.dtd.DTDSubsetImpl Maven / Gradle / Ivy
/* Woodstox XML processor
 *
 * Copyright (c) 2004- Tatu Saloranta, [email protected]
 *
 * Licensed under the License specified in file LICENSE, included with
 * the source code.
 * You may not use this file except in compliance with the License.
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */
package com.ctc.wstx.dtd;
import java.text.MessageFormat;
import java.util.*;
import javax.xml.stream.Location;
import javax.xml.stream.XMLStreamException;
import javax.xml.stream.events.NotationDeclaration;
import org.codehaus.stax2.validation.*;
import com.ctc.wstx.cfg.ErrorConsts;
import com.ctc.wstx.ent.EntityDecl;
import com.ctc.wstx.exc.WstxParsingException;
import com.ctc.wstx.sr.InputProblemReporter;
import com.ctc.wstx.util.DataUtil;
import com.ctc.wstx.util.PrefixedName;
/**
 * The default implementation of {@link DTDSubset}
 */
public final class DTDSubsetImpl
    extends DTDSubset
{
    /**
     * Whether this subset is cachable. Only those external
     * subsets that do not refer to PEs defined by internal subsets (or
     * GEs via default attribute value expansion) are cachable.
     */
    final boolean mIsCachable;
    /**
     * Whether this subset has full validation information; and
     * consequently whether it will do actual validation, or just allow
     * access to type information, notations, entities, and add default
     * attribute values.
     */
    final boolean mFullyValidating;
    /**
     * Flag that indicates whether any of the elements declarared
     * has any attribute default values for namespace pseudo-attributes.
     */
    final boolean mHasNsDefaults;
    /*
    //////////////////////////////////////////////////////
    // Entity information
    //////////////////////////////////////////////////////
     */
    /**
     * Map (name-to-EntityDecl) of general entity declarations (internal,
     * external) for this DTD subset.
     */
    final HashMap mGeneralEntities;
    /**
     * Lazily instantiated List that contains all notations from
     * {@link #mGeneralEntities} (preferably in their declaration order; depends
     * on whether platform, ie. JDK version, has insertion-ordered
     * Maps available), used by DTD event Objects.
     */
    volatile transient List mGeneralEntityList = null;
    /**
     * Set of names of general entities references by this subset. Note that
     * only those GEs that are referenced by default attribute value
     * definitions count, since GEs in text content are only expanded
     * when reading documents, but attribute default values are expanded
     * when reading DTD subset itself.
     *
     * Needed
     * for determinining if external subset materially depends on definitions
     * from internal subset; if so, such subset is not cachable.
     * This also
     * means that information is not stored for non-cachable instance.
     */
    final Set mRefdGEs;
    // // // Parameter entity info:
    /**
     * Map (name-to-WEntityDeclaration) that contains all parameter entities
     * defined by this subset. May be empty if such information will not be
     * needed for use; for example, external subset's definitions are needed,
     * nor are combined DTD set's.
     */
    final HashMap mDefinedPEs;
    /**
     * Set of names of parameter entities references by this subset. Needed
     * when determinining if external subset materially depends on definitions
     * from internal subset, which is needed to know when caching external
     * subsets.
     *
     * Needed
     * for determinining if external subset materially depends on definitions
     * from internal subset; if so, such subset is not cachable.
     * This also
     * means that information is not stored for non-cachable instance.
     */
    final Set mRefdPEs;
    /*
    //////////////////////////////////////////////////////
    // Notation definitions:
    //////////////////////////////////////////////////////
     */
    /**
     * Map (name-to-NotationDecl) that this subset has defined.
     */
    final HashMap mNotations;
    /**
     * Lazily instantiated List that contains all notations from
     * {@link #mNotations} (preferably in their declaration order; depends
     * on whether platform, ie. JDK version, has insertion-ordered
     * Maps available), used by DTD event Objects.
     */
    transient List mNotationList = null;
    /*
    //////////////////////////////////////////////////////
    // Element definitions:
    //////////////////////////////////////////////////////
     */
    final HashMap mElements;
    /*
    //////////////////////////////////////////////////////
    // Life-cycle
    //////////////////////////////////////////////////////
     */
    private DTDSubsetImpl(boolean cachable,
                          HashMap genEnt, Set refdGEs,
                          HashMap paramEnt, Set peRefs,
                          HashMap notations, HashMap elements,
                          boolean fullyValidating)
    {
        mIsCachable = cachable;
        mGeneralEntities = genEnt;
        mRefdGEs = refdGEs;
        mDefinedPEs = paramEnt;
        mRefdPEs = peRefs;
        mNotations = notations;
        mElements = elements;
        mFullyValidating = fullyValidating;
        boolean anyNsDefs = false;
        if (elements != null) {
        	for (DTDElement elem : elements.values()) {
                if (elem.hasNsDefaults()) {
                    anyNsDefs = true;
                    break;
                }
            }
        }
        mHasNsDefaults = anyNsDefs;
    }
    public static DTDSubsetImpl constructInstance(boolean cachable,
                                                  HashMap genEnt, Set refdGEs,
                                                  HashMap paramEnt, Set refdPEs,
                                                  HashMap notations,
                                                  HashMap elements,
                                                  boolean fullyValidating)
    {
        return new DTDSubsetImpl(cachable, genEnt, refdGEs,
                                 paramEnt, refdPEs,
                                 notations, elements,
                                 fullyValidating);
    }
    /**
     * Method that will combine definitions from internal and external subsets,
     * producing a single DTD set.
     */
    @Override
    public DTDSubset combineWithExternalSubset(InputProblemReporter rep, DTDSubset extSubset)
        throws XMLStreamException
    {
        /* First let's see if we can just reuse GE Map used by int or ext
         * subset; (if only one has contents), or if not, combine them.
         */
        HashMap ge1 = getGeneralEntityMap();
        HashMap ge2 = extSubset.getGeneralEntityMap();
        if (ge1 == null || ge1.isEmpty()) {
            ge1 = ge2;
        } else {
            if (ge2 != null && !ge2.isEmpty()) {
                /* Internal subset Objects are never shared or reused (and by
                 * extension, neither are objects they contain), so we can just
                 * modify GE map if necessary
                 */
                combineMaps(ge1, ge2);
            }
        }
        // Ok, then, let's combine notations similarly
        HashMap n1 = getNotationMap();
        HashMap n2 = extSubset.getNotationMap();
        if (n1 == null || n1.isEmpty()) {
            n1 = n2;
        } else {
            if (n2 != null && !n2.isEmpty()) {
                /* First; let's make sure there are no colliding notation
                 * definitions: it's an error to try to redefine notations.
                 */
                checkNotations(n1, n2);
                /* Internal subset Objects are never shared or reused (and by
                 * extension, neither are objects they contain), so we can just
                 * modify notation map if necessary
                 */
                combineMaps(n1, n2);
            }
        }
        // And finally elements, rather similarly:
        HashMap e1 = getElementMap();
        HashMap e2 = extSubset.getElementMap();
        if (e1 == null || e1.isEmpty()) {
            e1 = e2;
        } else {
            if (e2 != null && !e2.isEmpty()) {
                /* Internal subset Objects are never shared or reused (and by
                 * extension, neither are objects they contain), so we can just
                 * modify element map if necessary
                 */
                combineElements(rep, e1, e2);
            }
        }
        /* Combos are not cachable, and because of that, there's no point
         * in storing any PE info either.
         */
        return constructInstance(false, ge1, null, null, null, n1, e1,
                                 mFullyValidating);
    }
    /*
    //////////////////////////////////////////////////////
    // XMLValidationSchema implementation
    //////////////////////////////////////////////////////
     */
    @Override
    public XMLValidator createValidator(ValidationContext ctxt)
        throws XMLStreamException
    {
        if (mFullyValidating) {
            return new DTDValidator(this, ctxt, mHasNsDefaults,
                                    getElementMap(), getGeneralEntityMap());
        }
        return new DTDTypingNonValidator(this, ctxt, mHasNsDefaults,
                                         getElementMap(), getGeneralEntityMap());
    }
    /*
    //////////////////////////////////////////////////////
    // DTDValidationSchema implementation
    //////////////////////////////////////////////////////
     */
    @Override
    public int getEntityCount() {
        return (mGeneralEntities == null) ? 0 : mGeneralEntities.size();
    }
    @Override
    public int getNotationCount() {
        return (mNotations == null) ? 0 : mNotations.size();
    }
    /*
    //////////////////////////////////////////////////////
    // Woodstox-specific public API
    //////////////////////////////////////////////////////
     */
    @Override
    public boolean isCachable() {
        return mIsCachable;
    }
    
    @Override
    public HashMap getGeneralEntityMap() {
        return mGeneralEntities;
    }
    @Override
    public List getGeneralEntityList()
    {
        List l = mGeneralEntityList;
        if (l == null) {
            if (mGeneralEntities == null || mGeneralEntities.size() == 0) {
                l = Collections.emptyList();
            } else {
                l = Collections.unmodifiableList(new ArrayList(mGeneralEntities.values()));
            }
            mGeneralEntityList = l;
        }
        return l;
    }
    @Override
    public HashMap getParameterEntityMap() {
        return mDefinedPEs;
    }
    @Override
    public HashMap getNotationMap() {
        return mNotations;
    }
    @Override
    public synchronized List getNotationList()
    {
        List l = mNotationList;
        if (l == null) {
            if (mNotations == null || mNotations.size() == 0) {
                l = Collections.emptyList();
            } else {
                l = Collections.unmodifiableList(new ArrayList(mNotations.values()));
            }
            mNotationList = l;
        }
        return l;
    }
    @Override
    public HashMap getElementMap() {
        return mElements;
    }
    /**
     * Method used in determining whether cached external subset instance
     * can be used with specified internal subset. If ext. subset references
     * any parameter/general entities int subset (re-)defines, it can not;
     * otherwise it can be used.
     *
     * @return True if this (external) subset refers to a parameter entity
     *    defined in passed-in internal subset.
     */
    @Override
    public boolean isReusableWith(DTDSubset intSubset)
    {
        Set refdPEs = mRefdPEs;
        if (refdPEs != null && refdPEs.size() > 0) {
            HashMap intPEs = intSubset.getParameterEntityMap();
            if (intPEs != null && intPEs.size() > 0) {
                if (DataUtil.anyValuesInCommon(refdPEs, intPEs.keySet())) {
                    return false;
                }
            }
        }
        Set refdGEs = mRefdGEs;
        if (refdGEs != null && refdGEs.size() > 0) {
            HashMap intGEs = intSubset.getGeneralEntityMap();
            if (intGEs != null && intGEs.size() > 0) {
                if (DataUtil.anyValuesInCommon(refdGEs, intGEs.keySet())) {
                    return false;
                }
            }
        }
        return true; // yep, no dependencies overridden
    }
    /*
    //////////////////////////////////////////////////////
    // Overridden default methods:
    //////////////////////////////////////////////////////
     */
    @Override
    public String toString() {
        StringBuilder sb = new StringBuilder();
        sb.append("[DTDSubset: ");
        int count = getEntityCount();
        sb.append(count);
        sb.append(" general entities");
        sb.append(']');
        return sb.toString();
    }
    /*
    //////////////////////////////////////////////////////
    // Convenience methods used by other classes
    //////////////////////////////////////////////////////
     */
   public static void throwNotationException(NotationDeclaration oldDecl, NotationDeclaration newDecl)
        throws XMLStreamException
    {
        throw new WstxParsingException
            (MessageFormat.format(ErrorConsts.ERR_DTD_NOTATION_REDEFD,
                                  new Object[] {
                                  newDecl.getName(),
                                  oldDecl.getLocation().toString()}),
             newDecl.getLocation());
    }
   public static void throwElementException(DTDElement oldElem, Location loc)
        throws XMLStreamException
    {
        throw new WstxParsingException
            (MessageFormat.format(ErrorConsts.ERR_DTD_ELEM_REDEFD,
                                  new Object[] {
                                  oldElem.getDisplayName(),
                                  oldElem.getLocation().toString() }),
             loc);
    }
    /*
    //////////////////////////////////////////////////////
    // Internal methods
    //////////////////////////////////////////////////////
     */
    /**
     *
     * Note: The first Map argument WILL be modified; second one
     * not. Caller needs to ensure this is acceptable.
     */
    private static  void combineMaps(Map m1, Map m2)
    {
    	for (Map.Entry me : m2.entrySet()) {
            K key = me.getKey();
            /* Int. subset has precedence, but let's guess most of
             * the time there are no collisions:
             */
            V old = m1.put(key, me.getValue());
            // Oops, got value! Let's put it back
            if (old != null) {
                m1.put(key, old);
            }
        }
    }
    /**
     * Method that will try to merge in elements defined in the external
     * subset, into internal subset; it will also check for redeclarations
     * when doing this, as it's invalid to redeclare elements. Care has to
     * be taken to only check actual redeclarations: placeholders should
     * not cause problems.
     */
    private void combineElements(InputProblemReporter rep, HashMap intElems, HashMap extElems)
        throws XMLStreamException
    {
    	for (Map.Entry me : extElems.entrySet()) {
            PrefixedName key = me.getKey();
            DTDElement extElem = me.getValue();
            DTDElement intElem = intElems.get(key);
            // If there was no old value, can just merge new one in and continue
            if (intElem == null) {
                intElems.put(key, extElem);
                continue;
            }
            // Which one is defined (if either)?
            if (extElem.isDefined()) { // one from the ext subset
                if (intElem.isDefined()) { // but both can't be; that's an error
                    throwElementException(intElem, extElem.getLocation());
                } else {
                    /* Note: can/should not modify the external element (by
                     * for example adding attributes); external element may
                     * be cached and shared... so, need to do the reverse,
                     * define the one from internal subset.
                     */
                    intElem.defineFrom(rep, extElem, mFullyValidating);
                }
            } else {
                if (!intElem.isDefined()) {
                    /* ??? Should we warn about neither of them being really
                     *   declared?
                     */
                    rep.reportProblem(intElem.getLocation(),
                                      ErrorConsts.WT_ENT_DECL,
                                      ErrorConsts.W_UNDEFINED_ELEM,
                                      extElem.getDisplayName(), null);
                                      
                } else {
                    intElem.mergeMissingAttributesFrom(rep, extElem, mFullyValidating);
                }
            }
        }
    }
    private static void checkNotations(HashMap fromInt, HashMap fromExt)
        throws XMLStreamException
    {
        /* Since it's external subset that would try to redefine things
         * defined in internal subset, let's traverse definitions in
         * the ext. subset first (even though that may not be the fastest
         * way), so that we have a chance of catching the first problem
         * (As long as Maps iterate in insertion order).
         */
    	for (Map.Entry en : fromExt.entrySet()) {
            if (fromInt.containsKey(en.getKey())) {
                throwNotationException(fromInt.get(en.getKey()), en.getValue());
            }
        }
    }
}