All Downloads are FREE. Search and download functionalities are using the official Maven repository.

net.sf.saxon.trans.KeyIndex Maven / Gradle / Ivy

There is a newer version: 12.5
Show newest version
////////////////////////////////////////////////////////////////////////////////////////////////////////////////////
// Copyright (c) 2013 Saxonica Limited.
// This Source Code Form is subject to the terms of the Mozilla Public License, v. 2.0.
// If a copy of the MPL was not distributed with this file, You can obtain one at http://mozilla.org/MPL/2.0/.
// This Source Code Form is “Incompatible With Secondary Licenses”, as defined by the Mozilla Public License, v. 2.0.
////////////////////////////////////////////////////////////////////////////////////////////////////////////////////

package net.sf.saxon.trans;

import net.sf.saxon.expr.Expression;
import net.sf.saxon.expr.XPathContext;
import net.sf.saxon.expr.XPathContextMajor;
import net.sf.saxon.expr.instruct.SlotManager;
import net.sf.saxon.expr.sort.AtomicMatchKey;
import net.sf.saxon.expr.sort.CodepointMatchKey;
import net.sf.saxon.expr.sort.LocalOrderComparer;
import net.sf.saxon.lib.ConversionRules;
import net.sf.saxon.lib.StringCollator;
import net.sf.saxon.om.*;
import net.sf.saxon.pattern.Pattern;
import net.sf.saxon.tree.iter.ManualIterator;
import net.sf.saxon.type.BuiltInAtomicType;
import net.sf.saxon.type.StringConverter;
import net.sf.saxon.type.UType;
import net.sf.saxon.value.AtomicValue;
import net.sf.saxon.value.UntypedAtomicValue;

import java.util.*;

/**
 * A key index is an index maintained to support xsl:key key definitions, including both user-defined
 * keys and keys added by the optimizer. Each key index supports one key definition (a set of xsl:key
 * declarations with the same name) applied to one document tree.
 *
 * The index can support a mixture of atomic keys of different types; there is no error caused by comparing
 * values of different types. This relies on the fact that XPathComparable values are identical for comparable
 * values (e.g. integers and doubles), and distinct otherwise.
 *
 * With the XSLT xsl:key construct, untypedAtomic values are treated as strings. However, this structure is
 * also used to support internally-generated keys with general comparison semantics, where untyped values
 * are converted to the type of the other operand. To enable this to work, we maintain a list of all
 * untypedAtomic keys present in the index; and if a search is made for some type like xs:date, we then go
 * through this list converting each untypedAtomic value to a date and indexing it as such. In principle this
 * can happen for an arbitrary number of data types, though it is unlikely in practice because not many
 * types have overlapping lexical spaces.
 */
public class KeyIndex {

    private Map > index;
    private UType keyTypesPresent = UType.VOID;
    private UType keyTypesConvertedFromUntyped = UType.STRING_LIKE;
    private List  untypedKeys;
    private ConversionRules rules;
    private int implicitTimezone;
    private StringCollator collation;

    public KeyIndex(boolean isRangeKey) {
        index = isRangeKey ?
                        new TreeMap>() :
                        new HashMap>(100);
    }

    /**
     * Get the underlying map
     * @return the underlying map
     */

    public Map > getUnderlyingMap() {
        return index;
    }

    /**
     * Build the index for a particular document for a named key
     *
     *
     * @param keySet         The set of key definitions with this name
     * @param doc            The source document in question
     * @param context        The dynamic context
     * @throws XPathException if a dynamic error is encountered
     */


    public void buildIndex(KeyDefinitionSet keySet,
                           TreeInfo doc,
                           XPathContext context) throws XPathException {

        List definitions = keySet.getKeyDefinitions();

        // There may be multiple xsl:key definitions with the same name. Index them all.
        for (int k = 0; k < definitions.size(); k++) {
            constructIndex(doc, definitions.get(k), context, k == 0);
        }
        this.rules = context.getConfiguration().getConversionRules();
        this.implicitTimezone = context.getImplicitTimezone();
        this.collation = definitions.get(0).getCollation();
    }

    /**
     * Process one key definition to add entries to the index
     *
     *
     * @param doc            the document to be indexed
     * @param keydef         the key definition used to build the index
     * @param context        the XPath dynamic evaluation context
     * @param isFirst        true if this is the first index to be built for this key
     * @throws XPathException if a dynamic error is encountered
     */

    private void constructIndex(TreeInfo doc,
                                KeyDefinition keydef,
                                XPathContext context,
                                boolean isFirst) throws XPathException {
        //System.err.println("build index for doc " + doc.getDocumentNumber());
        Pattern match = keydef.getMatch();

        //NodeInfo curr;
        XPathContextMajor xc = context.newContext();
        xc.setOrigin(keydef);
        xc.setCurrentComponent(keydef.getDeclaringComponent());
        xc.setTemporaryOutputState(StandardNames.XSL_KEY);

        // The use expression (or sequence constructor) may contain local variables.
        SlotManager map = keydef.getStackFrameMap();
        if (map != null) {
            xc.openStackFrame(map);
        }

        SequenceIterator iter = match.selectNodes(doc, xc);
        Item node;
        while ((node = iter.next()) != null) {
            processNode((NodeInfo) node, keydef, xc, isFirst);
        }
    }

    /**
     * Process one matching node, adding entries to the index if appropriate
     *
     *
     * @param node           the node being processed
     * @param keydef         the key definition
     * @param xc             the context for evaluating expressions
     * @param isFirst        indicates whether this is the first key definition with a given key name (which means
     *                       no sort of the resulting key entries is required)
     * @throws XPathException if a dynamic error is encountered
     */

    private void processNode(NodeInfo node,
                             KeyDefinition keydef,
                             XPathContext xc,
                             boolean isFirst) throws XPathException {


        // Make the node we are testing the context node,
        // with context position and context size set to 1

        ManualIterator si = new ManualIterator(node);
        xc.setCurrentIterator(si);

        StringCollator collation = keydef.getCollation();
        int implicitTimezone = xc.getImplicitTimezone();

        // Evaluate the "use" expression against this context node

        Expression use = keydef.getUse();
        SequenceIterator useval = use.iterate(xc);
        if (keydef.isComposite()) {
            List amks = new ArrayList(4);
            AtomicValue keyVal;
            while ((keyVal = (AtomicValue) useval.next()) != null) {
                amks.add(getCollationKey(keyVal, collation, implicitTimezone));
            }
            addEntry(new CompositeAtomicMatchKey(amks), node, isFirst);
        } else {
            AtomicValue keyVal;
            while ((keyVal = (AtomicValue) useval.next()) != null) {
                if (keyVal.isNaN()) {
                    continue;
                }
                UType actualUType = keyVal.getUType();
                if (!keyTypesPresent.subsumes(actualUType)) {
                    keyTypesPresent = keyTypesPresent.union(actualUType);
                }
                AtomicMatchKey amk = getCollationKey(keyVal, collation, implicitTimezone);
                if (actualUType.equals(UType.UNTYPED_ATOMIC) && keydef.isConvertUntypedToOther()) {
                    if (untypedKeys == null) {
                        untypedKeys = new ArrayList(20);
                    }
                    untypedKeys.add((UntypedAtomicValue)keyVal);
                }
                addEntry(amk, node, isFirst);
            }
        }

    }

    private void addEntry(AtomicMatchKey val, NodeInfo curr, boolean isFirst) {
        List nodes = index.get(val);
        if (nodes == null) {
            // this is the first node with this key value
            nodes = new ArrayList(4);
            index.put(val, nodes);
            nodes.add(curr);
        } else {
            // this is not the first node with this key value.
            // add the node to the list of nodes for this key,
            // unless it's already there
            if (isFirst) {
                // if this is the first index definition that we're processing,
                // then this node must be after all existing nodes in document
                // order, or the same node as the last existing node
                if (nodes.get(nodes.size() - 1) != curr) {
                    nodes.add(curr);
                }
            } else {
                // otherwise, we need to insert the node at the correct
                // position in document order. This code does an insertion sort:
                // not ideal for performance, but it's very unusual to have more than
                // one key definition for a key. We start looking at the end because
                // it's most likely that the new node will come after all the others.
                // See bug 2092 in saxonica.plan.io
                LocalOrderComparer comparer = LocalOrderComparer.getInstance();
                boolean found = false;
                for (int i=nodes.size()-1; i>=0; i--) {
                    int d = comparer.compare(curr, nodes.get(i));
                    if (d>=0) {
                        if (d==0) {
                            // node already in list; do nothing
                        } else {
                            // add the node at this position
                            nodes.add(i+1, curr);
                        }
                        found = true;
                        break;
                    }
                    // else continue round the loop
                }
                // if we're still here, add the new node at the start
                if (!found) {
                    nodes.add(0, curr);
                }
            }
        }
    }

    /**
     * Re-index untyped atomic values after conversion to a specific type. This
     * happens when the "convertUntypedToOther" option is set (typically because this
     * index is used to support a general comparison), and the sought value is of a type
     * other that string or untyped atomic. We go through the index finding all untyped
     * atomic values, converting each one to the sought type, and adding it to the index under
     * this type.
     * @param type the type to which untyped atomic values should be converted
     * @throws XPathException if conversion of any untyped atomic value to the requested key type fails
     */

    public void reindexUntypedValues(BuiltInAtomicType type) throws XPathException {
        UType uType = type.getUType();
        if (UType.STRING_LIKE.subsumes(uType)) {
            return;
        }
        if (UType.NUMERIC.subsumes(uType)) {
            type = BuiltInAtomicType.DOUBLE;
            uType = UType.DOUBLE;
        }
        StringConverter converter = type.getStringConverter(rules);
        for (UntypedAtomicValue v : untypedKeys) {
            AtomicMatchKey uk = getCollationKey(v, collation, implicitTimezone);
            List nodes = index.get(uk);
            AtomicValue convertedValue = converter.convertString(v.getStringValueCS()).asAtomic();
            AtomicMatchKey amk = getCollationKey(convertedValue, collation, implicitTimezone);
            for (NodeInfo node : nodes) {
                addEntry(amk, node, false);
            }
        }

    }

    /**
     * Ask whether the index is empty
     * @return true if the index is empty
     */

    public boolean isEmpty() {
        return index.isEmpty();
    }

    /**
     * Get the nodes with a given key value
     *
     * @param soughtValue The required key value
     * @return a list of the selected nodes, always in document order with no duplicates, or null
     * to represent an empty list
     * @throws XPathException if a dynamic error is encountered
     */

    public List get(AtomicValue soughtValue) throws XPathException {
        if (untypedKeys != null && !keyTypesConvertedFromUntyped.subsumes(soughtValue.getUType())) {
            reindexUntypedValues(soughtValue.getPrimitiveType());
        }
        return index.get(getCollationKey(soughtValue, collation, implicitTimezone));
    }

    /**
     * Get the nodes with a given composite key value
     *
     * @param soughtValue The required composite key value
     * @return a list of the selected nodes, always in document order with no duplicates, or null
     * to represent an empty list
     * @throws XPathException if a dynamic error is encountered
     */

    public List getComposite(SequenceIterator soughtValue) throws XPathException {
        List amks = new ArrayList(4);
        AtomicValue keyVal;
        while ((keyVal = (AtomicValue) soughtValue.next()) != null) {
            amks.add(getCollationKey(keyVal, collation, implicitTimezone));
        }
        return index.get(new CompositeAtomicMatchKey(amks));
    }

    private static AtomicMatchKey getCollationKey(AtomicValue value, StringCollator collation, int implicitTimezone)
            throws XPathException {
        if (UType.STRING_LIKE.subsumes(value.getUType())) {
            if (collation == null) {
                return new CodepointMatchKey(value.getStringValue());
            } else {
                return collation.getCollationKey(value.getStringValue());
            }
        } else {
            return value.getXPathComparable(false, collation, implicitTimezone);
        }
    }

    private class CompositeAtomicMatchKey implements AtomicMatchKey {

        private List keys;

        public CompositeAtomicMatchKey(List keys) {
            this.keys = keys;
        }

        /**
         * Get an atomic value that encapsulates this match key. Needed to support the collation-key() function.
         *
         * @return an atomic value that encapsulates this match key
         */
        public AtomicValue asAtomic() {
            throw new UnsupportedOperationException();
        }

        @Override
        public boolean equals(Object obj) {
            if (obj instanceof CompositeAtomicMatchKey &&
                    ((CompositeAtomicMatchKey)obj).keys.size() == keys.size()) {
                List keys2 = ((CompositeAtomicMatchKey)obj).keys;
                for (int i=0; i




© 2015 - 2025 Weber Informatics LLC | Privacy Policy