All downloads are free. The search and download features use the official Maven repository.

org.apache.phoenix.compile.JoinCompiler Maven / Gradle / Ivy

There is a newer version: 5.1.0-HBase-2.0.0.2
Show newest version
/*
 * Licensed to the Apache Software Foundation (ASF) under one
 * or more contributor license agreements.  See the NOTICE file
 * distributed with this work for additional information
 * regarding copyright ownership.  The ASF licenses this file
 * to you under the Apache License, Version 2.0 (the
 * "License"); you may not use this file except in compliance
 * with the License.  You may obtain a copy of the License at
 *
 * http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */
package org.apache.phoenix.compile;

import static org.apache.phoenix.schema.PTable.QualifierEncodingScheme.NON_ENCODED_QUALIFIERS;
import static org.apache.phoenix.schema.PTable.ImmutableStorageScheme.ONE_CELL_PER_COLUMN;

import java.sql.SQLException;
import java.util.ArrayList;
import java.util.Collections;
import java.util.Comparator;
import java.util.HashMap;
import java.util.HashSet;
import java.util.Iterator;
import java.util.List;
import java.util.ListIterator;
import java.util.Map;
import java.util.Set;

import org.apache.hadoop.hbase.client.Scan;
import org.apache.hadoop.hbase.util.Pair;
import org.apache.phoenix.exception.SQLExceptionCode;
import org.apache.phoenix.exception.SQLExceptionInfo;
import org.apache.phoenix.expression.AndExpression;
import org.apache.phoenix.expression.CoerceExpression;
import org.apache.phoenix.expression.Expression;
import org.apache.phoenix.expression.LiteralExpression;
import org.apache.phoenix.expression.function.CountAggregateFunction;
import org.apache.phoenix.jdbc.PhoenixConnection;
import org.apache.phoenix.jdbc.PhoenixStatement;
import org.apache.phoenix.parse.AliasedNode;
import org.apache.phoenix.parse.AndParseNode;
import org.apache.phoenix.parse.BindTableNode;
import org.apache.phoenix.parse.BooleanParseNodeVisitor;
import org.apache.phoenix.parse.ColumnDef;
import org.apache.phoenix.parse.ColumnParseNode;
import org.apache.phoenix.parse.ComparisonParseNode;
import org.apache.phoenix.parse.ConcreteTableNode;
import org.apache.phoenix.parse.DerivedTableNode;
import org.apache.phoenix.parse.EqualParseNode;
import org.apache.phoenix.parse.HintNode;
import org.apache.phoenix.parse.HintNode.Hint;
import org.apache.phoenix.parse.IndexExpressionParseNodeRewriter;
import org.apache.phoenix.parse.JoinTableNode;
import org.apache.phoenix.parse.JoinTableNode.JoinType;
import org.apache.phoenix.parse.NamedTableNode;
import org.apache.phoenix.parse.OrderByNode;
import org.apache.phoenix.parse.ParseNode;
import org.apache.phoenix.parse.ParseNodeFactory;
import org.apache.phoenix.parse.ParseNodeRewriter;
import org.apache.phoenix.parse.SelectStatement;
import org.apache.phoenix.parse.StatelessTraverseAllParseNodeVisitor;
import org.apache.phoenix.parse.TableName;
import org.apache.phoenix.parse.TableNode;
import org.apache.phoenix.parse.TableNodeVisitor;
import org.apache.phoenix.parse.TableWildcardParseNode;
import org.apache.phoenix.parse.UDFParseNode;
import org.apache.phoenix.parse.WildcardParseNode;
import org.apache.phoenix.schema.ColumnNotFoundException;
import org.apache.phoenix.schema.ColumnRef;
import org.apache.phoenix.schema.LocalIndexDataColumnRef;
import org.apache.phoenix.schema.MetaDataEntityNotFoundException;
import org.apache.phoenix.schema.PColumn;
import org.apache.phoenix.schema.PName;
import org.apache.phoenix.schema.PNameFactory;
import org.apache.phoenix.schema.PTable;
import org.apache.phoenix.schema.PTable.IndexType;
import org.apache.phoenix.schema.PTable.QualifierEncodingScheme;
import org.apache.phoenix.schema.PTable.ImmutableStorageScheme;
import org.apache.phoenix.schema.PTableImpl;
import org.apache.phoenix.schema.PTableType;
import org.apache.phoenix.schema.ProjectedColumn;
import org.apache.phoenix.schema.SortOrder;
import org.apache.phoenix.schema.TableRef;
import org.apache.phoenix.schema.types.PBoolean;
import org.apache.phoenix.schema.types.PDataType;
import org.apache.phoenix.schema.types.PDate;
import org.apache.phoenix.schema.types.PDecimal;
import org.apache.phoenix.schema.types.PDouble;
import org.apache.phoenix.schema.types.PInteger;
import org.apache.phoenix.schema.types.PLong;
import org.apache.phoenix.schema.types.PSmallint;
import org.apache.phoenix.schema.types.PTimestamp;
import org.apache.phoenix.schema.types.PTinyint;
import org.apache.phoenix.schema.types.PVarbinary;
import org.apache.phoenix.schema.types.PVarchar;
import org.apache.phoenix.util.EncodedColumnsUtil;
import org.apache.phoenix.util.IndexUtil;
import org.apache.phoenix.util.SchemaUtil;

import com.google.common.base.Preconditions;
import com.google.common.collect.Lists;
import com.google.common.collect.Sets;


public class JoinCompiler {

    /**
     * Classifies how a column is referenced by the statement being compiled.
     * The classification is assigned in {@code compile}: every column seen by the
     * general visitor is {@link #GENERAL}; a column seen only by the join-local
     * visitor is {@link #JOINLOCAL}.
     */
    public enum ColumnRefType {

        /**
         * Referenced only on the joined-table side of a join ON condition
         * (and not by anything that was classified as {@link #GENERAL}).
         */
        JOINLOCAL,

        /**
         * Referenced from the select list, GROUP BY, HAVING, ORDER BY, post filters,
         * or the left-hand side of a join ON condition.
         */
        GENERAL
    }

    /** Statement being compiled; the nested visitors obtain their connection from it. */
    private final PhoenixStatement statement;
    /** The SELECT whose FROM clause is turned into a join tree. */
    private final SelectStatement select;
    /** Resolver passed to {@code compile}; used to resolve table and column references. */
    private final ColumnResolver origResolver;
    /** {@code false} only when the SELECT carries the {@code NO_STAR_JOIN} hint. */
    private final boolean useStarJoin;
    /**
     * Every column referenced by the statement, mapped to how it is referenced.
     * Populated at the end of {@code compile}; the type arguments are required by
     * the typed {@code keySet()} / {@code entrySet()} loops that read this map.
     */
    private final Map<ColumnRef, ColumnRefType> columnRefs;


    /**
     * Creates a compiler bound to a single statement. The constructor is private;
     * within this file it is invoked from the static {@code compile} entry point.
     *
     * @param statement the statement being compiled
     * @param select    the SELECT to analyse; its hint decides whether star join is used
     * @param resolver  resolver used for all table and column lookups
     */
    private JoinCompiler(PhoenixStatement statement, SelectStatement select, ColumnResolver resolver) {
        this.statement = statement;
        this.select = select;
        this.origResolver = resolver;
        // Star join is the default; only an explicit NO_STAR_JOIN hint disables it.
        this.useStarJoin = !select.getHint().hasHint(Hint.NO_STAR_JOIN);
        // Typed instantiation instead of a raw HashMap.
        this.columnRefs = new HashMap<ColumnRef, ColumnRefType>();
    }

    /**
     * Builds the {@link JoinTable} for a SELECT statement and records which columns
     * the statement references.
     *
     * <p>Steps, in order:
     * <ol>
     *   <li>Visit the FROM clause with a {@link JoinTableConstructor} to obtain the
     *       leading table and, if any, the list of join specs.</li>
     *   <li>Hand the WHERE clause (when present) to the join table via
     *       {@code addFilter}.</li>
     *   <li>Collect column references: filters and ON conditions through
     *       {@code pushDownColumnRefVisitors}, then the select list, GROUP BY,
     *       HAVING and ORDER BY through the general visitor.</li>
     *   <li>Store the collected references in the compiler's column map; a column
     *       seen by the general visitor is {@code GENERAL}, one seen only by the
     *       join-local visitor is {@code JOINLOCAL}. References gathered by the
     *       prefilter visitor are not stored.</li>
     * </ol>
     *
     * @param statement the statement being compiled
     * @param select    the SELECT to compile
     * @param resolver  resolver for table and column references
     * @return the join table describing the FROM clause
     * @throws SQLException if visiting any parse node fails
     */
    public static JoinTable compile(PhoenixStatement statement, SelectStatement select, ColumnResolver resolver) throws SQLException {
        JoinCompiler compiler = new JoinCompiler(statement, select, resolver);
        JoinTableConstructor constructor = compiler.new JoinTableConstructor();
        Pair<Table, List<JoinSpec>> res = select.getFrom().accept(constructor);
        // A null second element means the FROM clause is a single table with no joins.
        JoinTable joinTable = res.getSecond() == null
                ? compiler.new JoinTable(res.getFirst())
                : compiler.new JoinTable(res.getFirst(), res.getSecond());
        if (select.getWhere() != null) {
            joinTable.addFilter(select.getWhere());
        }

        ColumnRefParseNodeVisitor generalRefVisitor = new ColumnRefParseNodeVisitor(resolver, statement.getConnection());
        ColumnRefParseNodeVisitor joinLocalRefVisitor = new ColumnRefParseNodeVisitor(resolver, statement.getConnection());
        ColumnRefParseNodeVisitor prefilterRefVisitor = new ColumnRefParseNodeVisitor(resolver, statement.getConnection());

        joinTable.pushDownColumnRefVisitors(generalRefVisitor, joinLocalRefVisitor, prefilterRefVisitor);

        for (AliasedNode node : select.getSelect()) {
            node.getNode().accept(generalRefVisitor);
        }
        if (select.getGroupBy() != null) {
            for (ParseNode node : select.getGroupBy()) {
                node.accept(generalRefVisitor);
            }
        }
        if (select.getHaving() != null) {
            select.getHaving().accept(generalRefVisitor);
        }
        if (select.getOrderBy() != null) {
            for (OrderByNode node : select.getOrderBy()) {
                node.getNode().accept(generalRefVisitor);
            }
        }

        for (ColumnRef ref : generalRefVisitor.getColumnRefMap().keySet()) {
            compiler.columnRefs.put(ref, ColumnRefType.GENERAL);
        }
        // GENERAL wins: a join-local reference is recorded only if the column is not already present.
        for (ColumnRef ref : joinLocalRefVisitor.getColumnRefMap().keySet()) {
            if (!compiler.columnRefs.containsKey(ref)) {
                compiler.columnRefs.put(ref, ColumnRefType.JOINLOCAL);
            }
        }

        return joinTable;
    }

    private class JoinTableConstructor implements TableNodeVisitor>> {

        private TableRef resolveTable(String alias, TableName name) throws SQLException {
            if (alias != null)
                return origResolver.resolveTable(null, alias);

            return origResolver.resolveTable(name.getSchemaName(), name.getTableName());
        }

        @Override
        public Pair> visit(BindTableNode boundTableNode) throws SQLException {
            TableRef tableRef = resolveTable(boundTableNode.getAlias(), boundTableNode.getName());
            List selectNodes = extractFromSelect(select.getSelect(), tableRef, origResolver);
            Table table = new Table(boundTableNode, Collections.emptyList(), boundTableNode.getTableSamplingRate(), selectNodes, tableRef);
            return new Pair>(table, null);
        }

        @Override
        public Pair> visit(JoinTableNode joinNode) throws SQLException {
            Pair> lhs = joinNode.getLHS().accept(this);
            Pair> rhs = joinNode.getRHS().accept(this);
            JoinTable joinTable = rhs.getSecond() == null ? new JoinTable(rhs.getFirst()) : new JoinTable(rhs.getFirst(), rhs.getSecond());
            List joinSpecs = lhs.getSecond();
            if (joinSpecs == null) {
                joinSpecs = new ArrayList();
            }
            joinSpecs.add(new JoinSpec(joinNode.getType(), joinNode.getOnNode(), joinTable, joinNode.isSingleValueOnly(), origResolver));

            return new Pair>(lhs.getFirst(), joinSpecs);
        }

        @Override
        public Pair> visit(NamedTableNode namedTableNode)
                throws SQLException {
            TableRef tableRef = resolveTable(namedTableNode.getAlias(), namedTableNode.getName());
            List selectNodes = extractFromSelect(select.getSelect(), tableRef, origResolver);
            Table table = new Table(namedTableNode, namedTableNode.getDynamicColumns(), namedTableNode.getTableSamplingRate(), selectNodes, tableRef);
            return new Pair>(table, null);
        }

        @Override
        public Pair> visit(DerivedTableNode subselectNode)
                throws SQLException {
            TableRef tableRef = resolveTable(subselectNode.getAlias(), null);
            List selectNodes = extractFromSelect(select.getSelect(), tableRef, origResolver);
            Table table = new Table(subselectNode, selectNodes, tableRef);
            return new Pair>(table, null);
        }
    }

    public class JoinTable {
        private final Table table;
        private final List joinSpecs;
        private final List postFilters;
        private final List tables;
        private final List tableRefs;
        private final boolean allLeftJoin;
        private final boolean isPrefilterAccepted;
        private final List prefilterAcceptedTables;

        private JoinTable(Table table) {
            this.table = table;
            this.joinSpecs = Collections.emptyList();
            this.postFilters = Collections.emptyList();
            this.tables = Collections.
singletonList(table); this.tableRefs = Collections.singletonList(table.getTableRef()); this.allLeftJoin = false; this.isPrefilterAccepted = true; this.prefilterAcceptedTables = Collections.emptyList(); } private JoinTable(Table table, List joinSpecs) { this.table = table; this.joinSpecs = joinSpecs; this.postFilters = new ArrayList(); this.tables = new ArrayList
(); this.tableRefs = new ArrayList(); this.tables.add(table); boolean allLeftJoin = true; int lastRightJoinIndex = -1; boolean hasFullJoin = false; for (int i = 0; i < joinSpecs.size(); i++) { JoinSpec joinSpec = joinSpecs.get(i); this.tables.addAll(joinSpec.getJoinTable().getTables()); allLeftJoin = allLeftJoin && joinSpec.getType() == JoinType.Left; hasFullJoin = hasFullJoin || joinSpec.getType() == JoinType.Full; if (joinSpec.getType() == JoinType.Right) { lastRightJoinIndex = i; } } for (Table t : this.tables) { this.tableRefs.add(t.getTableRef()); } this.allLeftJoin = allLeftJoin; this.isPrefilterAccepted = !hasFullJoin && lastRightJoinIndex == -1; this.prefilterAcceptedTables = new ArrayList(); for (int i = lastRightJoinIndex == -1 ? 0 : lastRightJoinIndex; i < joinSpecs.size(); i++) { JoinSpec joinSpec = joinSpecs.get(i); if (joinSpec.getType() != JoinType.Left && joinSpec.getType() != JoinType.Anti && joinSpec.getType() != JoinType.Full) { prefilterAcceptedTables.add(joinSpec); } } } public Table getTable() { return table; } public List getJoinSpecs() { return joinSpecs; } public List
getTables() { return tables; } public List getTableRefs() { return tableRefs; } public boolean isAllLeftJoin() { return allLeftJoin; } public SelectStatement getStatement() { return select; } public ColumnResolver getOriginalResolver() { return origResolver; } public Map getColumnRefs() { return columnRefs; } public ParseNode getPostFiltersCombined() { return combine(postFilters); } public void addFilter(ParseNode filter) throws SQLException { if (joinSpecs.isEmpty()) { table.addFilter(filter); return; } WhereNodeVisitor visitor = new WhereNodeVisitor(origResolver, table, postFilters, Collections.singletonList(table.getTableRef()), isPrefilterAccepted, prefilterAcceptedTables, statement.getConnection()); filter.accept(visitor); } public void pushDownColumnRefVisitors(ColumnRefParseNodeVisitor generalRefVisitor, ColumnRefParseNodeVisitor joinLocalRefVisitor, ColumnRefParseNodeVisitor prefilterRefVisitor) throws SQLException { for (ParseNode node : table.getPreFilters()) { node.accept(prefilterRefVisitor); } for (ParseNode node : table.getPostFilters()) { node.accept(generalRefVisitor); } for (ParseNode node : postFilters) { node.accept(generalRefVisitor); } for (JoinSpec joinSpec : joinSpecs) { JoinTable joinTable = joinSpec.getJoinTable(); boolean hasSubJoin = !joinTable.getJoinSpecs().isEmpty(); for (EqualParseNode node : joinSpec.getOnConditions()) { node.getLHS().accept(generalRefVisitor); if (hasSubJoin) { node.getRHS().accept(generalRefVisitor); } else { node.getRHS().accept(joinLocalRefVisitor); } } joinTable.pushDownColumnRefVisitors(generalRefVisitor, joinLocalRefVisitor, prefilterRefVisitor); } } public Expression compilePostFilterExpression(StatementContext context, Table table) throws SQLException { List filtersCombined = Lists. 
newArrayList(postFilters); if (table != null) { filtersCombined.addAll(table.getPostFilters()); } return JoinCompiler.compilePostFilterExpression(context, filtersCombined); } /** * Returns a boolean vector indicating whether the evaluation of join expressions * can be evaluated at an early stage if the input JoinSpec can be taken as a * star join. Otherwise returns null. * @return a boolean vector for a star join; or null for non star join. */ public boolean[] getStarJoinVector() { int count = joinSpecs.size(); if (!table.isFlat() || (!useStarJoin && count > 1 && joinSpecs.get(count - 1).getType() != JoinType.Left && joinSpecs.get(count - 1).getType() != JoinType.Semi && joinSpecs.get(count - 1).getType() != JoinType.Anti && !joinSpecs.get(count - 1).isSingleValueOnly())) return null; boolean[] vector = new boolean[count]; for (int i = 0; i < count; i++) { JoinSpec joinSpec = joinSpecs.get(i); if (joinSpec.getType() != JoinType.Left && joinSpec.getType() != JoinType.Inner && joinSpec.getType() != JoinType.Semi && joinSpec.getType() != JoinType.Anti) return null; vector[i] = true; Iterator iter = joinSpec.getDependencies().iterator(); while (vector[i] == true && iter.hasNext()) { TableRef tableRef = iter.next(); if (!tableRef.equals(table.getTableRef())) { vector[i] = false; } } } return vector; } public JoinTable getSubJoinTableWithoutPostFilters() { return joinSpecs.size() > 1 ? 
new JoinTable(table, joinSpecs.subList(0, joinSpecs.size() - 1)) : new JoinTable(table); } public SelectStatement getAsSingleSubquery(SelectStatement query, boolean asSubquery) throws SQLException { assert (isFlat(query)); if (asSubquery) return query; return NODE_FACTORY.select(select, query.getFrom(), query.getWhere()); } public boolean hasPostReference() { for (Table table : tables) { if (table.isWildCardSelect()) { return true; } } for (Map.Entry e : columnRefs.entrySet()) { if (e.getValue() == ColumnRefType.GENERAL && tableRefs.contains(e.getKey().getTableRef())) { return true; } } return false; } public boolean hasFilters() { if (!postFilters.isEmpty()) return true; if (isPrefilterAccepted && table.hasFilters()) return true; for (JoinSpec joinSpec : prefilterAcceptedTables) { if (joinSpec.getJoinTable().hasFilters()) return true; } return false; } } public class JoinSpec { private final JoinType type; private final List onConditions; private final JoinTable joinTable; private final boolean singleValueOnly; private Set dependencies; private OnNodeVisitor onNodeVisitor; private JoinSpec(JoinType type, ParseNode onNode, JoinTable joinTable, boolean singleValueOnly, ColumnResolver resolver) throws SQLException { this.type = type; this.onConditions = new ArrayList(); this.joinTable = joinTable; this.singleValueOnly = singleValueOnly; this.dependencies = new HashSet(); this.onNodeVisitor = new OnNodeVisitor(resolver, onConditions, dependencies, joinTable, statement.getConnection()); if (onNode != null) { onNode.accept(this.onNodeVisitor); } } public void addOnCondition(ParseNode node) throws SQLException { node.accept(onNodeVisitor); } public JoinType getType() { return type; } public List getOnConditions() { return onConditions; } public JoinTable getJoinTable() { return joinTable; } public boolean isSingleValueOnly() { return singleValueOnly; } public Set getDependencies() { return dependencies; } public Pair, List> compileJoinConditions(StatementContext lhsCtx, 
StatementContext rhsCtx, boolean sortExpressions) throws SQLException { if (onConditions.isEmpty()) { return new Pair, List>( Collections. singletonList(LiteralExpression.newConstant(1)), Collections. singletonList(LiteralExpression.newConstant(1))); } List> compiled = Lists.> newArrayListWithExpectedSize(onConditions.size()); ExpressionCompiler lhsCompiler = new ExpressionCompiler(lhsCtx); ExpressionCompiler rhsCompiler = new ExpressionCompiler(rhsCtx); for (EqualParseNode condition : onConditions) { lhsCompiler.reset(); Expression left = condition.getLHS().accept(lhsCompiler); rhsCompiler.reset(); Expression right = condition.getRHS().accept(rhsCompiler); PDataType toType = getCommonType(left.getDataType(), right.getDataType()); if (left.getDataType() != toType || left.getSortOrder() == SortOrder.DESC) { left = CoerceExpression.create(left, toType, SortOrder.ASC, left.getMaxLength()); } if (right.getDataType() != toType || right.getSortOrder() == SortOrder.DESC) { right = CoerceExpression.create(right, toType, SortOrder.ASC, right.getMaxLength()); } compiled.add(new Pair(left, right)); } if (sortExpressions) { Collections.sort(compiled, new Comparator>() { @Override public int compare(Pair o1, Pair o2) { Expression e1 = o1.getFirst(); Expression e2 = o2.getFirst(); boolean isFixed1 = e1.getDataType().isFixedWidth(); boolean isFixed2 = e2.getDataType().isFixedWidth(); boolean isFixedNullable1 = e1.isNullable() &&isFixed1; boolean isFixedNullable2 = e2.isNullable() && isFixed2; if (isFixedNullable1 == isFixedNullable2) { if (isFixed1 == isFixed2) { return 0; } else if (isFixed1) { return -1; } else { return 1; } } else if (isFixedNullable1) { return 1; } else { return -1; } } }); } List lConditions = Lists. newArrayListWithExpectedSize(compiled.size()); List rConditions = Lists. 
newArrayListWithExpectedSize(compiled.size()); for (Pair pair : compiled) { lConditions.add(pair.getFirst()); rConditions.add(pair.getSecond()); } return new Pair, List>(lConditions, rConditions); } private PDataType getCommonType(PDataType lType, PDataType rType) throws SQLException { if (lType == rType) return lType; if (!lType.isComparableTo(rType)) throw new SQLExceptionInfo.Builder(SQLExceptionCode.TYPE_MISMATCH) .setMessage("On-clause LHS expression and RHS expression must be comparable. LHS type: " + lType + ", RHS type: " + rType) .build().buildException(); if ((lType == null || lType.isCoercibleTo(PTinyint.INSTANCE)) && (rType == null || rType.isCoercibleTo(PTinyint.INSTANCE))) { return lType == null ? rType : lType; // to preserve UNSIGNED type } if ((lType == null || lType.isCoercibleTo(PSmallint.INSTANCE)) && (rType == null || rType.isCoercibleTo(PSmallint.INSTANCE))) { return lType == null ? rType : lType; // to preserve UNSIGNED type } if ((lType == null || lType.isCoercibleTo(PInteger.INSTANCE)) && (rType == null || rType.isCoercibleTo(PInteger.INSTANCE))) { return lType == null ? rType : lType; // to preserve UNSIGNED type } if ((lType == null || lType.isCoercibleTo(PLong.INSTANCE)) && (rType == null || rType.isCoercibleTo(PLong.INSTANCE))) { return lType == null ? rType : lType; // to preserve UNSIGNED type } if ((lType == null || lType.isCoercibleTo(PDouble.INSTANCE)) && (rType == null || rType.isCoercibleTo(PDouble.INSTANCE))) { return lType == null ? rType : lType; // to preserve UNSIGNED type } if ((lType == null || lType.isCoercibleTo(PDecimal.INSTANCE)) && (rType == null || rType.isCoercibleTo(PDecimal.INSTANCE))) { return PDecimal.INSTANCE; } if ((lType == null || lType.isCoercibleTo(PDate.INSTANCE)) && (rType == null || rType.isCoercibleTo(PDate.INSTANCE))) { return lType == null ? 
rType : lType; } if ((lType == null || lType.isCoercibleTo(PTimestamp.INSTANCE)) && (rType == null || rType.isCoercibleTo(PTimestamp.INSTANCE))) { return lType == null ? rType : lType; } if ((lType == null || lType.isCoercibleTo(PVarchar.INSTANCE)) && (rType == null || rType.isCoercibleTo(PVarchar.INSTANCE))) { return PVarchar.INSTANCE; } if ((lType == null || lType.isCoercibleTo(PBoolean.INSTANCE)) && (rType == null || rType.isCoercibleTo(PBoolean.INSTANCE))) { return PBoolean.INSTANCE; } return PVarbinary.INSTANCE; } } public class Table { private final TableNode tableNode; private final List dynamicColumns; private final Double tableSamplingRate; private final SelectStatement subselect; private final TableRef tableRef; private final List selectNodes; // all basic nodes related to this table, no aggregation. private final List preFilters; private final List postFilters; private final boolean isPostFilterConvertible; private Table(TableNode tableNode, List dynamicColumns, Double tableSamplingRate, List selectNodes, TableRef tableRef) { this.tableNode = tableNode; this.dynamicColumns = dynamicColumns; this.tableSamplingRate=tableSamplingRate; this.subselect = null; this.tableRef = tableRef; this.selectNodes = selectNodes; this.preFilters = new ArrayList(); this.postFilters = Collections.emptyList(); this.isPostFilterConvertible = false; } private Table(DerivedTableNode tableNode, List selectNodes, TableRef tableRef) throws SQLException { this.tableNode = tableNode; this.dynamicColumns = Collections.emptyList(); this.tableSamplingRate=ConcreteTableNode.DEFAULT_TABLE_SAMPLING_RATE; this.subselect = SubselectRewriter.flatten(tableNode.getSelect(), statement.getConnection()); this.tableRef = tableRef; this.selectNodes = selectNodes; this.preFilters = new ArrayList(); this.postFilters = new ArrayList(); this.isPostFilterConvertible = SubselectRewriter.isPostFilterConvertible(subselect); } public TableNode getTableNode() { return tableNode; } public List 
getDynamicColumns() { return dynamicColumns; } public Double getTableSamplingRate() { return tableSamplingRate; } public boolean isSubselect() { return subselect != null; } public List getSelectNodes() { return selectNodes; } public List getPreFilters() { return preFilters; } public List getPostFilters() { return postFilters; } public TableRef getTableRef() { return tableRef; } public void addFilter(ParseNode filter) { if (!isSubselect() || isPostFilterConvertible) { preFilters.add(filter); } else { postFilters.add(filter); } } public ParseNode getPreFiltersCombined() { return combine(preFilters); } public Expression compilePostFilterExpression(StatementContext context) throws SQLException { return JoinCompiler.compilePostFilterExpression(context, postFilters); } public SelectStatement getAsSubquery(List orderBy) throws SQLException { if (isSubselect()) return SubselectRewriter.applyOrderBy( SubselectRewriter.applyPostFilters(subselect, preFilters, tableNode.getAlias()), orderBy, tableNode.getAlias(), tableNode); return NODE_FACTORY.select(tableNode, select.getHint(), false, selectNodes, getPreFiltersCombined(), null, null, orderBy, null, null, 0, false, select.hasSequence(), Collections. emptyList(), select.getUdfParseNodes()); } public boolean hasFilters() { return isSubselect() ? 
(!postFilters.isEmpty() || subselect.getWhere() != null || subselect.getHaving() != null) : !preFilters.isEmpty(); } public boolean isFlat() { return subselect == null || JoinCompiler.isFlat(subselect); } protected boolean isWildCardSelect() { return (selectNodes.size() == 1 && selectNodes.get(0).getNode() instanceof TableWildcardParseNode); } public void projectColumns(Scan scan) { assert(!isSubselect()); if (isWildCardSelect()) { scan.getFamilyMap().clear(); return; } for (ColumnRef columnRef : columnRefs.keySet()) { if (columnRef.getTableRef().equals(tableRef) && !SchemaUtil.isPKColumn(columnRef.getColumn()) && !(columnRef instanceof LocalIndexColumnRef)) { EncodedColumnsUtil.setColumns(columnRef.getColumn(), tableRef.getTable(), scan); } } } public PTable createProjectedTable(boolean retainPKColumns, StatementContext context) throws SQLException { assert(!isSubselect()); List sourceColumns = new ArrayList(); PTable table = tableRef.getTable(); if (retainPKColumns) { for (PColumn column : table.getPKColumns()) { sourceColumns.add(new ColumnRef(tableRef, column.getPosition())); } } if (isWildCardSelect()) { for (PColumn column : table.getColumns()) { if (!retainPKColumns || !SchemaUtil.isPKColumn(column)) { sourceColumns.add(new ColumnRef(tableRef, column.getPosition())); } } } else { for (Map.Entry e : columnRefs.entrySet()) { ColumnRef columnRef = e.getKey(); if (columnRef.getTableRef().equals(tableRef) && (!retainPKColumns || !SchemaUtil.isPKColumn(columnRef.getColumn()))) { if (columnRef instanceof LocalIndexColumnRef) { sourceColumns.add(new LocalIndexDataColumnRef(context, IndexUtil.getIndexColumnName(columnRef.getColumn()))); } else { sourceColumns.add(columnRef); } } } } return TupleProjectionCompiler.createProjectedTable(tableRef, sourceColumns, retainPKColumns); } public PTable createProjectedTable(RowProjector rowProjector) throws SQLException { assert(isSubselect()); TableRef tableRef = 
FromCompiler.getResolverForCompiledDerivedTable(statement.getConnection(), this.tableRef, rowProjector).getTables().get(0); List sourceColumns = new ArrayList(); PTable table = tableRef.getTable(); for (PColumn column : table.getColumns()) { sourceColumns.add(new ColumnRef(tableRef, column.getPosition())); } return TupleProjectionCompiler.createProjectedTable(tableRef, sourceColumns, false); } } private static class WhereNodeVisitor extends BooleanParseNodeVisitor { private Table table; private List postFilters; private List selfTableRefs; private boolean isPrefilterAccepted; private List prefilterAcceptedTables; ColumnRefParseNodeVisitor columnRefVisitor; public WhereNodeVisitor(ColumnResolver resolver, Table table, List postFilters, List selfTableRefs, boolean isPrefilterAccepted, List prefilterAcceptedTables, PhoenixConnection connection) { this.table = table; this.postFilters = postFilters; this.selfTableRefs = selfTableRefs; this.isPrefilterAccepted = isPrefilterAccepted; this.prefilterAcceptedTables = prefilterAcceptedTables; this.columnRefVisitor = new ColumnRefParseNodeVisitor(resolver, connection); } @Override protected boolean enterBooleanNode(ParseNode node) throws SQLException { return false; } @Override protected Void leaveBooleanNode(ParseNode node, List l) throws SQLException { columnRefVisitor.reset(); node.accept(columnRefVisitor); ColumnRefParseNodeVisitor.ColumnRefType type = columnRefVisitor.getContentType(selfTableRefs); switch (type) { case NONE: case SELF_ONLY: if (isPrefilterAccepted) { table.addFilter(node); } else { postFilters.add(node); } break; case FOREIGN_ONLY: JoinTable matched = null; for (JoinSpec joinSpec : prefilterAcceptedTables) { if (columnRefVisitor.getContentType(joinSpec.getJoinTable().getTableRefs()) == ColumnRefParseNodeVisitor.ColumnRefType.SELF_ONLY) { matched = joinSpec.getJoinTable(); break; } } if (matched != null) { matched.addFilter(node); } else { postFilters.add(node); } break; default: postFilters.add(node); 
break; } return null; } @Override protected boolean enterNonBooleanNode(ParseNode node) throws SQLException { return false; } @Override protected Void leaveNonBooleanNode(ParseNode node, List l) throws SQLException { return null; } @Override public boolean visitEnter(AndParseNode node) throws SQLException { return true; } @Override public Void visitLeave(AndParseNode node, List l) throws SQLException { return null; } @Override public Void visitLeave(ComparisonParseNode node, List l) throws SQLException { if (!(node instanceof EqualParseNode)) return leaveBooleanNode(node, l); ListIterator iter = prefilterAcceptedTables.listIterator(prefilterAcceptedTables.size()); while (iter.hasPrevious()) { JoinSpec joinSpec = iter.previous(); if (joinSpec.getType() != JoinType.Inner || joinSpec.isSingleValueOnly()) { continue; } try { joinSpec.addOnCondition(node); return null; } catch (SQLException e) { } } return leaveBooleanNode(node, l); } } private static class OnNodeVisitor extends BooleanParseNodeVisitor { private List onConditions; private Set dependencies; private JoinTable joinTable; private ColumnRefParseNodeVisitor columnRefVisitor; public OnNodeVisitor(ColumnResolver resolver, List onConditions, Set dependencies, JoinTable joinTable, PhoenixConnection connection) { this.onConditions = onConditions; this.dependencies = dependencies; this.joinTable = joinTable; this.columnRefVisitor = new ColumnRefParseNodeVisitor(resolver, connection); } @Override protected boolean enterBooleanNode(ParseNode node) throws SQLException { return false; } @Override protected Void leaveBooleanNode(ParseNode node, List l) throws SQLException { columnRefVisitor.reset(); node.accept(columnRefVisitor); ColumnRefParseNodeVisitor.ColumnRefType type = columnRefVisitor.getContentType(joinTable.getTableRefs()); if (type == ColumnRefParseNodeVisitor.ColumnRefType.NONE || type == ColumnRefParseNodeVisitor.ColumnRefType.SELF_ONLY) { joinTable.addFilter(node); } else { 
throwAmbiguousJoinConditionException(); } return null; }

        @Override
        protected boolean enterNonBooleanNode(ParseNode node) throws SQLException {
            return false;
        }

        @Override
        protected Void leaveNonBooleanNode(ParseNode node, List<Void> l) throws SQLException {
            return null;
        }

        @Override
        public boolean visitEnter(AndParseNode node) throws SQLException {
            return true;
        }

        @Override
        public Void visitLeave(AndParseNode node, List<Void> l) throws SQLException {
            return null;
        }

        /**
         * Classifies one comparison of the ON clause.
         * <p>
         * Non-equality comparisons are delegated to {@code leaveBooleanNode}. For an equality,
         * both operands are scanned for column references and the node is then either
         * added to the join table as a filter (neither side references a foreign table),
         * recorded as an ON condition with the foreign side on the left, or rejected as
         * ambiguous.
         *
         * @throws SQLException if the condition matches none of the supported shapes
         */
        @Override
        public Void visitLeave(ComparisonParseNode node, List<Void> l) throws SQLException {
            if (!(node instanceof EqualParseNode)) {
                return leaveBooleanNode(node, l);
            }

            // The visitor is shared, so the table refs of each side are copied out
            // before the visitor is reset for the other side.
            columnRefVisitor.reset();
            node.getLHS().accept(columnRefVisitor);
            ColumnRefParseNodeVisitor.ColumnRefType lhsType =
                    columnRefVisitor.getContentType(joinTable.getTableRefs());
            Set<TableRef> lhsTableRefSet = Sets.newHashSet(columnRefVisitor.getTableRefSet());

            columnRefVisitor.reset();
            node.getRHS().accept(columnRefVisitor);
            ColumnRefParseNodeVisitor.ColumnRefType rhsType =
                    columnRefVisitor.getContentType(joinTable.getTableRefs());
            Set<TableRef> rhsTableRefSet = Sets.newHashSet(columnRefVisitor.getTableRefSet());

            if ((lhsType == ColumnRefParseNodeVisitor.ColumnRefType.SELF_ONLY
                        || lhsType == ColumnRefParseNodeVisitor.ColumnRefType.NONE)
                    && (rhsType == ColumnRefParseNodeVisitor.ColumnRefType.SELF_ONLY
                        || rhsType == ColumnRefParseNodeVisitor.ColumnRefType.NONE)) {
                joinTable.addFilter(node);
            } else if (lhsType == ColumnRefParseNodeVisitor.ColumnRefType.FOREIGN_ONLY
                    && rhsType == ColumnRefParseNodeVisitor.ColumnRefType.SELF_ONLY) {
                onConditions.add((EqualParseNode) node);
                dependencies.addAll(lhsTableRefSet);
            } else if (rhsType == ColumnRefParseNodeVisitor.ColumnRefType.FOREIGN_ONLY
                    && lhsType == ColumnRefParseNodeVisitor.ColumnRefType.SELF_ONLY) {
                // Swap the operands so that the foreign expression is always on the left.
                onConditions.add(NODE_FACTORY.equal(node.getRHS(), node.getLHS()));
                dependencies.addAll(rhsTableRefSet);
            } else {
                throwAmbiguousJoinConditionException();
            }
            return null;
        }

        /*
         * Conditions in the ON clause can only be:
         * 1) an equal test between a self table expression and a foreign
         *    table expression.
         * 2) a boolean condition referencing to the self table only.
         * Otherwise, it can be ambiguous.
         */
        public void throwAmbiguousJoinConditionException() throws SQLException {
            throw new SQLExceptionInfo.Builder(SQLExceptionCode.AMBIGUOUS_JOIN_CONDITION).build().buildException();
        }
    }

    /**
     * A {@link ColumnRef} built against one table reference that reports a different
     * (index) table reference from {@link #getTableRef()}.
     */
    private static class LocalIndexColumnRef extends ColumnRef {
        private final TableRef indexTableRef;

        public LocalIndexColumnRef(TableRef tableRef, String familyName,
                String columnName, TableRef indexTableRef) throws MetaDataEntityNotFoundException {
            super(tableRef, familyName, columnName);
            this.indexTableRef = indexTableRef;
        }

        @Override
        public TableRef getTableRef() {
            return indexTableRef;
        }
    }

    /**
     * Collects the column references found in a parse tree, together with the set of
     * tables they belong to. Call {@link #reset()} before reusing an instance.
     */
    private static class ColumnRefParseNodeVisitor extends StatelessTraverseAllParseNodeVisitor {
        /** How the visited columns relate to a given list of "self" tables. */
        public enum ColumnRefType { NONE, SELF_ONLY, FOREIGN_ONLY, COMPLEX }

        private final ColumnResolver resolver;
        private final PhoenixConnection connection;
        private final Set<TableRef> tableRefSet;
        private final Map<ColumnRef, ColumnParseNode> columnRefMap;

        public ColumnRefParseNodeVisitor(ColumnResolver resolver, PhoenixConnection connection) {
            this.resolver = resolver;
            this.tableRefSet = new HashSet<TableRef>();
            this.columnRefMap = new HashMap<ColumnRef, ColumnParseNode>();
            this.connection = connection;
        }

        /** Forgets everything collected so far. */
        public void reset() {
            this.tableRefSet.clear();
            this.columnRefMap.clear();
        }

        /**
         * Resolves the column and records it and its table reference.
         *
         * @throws SQLException if the column cannot be resolved and its table is not a local index
         */
        @Override
        public Void visit(ColumnParseNode node) throws SQLException {
            ColumnRef columnRef = null;
            try {
                columnRef = resolver.resolveColumn(node.getSchemaName(), node.getTableName(), node.getName());
            } catch (ColumnNotFoundException e) {
                // This could be a LocalIndexDataColumnRef. If so, the table name must have
                // been appended by the IndexStatementRewriter, and we can convert it into
                // a LocalIndexColumnRef resolved against the parent (data) table.
                TableRef tableRef = resolver.resolveTable(node.getSchemaName(), node.getTableName());
                if (tableRef.getTable().getIndexType() == IndexType.LOCAL) {
                    String schemaName = tableRef.getTable().getSchemaName().getString();
                    String parentTableName = tableRef.getTable().getParentTableName().getString();
                    TableRef parentTableRef = FromCompiler.getResolver(
                            NODE_FACTORY.namedTable(null, TableName.create(schemaName, parentTableName)),
                            connection).resolveTable(schemaName, parentTableName);
                    columnRef = new LocalIndexColumnRef(parentTableRef,
                            IndexUtil.getDataColumnFamilyName(node.getName()),
                            IndexUtil.getDataColumnName(node.getName()), tableRef);
                } else {
                    throw e;
                }
            }
            columnRefMap.put(columnRef, node);
            tableRefSet.add(columnRef.getTableRef());
            return null;
        }

        /** Returns the live (not copied) set of table references seen since the last reset. */
        public Set<TableRef> getTableRefSet() {
            return tableRefSet;
        }

        /** Returns the live (not copied) map from resolved column to the parse node it came from. */
        public Map<ColumnRef, ColumnParseNode> getColumnRefMap() {
            return columnRefMap;
        }

        /**
         * Classifies the collected table references against {@code selfTableRefs}.
         *
         * @param selfTableRefs the table references regarded as "self"
         * @return {@code NONE} if no column was visited, {@code SELF_ONLY} or
         *         {@code FOREIGN_ONLY} if all visited tables fall on one side, and
         *         {@code COMPLEX} if both sides are referenced
         */
        public ColumnRefType getContentType(List<TableRef> selfTableRefs) {
            if (tableRefSet.isEmpty()) {
                return ColumnRefType.NONE;
            }

            ColumnRefType ret = ColumnRefType.NONE;
            for (TableRef tRef : tableRefSet) {
                boolean isSelf = selfTableRefs.contains(tRef);
                switch (ret) {
                case NONE:
                    ret = isSelf ? ColumnRefType.SELF_ONLY : ColumnRefType.FOREIGN_ONLY;
                    break;
                case SELF_ONLY:
                    ret = isSelf ? ColumnRefType.SELF_ONLY : ColumnRefType.COMPLEX;
                    break;
                case FOREIGN_ONLY:
                    ret = isSelf ? ColumnRefType.COMPLEX : ColumnRefType.FOREIGN_ONLY;
                    break;
                default: // COMPLEX do nothing
                    break;
                }

                // Once both sides have been seen the answer cannot change any more.
                if (ret == ColumnRefType.COMPLEX) {
                    break;
                }
            }

            return ret;
        }
    }

    // for creation of new statements
    private static final ParseNodeFactory NODE_FACTORY = new ParseNodeFactory();

    /**
     * Returns true if the statement is not a join, not an aggregate, not distinct, does not
     * select from a derived table, and has neither a LIMIT nor an OFFSET.
     */
    private static boolean isFlat(SelectStatement select) {
        return !select.isJoin()
                && !select.isAggregate()
                && !select.isDistinct()
                && !(select.getFrom() instanceof DerivedTableNode)
                && select.getLimit() == null
                && select.getOffset() == null;
    }

    /**
     * Combines the given nodes into one condition.
     *
     * @return {@code null} for an empty list, the only element of a singleton list,
     *         otherwise an AND node over all of them
     */
    private static ParseNode combine(List<ParseNode> nodes) {
        if (nodes.isEmpty()) {
            return null;
        }

        if (nodes.size() == 1) {
            return nodes.get(0);
        }

        return NODE_FACTORY.and(nodes);
    }

    /**
     * Picks from a select list the parts that concern {@code tableRef}.
     * <p>
     * A table wildcard that resolves to {@code tableRef} short-circuits and becomes the sole
     * result. Otherwise a node that references only {@code tableRef} is kept as is, and a
     * node that mixes tables contributes one un-aliased node per column of {@code tableRef}.
     */
    private List<AliasedNode> extractFromSelect(List<AliasedNode> select, TableRef tableRef,
            ColumnResolver resolver) throws SQLException {
        List<AliasedNode> ret = new ArrayList<AliasedNode>();
        ColumnRefParseNodeVisitor visitor = new ColumnRefParseNodeVisitor(resolver, statement.getConnection());
        for (AliasedNode aliasedNode : select) {
            ParseNode node = aliasedNode.getNode();
            if (node instanceof TableWildcardParseNode) {
                TableName tableName = ((TableWildcardParseNode) node).getTableName();
                if (tableRef.equals(resolver.resolveTable(tableName.getSchemaName(), tableName.getTableName()))) {
                    ret.clear();
                    ret.add(aliasedNode);
                    return ret;
                }
                continue;
            }

            node.accept(visitor);
            ColumnRefParseNodeVisitor.ColumnRefType type =
                    visitor.getContentType(Collections.singletonList(tableRef));
            if (type == ColumnRefParseNodeVisitor.ColumnRefType.SELF_ONLY) {
                ret.add(aliasedNode);
            } else if (type == ColumnRefParseNodeVisitor.ColumnRefType.COMPLEX) {
                for (Map.Entry<ColumnRef, ColumnParseNode> entry : visitor.getColumnRefMap().entrySet()) {
                    if (entry.getKey().getTableRef().equals(tableRef)) {
                        ret.add(NODE_FACTORY.aliasedNode(null, entry.getValue()));
                    }
                }
            }
            visitor.reset();
        }
        return ret;
    }

    /**
     * Compiles the post-join filters into a single expression.
     *
     * @return {@code null} if there are no filters, the compiled filter if there is exactly
     *         one, otherwise the conjunction of all compiled filters
     */
    private static Expression compilePostFilterExpression(StatementContext context,
            List<ParseNode> postFilters) throws SQLException {
        if (postFilters.isEmpty()) {
            return null;
        }

        ExpressionCompiler expressionCompiler = new ExpressionCompiler(context);
        List<Expression> expressions = new ArrayList<Expression>(postFilters.size());
        for (ParseNode postFilter : postFilters) {
            expressionCompiler.reset();
            Expression expression = postFilter.accept(expressionCompiler);
            expressions.add(expression);
        }

        if (expressions.size() == 1) {
            return expressions.get(0);
        }

        return AndExpression.create(expressions);
    }

    /**
     * Lets the optimizer pick a plan for every non-subselect table of the join and, if any
     * plan targets a different table than the one written in the query, rewrites the
     * statement to select from the chosen tables instead.
     * <p>
     * A GROUP BY (or, when there is no GROUP BY, an ORDER BY) is handed to a table's
     * sub-query only if all of its columns come from a single table and that table is the
     * table reference of the compiled join plan.
     *
     * @return {@code select} itself if no table was replaced, otherwise the rewritten statement
     */
    public static SelectStatement optimize(PhoenixStatement statement, SelectStatement select,
            final ColumnResolver resolver) throws SQLException {
        TableRef groupByTableRef = null;
        TableRef orderByTableRef = null;
        if (select.getGroupBy() != null && !select.getGroupBy().isEmpty()) {
            ColumnRefParseNodeVisitor groupByVisitor =
                    new ColumnRefParseNodeVisitor(resolver, statement.getConnection());
            for (ParseNode node : select.getGroupBy()) {
                node.accept(groupByVisitor);
            }
            Set<TableRef> set = groupByVisitor.getTableRefSet();
            if (set.size() == 1) {
                groupByTableRef = set.iterator().next();
            }
        } else if (select.getOrderBy() != null && !select.getOrderBy().isEmpty()) {
            ColumnRefParseNodeVisitor orderByVisitor =
                    new ColumnRefParseNodeVisitor(resolver, statement.getConnection());
            for (OrderByNode node : select.getOrderBy()) {
                node.getNode().accept(orderByVisitor);
            }
            Set<TableRef> set = orderByVisitor.getTableRefSet();
            if (set.size() == 1) {
                orderByTableRef = set.iterator().next();
            }
        }

        JoinTable join = compile(statement, select, resolver);
        if (groupByTableRef != null || orderByTableRef != null) {
            // Compile the join once to learn the plan's table reference; the GROUP BY /
            // ORDER BY table is only kept if it is that table.
            QueryCompiler compiler = new QueryCompiler(statement, select, resolver, false);
            List<Object> binds = statement.getParameters();
            StatementContext ctx = new StatementContext(statement, resolver, new Scan(),
                    new SequenceManager(statement));
            QueryPlan plan = compiler.compileJoinQuery(ctx, binds, join, false, false, null);
            TableRef table = plan.getTableRef();
            if (groupByTableRef != null && !groupByTableRef.equals(table)) {
                groupByTableRef = null;
            }
            if (orderByTableRef != null && !orderByTableRef.equals(table)) {
                orderByTableRef = null;
            }
        }

        // Maps each table written in the query to the table the optimizer chose instead.
        final Map<TableRef, TableRef> replacement = new HashMap<TableRef, TableRef>();

        for (Table table : join.getTables()) {
            if (table.isSubselect()) {
                continue;
            }
            TableRef tableRef = table.getTableRef();
            List<ParseNode> groupBy = tableRef.equals(groupByTableRef) ? select.getGroupBy() : null;
            List<OrderByNode> orderBy = tableRef.equals(orderByTableRef) ? select.getOrderBy() : null;
            SelectStatement stmt = getSubqueryForOptimizedPlan(select.getHint(), table.getDynamicColumns(),
                    table.getTableSamplingRate(), tableRef, join.getColumnRefs(), table.getPreFiltersCombined(),
                    groupBy, orderBy, table.isWildCardSelect(), select.hasSequence(),
                    select.getUdfParseNodes());
            QueryPlan plan = statement.getConnection().getQueryServices().getOptimizer().optimize(statement, stmt);
            if (!plan.getTableRef().equals(tableRef)) {
                replacement.put(tableRef, plan.getTableRef());
            }
        }

        if (replacement.isEmpty()) {
            return select;
        }

        TableNode from = select.getFrom();
        TableNode newFrom = from.accept(new TableNodeVisitor<TableNode>() {
            private TableRef resolveTable(String alias, TableName name) throws SQLException {
                if (alias != null) {
                    return resolver.resolveTable(null, alias);
                }

                return resolver.resolveTable(name.getSchemaName(), name.getTableName());
            }

            private TableName getReplacedTableName(TableRef tableRef) {
                String schemaName = tableRef.getTable().getSchemaName().getString();
                return TableName.create(schemaName.length() == 0 ? null : schemaName,
                        tableRef.getTable().getTableName().getString());
            }

            @Override
            public TableNode visit(BindTableNode boundTableNode) throws SQLException {
                TableRef tableRef = resolveTable(boundTableNode.getAlias(), boundTableNode.getName());
                TableRef replaceRef = replacement.get(tableRef);
                if (replaceRef == null) {
                    return boundTableNode;
                }

                // The alias is re-emitted wrapped in double quotes.
                String alias = boundTableNode.getAlias();
                return NODE_FACTORY.bindTable(alias == null ? null : '"' + alias + '"',
                        getReplacedTableName(replaceRef));
            }

            @Override
            public TableNode visit(JoinTableNode joinNode) throws SQLException {
                TableNode lhs = joinNode.getLHS();
                TableNode rhs = joinNode.getRHS();
                TableNode lhsReplace = lhs.accept(this);
                TableNode rhsReplace = rhs.accept(this);
                // Identity comparison: an untouched child is returned as the same instance.
                if (lhs == lhsReplace && rhs == rhsReplace) {
                    return joinNode;
                }

                return NODE_FACTORY.join(joinNode.getType(), lhsReplace, rhsReplace,
                        joinNode.getOnNode(), joinNode.isSingleValueOnly());
            }

            @Override
            public TableNode visit(NamedTableNode namedTableNode) throws SQLException {
                TableRef tableRef = resolveTable(namedTableNode.getAlias(), namedTableNode.getName());
                TableRef replaceRef = replacement.get(tableRef);
                if (replaceRef == null) {
                    return namedTableNode;
                }

                // The alias is re-emitted wrapped in double quotes.
                String alias = namedTableNode.getAlias();
                return NODE_FACTORY.namedTable(alias == null ? null : '"' + alias + '"',
                        getReplacedTableName(replaceRef), namedTableNode.getDynamicColumns(),
                        namedTableNode.getTableSamplingRate());
            }

            @Override
            public TableNode visit(DerivedTableNode subselectNode) throws SQLException {
                return subselectNode;
            }
        });

        SelectStatement indexSelect =
                IndexStatementRewriter.translate(NODE_FACTORY.select(select, newFrom), resolver, replacement);
        for (TableRef indexTableRef : replacement.values()) {
            // replace expressions with corresponding matching columns for functional indexes
            indexSelect = ParseNodeRewriter.rewrite(indexSelect,
                    new IndexExpressionParseNodeRewriter(indexTableRef.getTable(),
                            indexTableRef.getTableAlias(), statement.getConnection(),
                            indexSelect.getUdfParseNodes()));
        }
        return indexSelect;
    }

    /**
     * Builds the single-table SELECT that is handed to the optimizer for {@code tableRef}.
     * <p>
     * The select list is a wildcard if {@code isWildCardSelect} is set; otherwise it holds one
     * quoted column per key of {@code columnRefs} that belongs to {@code tableRef}, each
     * wrapped in the COUNT aggregate function when a GROUP BY is supplied. The statement is
     * flagged as an aggregate exactly when {@code groupBy} is non-null.
     *
     * @param columnRefs only the keys are read
     * @param groupBy    may be {@code null}
     * @param orderBy    may be {@code null}
     */
    private static SelectStatement getSubqueryForOptimizedPlan(HintNode hintNode, List<ColumnDef> dynamicCols,
            Double tableSamplingRate, TableRef tableRef, Map<ColumnRef, ?> columnRefs, ParseNode where,
            List<ParseNode> groupBy, List<OrderByNode> orderBy, boolean isWildCardSelect, boolean hasSequence,
            Map<String, UDFParseNode> udfParseNodes) {
        String schemaName = tableRef.getTable().getSchemaName().getString();
        TableName tName = TableName.create(schemaName.length() == 0 ? null : schemaName,
                tableRef.getTable().getTableName().getString());
        List<AliasedNode> selectList = new ArrayList<AliasedNode>();
        if (isWildCardSelect) {
            selectList.add(NODE_FACTORY.aliasedNode(null, WildcardParseNode.INSTANCE));
        } else {
            for (ColumnRef colRef : columnRefs.keySet()) {
                if (colRef.getTableRef().equals(tableRef)) {
                    ParseNode node = NODE_FACTORY.column(tName,
                            '"' + colRef.getColumn().getName().getString() + '"', null);
                    if (groupBy != null) {
                        node = NODE_FACTORY.function(CountAggregateFunction.NAME, Collections.singletonList(node));
                    }
                    selectList.add(NODE_FACTORY.aliasedNode(null, node));
                }
            }
        }

        String tableAlias = tableRef.getTableAlias();
        TableNode from = NODE_FACTORY.namedTable(tableAlias == null ? null : '"' + tableAlias + '"',
                tName, dynamicCols, tableSamplingRate);

        return NODE_FACTORY.select(from, hintNode, false, selectList, where, groupBy, null, orderBy, null, null,
                0, groupBy != null, hasSequence, Collections.<SelectStatement> emptyList(), udfParseNodes);
    }

    /**
     * Merges two projected tables into the projected table of their join.
     * <p>
     * The left columns come first; for a full join they are re-created as nullable. The
     * non-PK columns of the right table follow, renumbered from the end of the left columns,
     * and keep their own nullability only for an inner join. All table-level properties are
     * taken from {@code left}.
     *
     * @throws IllegalArgumentException if either table is not of type {@code PROJECTED}
     */
    public static PTable joinProjectedTables(PTable left, PTable right, JoinType type) throws SQLException {
        Preconditions.checkArgument(left.getType() == PTableType.PROJECTED);
        Preconditions.checkArgument(right.getType() == PTableType.PROJECTED);
        List<PColumn> merged = Lists.<PColumn> newArrayList();
        if (type == JoinType.Full) {
            for (PColumn c : left.getColumns()) {
                merged.add(new ProjectedColumn(c.getName(), c.getFamilyName(),
                        c.getPosition(), true, ((ProjectedColumn) c).getSourceColumnRef(),
                        SchemaUtil.isPKColumn(c) ? null : c.getName().getBytes()));
            }
        } else {
            merged.addAll(left.getColumns());
        }

        int position = merged.size();
        for (PColumn c : right.getColumns()) {
            if (!SchemaUtil.isPKColumn(c)) {
                PColumn column = new ProjectedColumn(c.getName(), c.getFamilyName(),
                        position++, type == JoinType.Inner ? c.isNullable() : true,
                        ((ProjectedColumn) c).getSourceColumnRef(), c.getName().getBytes());
                merged.add(column);
            }
        }

        // NOTE(review): presumably the first column of a salted table is the salt column,
        // which makePTable adds back itself - confirm against PTableImpl.
        if (left.getBucketNum() != null) {
            merged.remove(0);
        }

        return PTableImpl.makePTable(left.getTenantId(), left.getSchemaName(),
                PNameFactory.newName(SchemaUtil.getTableName(left.getName().getString(),
                        right.getName().getString())),
                left.getType(), left.getIndexState(), left.getTimeStamp(), left.getSequenceNumber(),
                left.getPKName(), left.getBucketNum(), merged, left.getParentSchemaName(),
                left.getParentTableName(), left.getIndexes(), left.isImmutableRows(),
                Collections.<PName> emptyList(), null, null, PTable.DEFAULT_DISABLE_WAL,
                left.isMultiTenant(), left.getStoreNulls(), left.getViewType(), left.getViewIndexId(),
                left.getIndexType(), left.rowKeyOrderOptimizable(), left.isTransactional(),
                left.getUpdateCacheFrequency(), left.getIndexDisableTimestamp(), left.isNamespaceMapped(),
                left.getAutoPartitionSeqName(), left.isAppendOnlySchema(), ONE_CELL_PER_COLUMN,
                NON_ENCODED_QUALIFIERS, PTable.EncodedCQCounter.NULL_COUNTER,
                left.useStatsForParallelization());
    }
}