All Downloads are FREE. Search and download functionalities are using the official Maven repository.

org.apache.phoenix.compile.SubqueryRewriter Maven / Gradle / Ivy

The newest version!
/*
 * Licensed to the Apache Software Foundation (ASF) under one
 * or more contributor license agreements.  See the NOTICE file
 * distributed with this work for additional information
 * regarding copyright ownership.  The ASF licenses this file
 * to you under the Apache License, Version 2.0 (the
 * "License"); you may not use this file except in compliance
 * with the License.  You may obtain a copy of the License at
 *
 * http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */
package org.apache.phoenix.compile;

import java.sql.SQLException;
import java.sql.SQLFeatureNotSupportedException;
import java.util.Collections;
import java.util.List;

import org.apache.hadoop.hbase.CompareOperator;
import org.apache.phoenix.exception.SQLExceptionCode;
import org.apache.phoenix.exception.SQLExceptionInfo;
import org.apache.phoenix.expression.function.DistinctValueAggregateFunction;
import org.apache.phoenix.jdbc.PhoenixConnection;
import org.apache.phoenix.parse.AliasedNode;
import org.apache.phoenix.parse.AndParseNode;
import org.apache.phoenix.parse.AndRewriterBooleanParseNodeVisitor;
import org.apache.phoenix.parse.ArrayAllComparisonNode;
import org.apache.phoenix.parse.ArrayAnyComparisonNode;
import org.apache.phoenix.parse.ColumnParseNode;
import org.apache.phoenix.parse.ComparisonParseNode;
import org.apache.phoenix.parse.CompoundParseNode;
import org.apache.phoenix.parse.DerivedTableNode;
import org.apache.phoenix.parse.ExistsParseNode;
import org.apache.phoenix.parse.HintNode;
import org.apache.phoenix.parse.InParseNode;
import org.apache.phoenix.parse.JoinTableNode.JoinType;
import org.apache.phoenix.parse.LiteralParseNode;
import org.apache.phoenix.parse.OrderByNode;
import org.apache.phoenix.parse.ParseNode;
import org.apache.phoenix.parse.ParseNodeFactory;
import org.apache.phoenix.parse.ParseNodeRewriter;
import org.apache.phoenix.parse.RowValueConstructorParseNode;
import org.apache.phoenix.parse.SelectStatement;
import org.apache.phoenix.parse.StatelessTraverseAllParseNodeVisitor;
import org.apache.phoenix.parse.SubqueryParseNode;
import org.apache.phoenix.parse.TableName;
import org.apache.phoenix.parse.TableNode;
import org.apache.phoenix.schema.ColumnFamilyNotFoundException;
import org.apache.phoenix.schema.ColumnNotFoundException;
import org.apache.phoenix.schema.TableNotFoundException;

import org.apache.phoenix.thirdparty.com.google.common.collect.Lists;

/**
 * Class for rewriting where-clause sub-queries into join queries.
 * 
 * If the where-clause sub-query is one of those top-node conditions (being 
 * the only condition node or direct descendant of AND nodes), we convert the
 * sub-query directly into semi-joins, anti-joins or inner-joins, and meanwhile
 * remove the original condition node from the where clause.
 * Otherwise, we convert the sub-query into left-joins and change the original
 * condition node into a null test of a join table field (ONE if matched, NULL 
 * if not matched).
 */
public class SubqueryRewriter extends ParseNodeRewriter {
    private static final ParseNodeFactory NODE_FACTORY = new ParseNodeFactory();
    
    private final ColumnResolver columnResolver;
    private final PhoenixConnection connection;
    private TableNode tableNode;
    private ParseNode topNode;
    
    public static SelectStatement transform(SelectStatement select, ColumnResolver resolver, PhoenixConnection connection) throws SQLException {
        ParseNode where = select.getWhere();
        if (where == null)
            return select;
        
        SubqueryRewriter rewriter = new SubqueryRewriter(select, resolver, connection);
        ParseNode normWhere = rewrite(where, rewriter);
        if (normWhere == where)
            return select;
        
        return NODE_FACTORY.select(select, rewriter.tableNode, normWhere);
    }
    
    protected SubqueryRewriter(SelectStatement select, ColumnResolver resolver, PhoenixConnection connection) {
        this.columnResolver = resolver;
        this.connection = connection;
        this.tableNode = select.getFrom();
        this.topNode = null;
    }
    
    @Override
    protected void enterParseNode(ParseNode node) {
        if (topNode == null) {
            topNode = node;
        }
        super.enterParseNode(node);
    }
    
    @Override
    protected ParseNode leaveCompoundNode(CompoundParseNode node, List children, ParseNodeRewriter.CompoundNodeFactory factory) {
        if (topNode == node) {
            topNode = null;
        }
        
        return super.leaveCompoundNode(node, children, factory);
    }

    @Override
    public boolean visitEnter(AndParseNode node) throws SQLException {
        return true;
    }

    @Override
    public ParseNode visitLeave(AndParseNode node, List l) throws SQLException {
        return leaveCompoundNode(node, l, new CompoundNodeFactory() {
            @Override
            public ParseNode createNode(List children) {
                if (children.isEmpty()) {
                    return null;
                }
                if (children.size() == 1) {
                    return children.get(0);
                }
                return NODE_FACTORY.and(children);
            }
        });
    }

    /**
     * 
     * {@code
     * Rewrite the In Subquery to semi/anti/left join for both NonCorrelated and Correlated subquery.
     *
     * 1.If the {@link InParseNode} is the only node in where clause or is the ANDed part of the where clause,
     *   then we would rewrite the In Subquery to semi/anti join:
     *   For  NonCorrelated subquery, an example is:
     *    SELECT item_id, name FROM item i WHERE i.item_id IN
     *    (SELECT item_id FROM order o  where o.price > 8)
     *
     *    The above sql would be rewritten as:
     *    SELECT ITEM_ID,NAME FROM item I  Semi JOIN
     *    (SELECT DISTINCT 1 $35,ITEM_ID $36 FROM order O  WHERE O.PRICE > 8) $34
     *     ON (I.ITEM_ID = $34.$36)
     *
     *   For Correlated subquery, an example is:
     *    SELECT item_id, name FROM item i WHERE i.item_id IN
     *    (SELECT item_id FROM order o  where o.price = i.price)
     *
     *    The above sql would be rewritten as:
     *    SELECT ITEM_ID,NAME FROM item I  Semi JOIN
     *    (SELECT DISTINCT 1 $3,ITEM_ID $4,O.PRICE $2 FROM order O ) $1
     *    ON ((I.ITEM_ID = $1.$4 AND $1.$2 = I.PRICE))
     *
     * 2.If the {@link InParseNode} is the ORed part of the where clause,then we would rewrite the In Subquery to
     *   Left Join.
     *
     *   For  NonCorrelated subquery, an example is:
     *    SELECT item_id, name FROM item i WHERE i.item_id IN
     *    (SELECT max(item_id) FROM order o  where o.price > 8 group by o.customer_id,o.item_id) or i.discount1 > 10
     *
     *    The above sql would be rewritten as:
     *    SELECT ITEM_ID,NAME FROM item I  Left JOIN
     *    (SELECT DISTINCT 1 $56, MAX(ITEM_ID) $57 FROM order O  WHERE O.PRICE > 8 GROUP BY O.CUSTOMER_ID,O.ITEM_ID) $55
     *    ON (I.ITEM_ID = $55.$57) WHERE ($55.$56 IS NOT NULL  OR I.DISCOUNT1 > 10)
     *
     *   For  Correlated subquery, an example is:
     *     SELECT item_id, name FROM item i WHERE i.item_id IN
     *     (SELECT max(item_id) FROM order o  where o.price = i.price group by o.customer_id) or i.discount1 > 10;
     *
     *     The above sql would be rewritten as:
     *     SELECT ITEM_ID,NAME FROM item I  Left JOIN
     *     (SELECT DISTINCT 1 $28, MAX(ITEM_ID) $29,O.PRICE $27 FROM order O  GROUP BY O.PRICE,O.CUSTOMER_ID) $26
     *     ON ((I.ITEM_ID = $26.$29 AND $26.$27 = I.PRICE)) WHERE ($26.$28 IS NOT NULL  OR I.DISCOUNT1 > 10)
     * }
     * 
*/ @Override public ParseNode visitLeave(InParseNode inParseNode, List childParseNodes) throws SQLException { boolean isTopNode = topNode == inParseNode; if (isTopNode) { topNode = null; } SubqueryParseNode subqueryParseNode = (SubqueryParseNode) childParseNodes.get(1); SelectStatement subquerySelectStatementToUse = fixSubqueryStatement(subqueryParseNode.getSelectNode()); String subqueryTableTempAlias = ParseNodeFactory.createTempAlias(); JoinConditionExtractor joinConditionExtractor = new JoinConditionExtractor( subquerySelectStatementToUse, columnResolver, connection, subqueryTableTempAlias); List newSubquerySelectAliasedNodes = null; ParseNode extractedJoinConditionParseNode = null; int extractedSelectAliasNodeCount = 0; List oldSubqueryAliasedNodes = subquerySelectStatementToUse.getSelect(); ParseNode whereParseNodeAfterExtract = subquerySelectStatementToUse.getWhere() == null ? null : subquerySelectStatementToUse.getWhere().accept(joinConditionExtractor); if (whereParseNodeAfterExtract == subquerySelectStatementToUse.getWhere()) { /** * It is an NonCorrelated subquery. */ newSubquerySelectAliasedNodes = Lists. newArrayListWithExpectedSize( oldSubqueryAliasedNodes.size() + 1); newSubquerySelectAliasedNodes.add( NODE_FACTORY.aliasedNode( ParseNodeFactory.createTempAlias(), LiteralParseNode.ONE)); this.addNewAliasedNodes(newSubquerySelectAliasedNodes, oldSubqueryAliasedNodes); subquerySelectStatementToUse = NODE_FACTORY.select( subquerySelectStatementToUse, !inParseNode.isSubqueryDistinct(), newSubquerySelectAliasedNodes, whereParseNodeAfterExtract); } else { /** * It is an Correlated subquery. */ List extractedAdditionalSelectAliasNodes = joinConditionExtractor.getAdditionalSubselectSelectAliasedNodes(); extractedSelectAliasNodeCount = extractedAdditionalSelectAliasNodes.size(); newSubquerySelectAliasedNodes = Lists. newArrayListWithExpectedSize( oldSubqueryAliasedNodes.size() + 1 + extractedAdditionalSelectAliasNodes.size()); newSubquerySelectAliasedNodes.add(NODE_FACTORY.aliasedNode( ParseNodeFactory.createTempAlias(), LiteralParseNode.ONE)); this.addNewAliasedNodes(newSubquerySelectAliasedNodes, oldSubqueryAliasedNodes); newSubquerySelectAliasedNodes.addAll(extractedAdditionalSelectAliasNodes); extractedJoinConditionParseNode = joinConditionExtractor.getJoinConditionParseNode(); boolean isAggregate = subquerySelectStatementToUse.isAggregate(); if (!isAggregate) { subquerySelectStatementToUse = NODE_FACTORY.select( subquerySelectStatementToUse, !inParseNode.isSubqueryDistinct(), newSubquerySelectAliasedNodes, whereParseNodeAfterExtract); } else { /** * If exists AggregateFunction,we must add the correlated join condition to both the * groupBy clause and select lists of the subquery. */ List newGroupByParseNodes = this.createNewGroupByParseNodes( extractedAdditionalSelectAliasNodes, subquerySelectStatementToUse); subquerySelectStatementToUse = NODE_FACTORY.select( subquerySelectStatementToUse, !inParseNode.isSubqueryDistinct(), newSubquerySelectAliasedNodes, whereParseNodeAfterExtract, newGroupByParseNodes, true); } } ParseNode joinOnConditionParseNode = getJoinConditionNodeForInSubquery( childParseNodes.get(0), newSubquerySelectAliasedNodes, subqueryTableTempAlias, extractedJoinConditionParseNode, extractedSelectAliasNodeCount); DerivedTableNode subqueryDerivedTableNode = NODE_FACTORY.derivedTable( subqueryTableTempAlias, subquerySelectStatementToUse); JoinType joinType = isTopNode ? (inParseNode.isNegate() ? JoinType.Anti : JoinType.Semi) : JoinType.Left; ParseNode resultWhereParseNode = isTopNode ? null : NODE_FACTORY.isNull( NODE_FACTORY.column( NODE_FACTORY.table(null, subqueryTableTempAlias), newSubquerySelectAliasedNodes.get(0).getAlias(), null), !inParseNode.isNegate()); tableNode = NODE_FACTORY.join( joinType, tableNode, subqueryDerivedTableNode, joinOnConditionParseNode, false); return resultWhereParseNode; } /** *
     * {@code
     * Rewrite the Exists Subquery to semi/anti/left join for both NonCorrelated and Correlated subquery.
     *
     * 1.If the {@link ExistsParseNode} is NonCorrelated subquery,the just add LIMIT 1.
     *    an example is:
     *    SELECT item_id, name FROM item i WHERE exists
     *    (SELECT 1 FROM order o  where o.price > 8)
     *
     *    The above sql would be rewritten as:
     *    SELECT ITEM_ID,NAME FROM item I  WHERE  EXISTS
     *    (SELECT 1 FROM ORDER_TABLE O  WHERE O.PRICE > 8 LIMIT 1)
     *
     *   another example is:
     *   SELECT item_id, name FROM item i WHERE exists
     *   (SELECT 1 FROM order o  where o.price > 8 group by o.customer_id,o.item_id having count(order_id) > 1)
     *    or i.discount1 > 10
     *
     *    The above sql would be rewritten as:
     *    SELECT ITEM_ID,NAME FROM item I  WHERE
     *    ( EXISTS (SELECT 1 FROM ORDER_TABLE O  WHERE O.PRICE > 8 GROUP BY O.CUSTOMER_ID,O.ITEM_ID HAVING  COUNT(ORDER_ID) > 1 LIMIT 1)
     *    OR I.DISCOUNT1 > 10)
     *
     * 2.If the {@link ExistsParseNode} is Correlated subquery and is the only node in where clause or
     *   is the ANDed part of the where clause, then we would rewrite the Exists Subquery to semi/anti join:
     *   an example is:
     *    SELECT item_id, name FROM item i WHERE exists
     *    (SELECT 1 FROM order o where o.price = i.price and o.quantity = 5 )
     *
     *    The above sql would be rewritten as:
     *    SELECT ITEM_ID,NAME FROM item I  Semi JOIN
     *    (SELECT DISTINCT 1 $3,O.PRICE $2 FROM ORDER_TABLE O  WHERE O.QUANTITY = 5) $1
     *    ON ($1.$2 = I.PRICE)
     *
     *   another example with AggregateFunction and groupBy is
     *   SELECT item_id, name FROM item i WHERE exists
     *   (SELECT 1 FROM order o  where o.item_id = i.item_id group by customer_id having count(order_id) > 1)
     *
     *    The above sql would be rewritten as:
     *     SELECT ITEM_ID,NAME FROM item I  Semi JOIN
     *     (SELECT DISTINCT 1 $3,O.ITEM_ID $2 FROM order O  GROUP BY O.ITEM_ID,CUSTOMER_ID HAVING  COUNT(ORDER_ID) > 1) $1
     *     ON ($1.$2 = I.ITEM_ID)
     *
     * 3.If the {@link ExistsParseNode} is Correlated subquery and is the ORed part of the where clause,
     *   then we would rewrite the Exists Subquery to Left Join.
     *   an example is:
     *   SELECT item_id, name FROM item i WHERE exists
     *   (SELECT 1 FROM order o  where o.item_id = i.item_id group by customer_id having count(order_id) > 1)
     *   or i.discount1 > 10
     *
     *    The above sql would be rewritten as:
     *    SELECT ITEM_ID,NAME FROM item I  Left JOIN
     *    (SELECT DISTINCT 1 $3,O.ITEM_ID $2 FROM order O  GROUP BY O.ITEM_ID,CUSTOMER_ID HAVING  COUNT(ORDER_ID) > 1) $1
     *    ON ($1.$2 = I.ITEM_ID) WHERE ($1.$3 IS NOT NULL  OR I.DISCOUNT1 > 10)
     * }
     * 
*/ @Override public ParseNode visitLeave( ExistsParseNode existsParseNode, List childParseNodes) throws SQLException { boolean isTopNode = topNode == existsParseNode; if (isTopNode) { topNode = null; } SubqueryParseNode subqueryParseNode = (SubqueryParseNode) childParseNodes.get(0); SelectStatement subquerySelectStatementToUse = fixSubqueryStatement(subqueryParseNode.getSelectNode()); String subqueryTableTempAlias = ParseNodeFactory.createTempAlias(); JoinConditionExtractor joinConditionExtractor = new JoinConditionExtractor( subquerySelectStatementToUse, columnResolver, connection, subqueryTableTempAlias); ParseNode whereParseNodeAfterExtract = subquerySelectStatementToUse.getWhere() == null ? null : subquerySelectStatementToUse.getWhere().accept(joinConditionExtractor); if (whereParseNodeAfterExtract == subquerySelectStatementToUse.getWhere()) { /** * It is non-correlated EXISTS subquery, add LIMIT 1 */ subquerySelectStatementToUse = NODE_FACTORY.select( subquerySelectStatementToUse, NODE_FACTORY.limit(NODE_FACTORY.literal(1))); subqueryParseNode = NODE_FACTORY.subquery(subquerySelectStatementToUse, false); existsParseNode = NODE_FACTORY.exists(subqueryParseNode, existsParseNode.isNegate()); return super.visitLeave( existsParseNode, Collections.singletonList(subqueryParseNode)); } List extractedAdditionalSelectAliasNodes = joinConditionExtractor.getAdditionalSubselectSelectAliasedNodes(); List newSubquerySelectAliasedNodes = Lists.newArrayListWithExpectedSize( extractedAdditionalSelectAliasNodes.size() + 1); /** * Just overwrite original subquery selectAliasNodes. */ newSubquerySelectAliasedNodes.add( NODE_FACTORY.aliasedNode(ParseNodeFactory.createTempAlias(), LiteralParseNode.ONE)); newSubquerySelectAliasedNodes.addAll(extractedAdditionalSelectAliasNodes); boolean isAggregate = subquerySelectStatementToUse.isAggregate(); if (!isAggregate) { subquerySelectStatementToUse = NODE_FACTORY.select( subquerySelectStatementToUse, true, newSubquerySelectAliasedNodes, whereParseNodeAfterExtract); } else { /** * If exists AggregateFunction,we must add the correlated join condition to both the * groupBy clause and select lists of the subquery. */ List newGroupByParseNodes = this.createNewGroupByParseNodes( extractedAdditionalSelectAliasNodes, subquerySelectStatementToUse); subquerySelectStatementToUse = NODE_FACTORY.select( subquerySelectStatementToUse, true, newSubquerySelectAliasedNodes, whereParseNodeAfterExtract, newGroupByParseNodes, true); } ParseNode joinOnConditionParseNode = joinConditionExtractor.getJoinConditionParseNode(); DerivedTableNode subqueryDerivedTableNode = NODE_FACTORY.derivedTable( subqueryTableTempAlias, subquerySelectStatementToUse); JoinType joinType = isTopNode ? (existsParseNode.isNegate() ? JoinType.Anti : JoinType.Semi) : JoinType.Left; ParseNode resultWhereParseNode = isTopNode ? null : NODE_FACTORY.isNull( NODE_FACTORY.column( NODE_FACTORY.table(null, subqueryTableTempAlias), newSubquerySelectAliasedNodes.get(0).getAlias(), null), !existsParseNode.isNegate()); tableNode = NODE_FACTORY.join( joinType, tableNode, subqueryDerivedTableNode, joinOnConditionParseNode, false); return resultWhereParseNode; } @Override public ParseNode visitLeave(ComparisonParseNode node, List l) throws SQLException { boolean isTopNode = topNode == node; if (isTopNode) { topNode = null; } ParseNode secondChild = l.get(1); if (!(secondChild instanceof SubqueryParseNode)) { return super.visitLeave(node, l); } SubqueryParseNode subqueryNode = (SubqueryParseNode) secondChild; SelectStatement subquery = fixSubqueryStatement(subqueryNode.getSelectNode()); String rhsTableAlias = ParseNodeFactory.createTempAlias(); JoinConditionExtractor conditionExtractor = new JoinConditionExtractor(subquery, columnResolver, connection, rhsTableAlias); ParseNode where = subquery.getWhere() == null ? null : subquery.getWhere().accept(conditionExtractor); if (where == subquery.getWhere()) { // non-correlated comparison subquery, add LIMIT 2, expectSingleRow = true subquery = NODE_FACTORY.select(subquery, NODE_FACTORY.limit(NODE_FACTORY.literal(2))); subqueryNode = NODE_FACTORY.subquery(subquery, true); l = Lists.newArrayList(l.get(0), subqueryNode); node = NODE_FACTORY.comparison(node.getFilterOp(), l.get(0), l.get(1)); return super.visitLeave(node, l); } ParseNode rhsNode = null; boolean isGroupby = !subquery.getGroupBy().isEmpty(); boolean isAggregate = subquery.isAggregate(); List aliasedNodes = subquery.getSelect(); if (aliasedNodes.size() == 1) { rhsNode = aliasedNodes.get(0).getNode(); } else { List nodes = Lists. newArrayListWithExpectedSize(aliasedNodes.size()); for (AliasedNode aliasedNode : aliasedNodes) { nodes.add(aliasedNode.getNode()); } rhsNode = NODE_FACTORY.rowValueConstructor(nodes); } List additionalSelectNodes = conditionExtractor.getAdditionalSubselectSelectAliasedNodes(); List selectNodes = Lists.newArrayListWithExpectedSize(additionalSelectNodes.size() + 1); selectNodes.add(NODE_FACTORY.aliasedNode(ParseNodeFactory.createTempAlias(), rhsNode)); selectNodes.addAll(additionalSelectNodes); if (!isAggregate) { subquery = NODE_FACTORY.select(subquery, subquery.isDistinct(), selectNodes, where); } else { List groupbyNodes = this.createNewGroupByParseNodes( additionalSelectNodes, subquery); subquery = NODE_FACTORY.select(subquery, subquery.isDistinct(), selectNodes, where, groupbyNodes, true); } ParseNode onNode = conditionExtractor.getJoinConditionParseNode(); TableNode rhsTable = NODE_FACTORY.derivedTable(rhsTableAlias, subquery); JoinType joinType = isTopNode ? JoinType.Inner : JoinType.Left; ParseNode ret = NODE_FACTORY.comparison(node.getFilterOp(), l.get(0), NODE_FACTORY.column(NODE_FACTORY.table(null, rhsTableAlias), selectNodes.get(0).getAlias(), null)); tableNode = NODE_FACTORY.join(joinType, tableNode, rhsTable, onNode, !isAggregate || isGroupby); return ret; } @Override public ParseNode visitLeave(ArrayAnyComparisonNode node, List l) throws SQLException { List children = leaveArrayComparisonNode(node, l); if (children == l) return super.visitLeave(node, l); node = NODE_FACTORY.arrayAny(children.get(0), (ComparisonParseNode) children.get(1)); return node; } @Override public ParseNode visitLeave(ArrayAllComparisonNode node, List l) throws SQLException { List children = leaveArrayComparisonNode(node, l); if (children == l) return super.visitLeave(node, l); node = NODE_FACTORY.arrayAll(children.get(0), (ComparisonParseNode) children.get(1)); return node; } protected List leaveArrayComparisonNode(ParseNode node, List l) throws SQLException { boolean isTopNode = topNode == node; if (isTopNode) { topNode = null; } ParseNode firstChild = l.get(0); if (!(firstChild instanceof SubqueryParseNode)) { return l; } SubqueryParseNode subqueryNode = (SubqueryParseNode) firstChild; SelectStatement subquery = fixSubqueryStatement(subqueryNode.getSelectNode()); String rhsTableAlias = ParseNodeFactory.createTempAlias(); JoinConditionExtractor conditionExtractor = new JoinConditionExtractor(subquery, columnResolver, connection, rhsTableAlias); ParseNode where = subquery.getWhere() == null ? null : subquery.getWhere().accept(conditionExtractor); if (where == subquery.getWhere()) { // non-correlated any/all comparison subquery return l; } ParseNode rhsNode = null; boolean isNonGroupByAggregate = subquery.getGroupBy().isEmpty() && subquery.isAggregate(); List aliasedNodes = subquery.getSelect(); String derivedTableAlias = null; if (!subquery.getGroupBy().isEmpty()) { derivedTableAlias = ParseNodeFactory.createTempAlias(); aliasedNodes = createNewAliasedNodes(aliasedNodes); } if (aliasedNodes.size() == 1) { rhsNode = derivedTableAlias == null ? aliasedNodes.get(0).getNode() : NODE_FACTORY.column(NODE_FACTORY.table(null, derivedTableAlias), aliasedNodes.get(0).getAlias(), null); } else { List nodes = Lists. newArrayListWithExpectedSize(aliasedNodes.size()); for (AliasedNode aliasedNode : aliasedNodes) { nodes.add(derivedTableAlias == null ? aliasedNode.getNode() : NODE_FACTORY.column(NODE_FACTORY.table(null, derivedTableAlias), aliasedNode.getAlias(), null)); } rhsNode = NODE_FACTORY.rowValueConstructor(nodes); } if (!isNonGroupByAggregate) { rhsNode = NODE_FACTORY.function(DistinctValueAggregateFunction.NAME, Collections.singletonList(rhsNode)); } List additionalSelectNodes = conditionExtractor.getAdditionalSubselectSelectAliasedNodes(); List selectNodes = Lists.newArrayListWithExpectedSize(additionalSelectNodes.size() + 1); selectNodes.add(NODE_FACTORY.aliasedNode(ParseNodeFactory.createTempAlias(), rhsNode)); selectNodes.addAll(additionalSelectNodes); List groupbyNodes = Lists.newArrayListWithExpectedSize(additionalSelectNodes.size()); for (AliasedNode aliasedNode : additionalSelectNodes) { groupbyNodes.add(aliasedNode.getNode()); } if (derivedTableAlias == null) { subquery = NODE_FACTORY.select(subquery, false, selectNodes, where, groupbyNodes, true); } else { List derivedTableGroupBy = Lists.newArrayListWithExpectedSize(subquery.getGroupBy().size() + groupbyNodes.size()); derivedTableGroupBy.addAll(groupbyNodes); derivedTableGroupBy.addAll(subquery.getGroupBy()); List derivedTableSelect = Lists.newArrayListWithExpectedSize(aliasedNodes.size() + selectNodes.size() - 1); derivedTableSelect.addAll(aliasedNodes); for (int i = 1; i < selectNodes.size(); i++) { AliasedNode aliasedNode = selectNodes.get(i); String alias = ParseNodeFactory.createTempAlias(); derivedTableSelect.add(NODE_FACTORY.aliasedNode(alias, aliasedNode.getNode())); aliasedNode = NODE_FACTORY.aliasedNode(aliasedNode.getAlias(), NODE_FACTORY.column(NODE_FACTORY.table(null, derivedTableAlias), alias, null)); selectNodes.set(i, aliasedNode); groupbyNodes.set(i - 1, aliasedNode.getNode()); } SelectStatement derivedTableStmt = NODE_FACTORY.select(subquery, subquery.isDistinct(), derivedTableSelect, where, derivedTableGroupBy, true); subquery = NODE_FACTORY.select(NODE_FACTORY.derivedTable(derivedTableAlias, derivedTableStmt), subquery.getHint(), false, selectNodes, null, groupbyNodes, null, Collections. emptyList(), null, null, subquery.getBindCount(), true, false, Collections. emptyList(), subquery.getUdfParseNodes()); } ParseNode onNode = conditionExtractor.getJoinConditionParseNode(); TableNode rhsTable = NODE_FACTORY.derivedTable(rhsTableAlias, subquery); JoinType joinType = isTopNode ? JoinType.Inner : JoinType.Left; tableNode = NODE_FACTORY.join(joinType, tableNode, rhsTable, onNode, false); firstChild = NODE_FACTORY.column(NODE_FACTORY.table(null, rhsTableAlias), selectNodes.get(0).getAlias(), null); if (isNonGroupByAggregate) { firstChild = NODE_FACTORY.upsertStmtArrayNode(Collections.singletonList(firstChild)); } ComparisonParseNode secondChild = (ComparisonParseNode) l.get(1); secondChild = NODE_FACTORY.comparison(secondChild.getFilterOp(), secondChild.getLHS(), NODE_FACTORY.elementRef(Lists.newArrayList(firstChild, NODE_FACTORY.literal(1)))); return Lists.newArrayList(firstChild, secondChild); } private SelectStatement fixSubqueryStatement(SelectStatement select) { if (!select.isUnion()) return select; // Wrap as a derived table. return NODE_FACTORY.select(NODE_FACTORY.derivedTable(ParseNodeFactory.createTempAlias(), select), HintNode.EMPTY_HINT_NODE, false, select.getSelect(), null, null, null, null, null, null, select.getBindCount(), false, false, Collections. emptyList(), select.getUdfParseNodes()); } /** * Create new {@link AliasedNode}s by every {@link ParseNode} in subquerySelectAliasedNodes and generate new aliases * by {@link ParseNodeFactory#createTempAlias}. * and generate new Aliases for subquerySelectAliasedNodes, * @param subquerySelectAliasedNodes * @param addSelectOne * @return */ private List createNewAliasedNodes(List subquerySelectAliasedNodes) { List newAliasedNodes = Lists. newArrayListWithExpectedSize( subquerySelectAliasedNodes.size()); this.addNewAliasedNodes(newAliasedNodes, subquerySelectAliasedNodes); return newAliasedNodes; } /** * Add every {@link ParseNode} in oldSelectAliasedNodes to newSelectAliasedNodes and generate new aliases by * {@link ParseNodeFactory#createTempAlias}. * @param oldSelectAliasedNodes * @param addSelectOne * @return */ private void addNewAliasedNodes(List newSelectAliasedNodes, List oldSelectAliasedNodes) { for (int index = 0; index < oldSelectAliasedNodes.size(); index++) { AliasedNode oldSelectAliasedNode = oldSelectAliasedNodes.get(index); newSelectAliasedNodes.add(NODE_FACTORY.aliasedNode( ParseNodeFactory.createTempAlias(), oldSelectAliasedNode.getNode())); } } /** * Get the join conditions in order to rewrite InSubquery to Join. * @param lhsParseNode * @param rhsSubquerySelectAliasedNodes the first element is {@link LiteralParseNode#ONE}. * @param rhsSubqueryTableAlias * @param extractedJoinConditionParseNode For NonCorrelated subquery, it is null. * @param extractedSelectAliasNodeCount For NonCorrelated subquery, it is 0. * @throws SQLException */ private ParseNode getJoinConditionNodeForInSubquery( ParseNode lhsParseNode, List rhsSubquerySelectAliasedNodes, String rhsSubqueryTableAlias, ParseNode extractedJoinConditionParseNode, int extractedSelectAliasNodeCount) throws SQLException { List lhsParseNodes; if (lhsParseNode instanceof RowValueConstructorParseNode) { lhsParseNodes = ((RowValueConstructorParseNode) lhsParseNode).getChildren(); } else { lhsParseNodes = Collections.singletonList(lhsParseNode); } if (lhsParseNodes.size() != (rhsSubquerySelectAliasedNodes.size() - 1 - extractedSelectAliasNodeCount)) { throw new SQLExceptionInfo.Builder( SQLExceptionCode.SUBQUERY_RETURNS_DIFFERENT_NUMBER_OF_FIELDS) .build().buildException(); } int count = lhsParseNodes.size(); TableName rhsSubqueryTableName = NODE_FACTORY.table(null, rhsSubqueryTableAlias); List joinEqualParseNodes = Lists.newArrayListWithExpectedSize( count + (extractedJoinConditionParseNode == null ? 0: 1)); for (int index = 0; index < count; index++) { /** * The +1 is to skip the first {@link LiteralParseNode#ONE} */ ParseNode rhsNode = NODE_FACTORY.column( rhsSubqueryTableName, rhsSubquerySelectAliasedNodes.get(index + 1).getAlias(), null); joinEqualParseNodes.add(NODE_FACTORY.equal(lhsParseNodes.get(index), rhsNode)); } if(extractedJoinConditionParseNode != null) { joinEqualParseNodes.add(extractedJoinConditionParseNode); } return joinEqualParseNodes.size() == 1 ? joinEqualParseNodes.get(0) : NODE_FACTORY.and(joinEqualParseNodes); } /** * Combine every {@link ParseNode} in extractedAdditionalSelectAliasNodes and GroupBy clause of the * subquerySelectStatementToUse to get new GroupBy ParseNodes. * @param extractedAdditionalSelectAliasNodes * @param subquerySelectStatementToUse * @return */ private List createNewGroupByParseNodes( List extractedAdditionalSelectAliasNodes, SelectStatement subquerySelectStatementToUse) { List newGroupByParseNodes = Lists.newArrayListWithExpectedSize( extractedAdditionalSelectAliasNodes.size() + subquerySelectStatementToUse.getGroupBy().size()); for (AliasedNode aliasedNode : extractedAdditionalSelectAliasNodes) { newGroupByParseNodes.add(aliasedNode.getNode()); } newGroupByParseNodes.addAll(subquerySelectStatementToUse.getGroupBy()); return newGroupByParseNodes; } private static class JoinConditionExtractor extends AndRewriterBooleanParseNodeVisitor { private final TableName tableName; private ColumnResolveVisitor columnResolveVisitor; private List additionalSubselectSelectAliasedNodes; private List joinConditionParseNodes; public JoinConditionExtractor(SelectStatement subquery, ColumnResolver outerResolver, PhoenixConnection connection, String tableAlias) throws SQLException { super(NODE_FACTORY); this.tableName = NODE_FACTORY.table(null, tableAlias); ColumnResolver localResolver = FromCompiler.getResolverForQuery(subquery, connection); this.columnResolveVisitor = new ColumnResolveVisitor(localResolver, outerResolver); this.additionalSubselectSelectAliasedNodes = Lists.newArrayList(); this.joinConditionParseNodes = Lists.newArrayList(); } public List getAdditionalSubselectSelectAliasedNodes() { return this.additionalSubselectSelectAliasedNodes; } public ParseNode getJoinConditionParseNode() { if (this.joinConditionParseNodes.isEmpty()) { return null; } if (this.joinConditionParseNodes.size() == 1) { return this.joinConditionParseNodes.get(0); } return NODE_FACTORY.and(this.joinConditionParseNodes); } @Override protected ParseNode leaveBooleanNode(ParseNode node, List l) throws SQLException { columnResolveVisitor.reset(); node.accept(columnResolveVisitor); ColumnResolveVisitor.ColumnResolveType type = columnResolveVisitor.getColumnResolveType(); if (type != ColumnResolveVisitor.ColumnResolveType.NONE && type != ColumnResolveVisitor.ColumnResolveType.LOCAL) throw new SQLFeatureNotSupportedException("Does not support non-standard or non-equi correlated-subquery conditions."); return node; } @Override public ParseNode visitLeave(ComparisonParseNode node, List l) throws SQLException { if (node.getFilterOp() != CompareOperator.EQUAL) return leaveBooleanNode(node, l); columnResolveVisitor.reset(); node.getLHS().accept(columnResolveVisitor); ColumnResolveVisitor.ColumnResolveType lhsType = columnResolveVisitor.getColumnResolveType(); columnResolveVisitor.reset(); node.getRHS().accept(columnResolveVisitor); ColumnResolveVisitor.ColumnResolveType rhsType = columnResolveVisitor.getColumnResolveType(); if ((lhsType == ColumnResolveVisitor.ColumnResolveType.NONE || lhsType == ColumnResolveVisitor.ColumnResolveType.LOCAL) && (rhsType == ColumnResolveVisitor.ColumnResolveType.NONE || rhsType == ColumnResolveVisitor.ColumnResolveType.LOCAL)) { return node; } if (lhsType == ColumnResolveVisitor.ColumnResolveType.LOCAL && rhsType == ColumnResolveVisitor.ColumnResolveType.OUTER) { String alias = ParseNodeFactory.createTempAlias(); this.additionalSubselectSelectAliasedNodes.add( NODE_FACTORY.aliasedNode(alias, node.getLHS())); ParseNode lhsNode = NODE_FACTORY.column(tableName, alias, null); this.joinConditionParseNodes.add(NODE_FACTORY.equal(lhsNode, node.getRHS())); return null; } if (lhsType == ColumnResolveVisitor.ColumnResolveType.OUTER && rhsType == ColumnResolveVisitor.ColumnResolveType.LOCAL) { String alias = ParseNodeFactory.createTempAlias(); this.additionalSubselectSelectAliasedNodes.add( NODE_FACTORY.aliasedNode(alias, node.getRHS())); ParseNode rhsNode = NODE_FACTORY.column(tableName, alias, null); this.joinConditionParseNodes.add(NODE_FACTORY.equal(node.getLHS(), rhsNode)); return null; } throw new SQLFeatureNotSupportedException("Does not support non-standard or non-equi correlated-subquery conditions."); } } /* * Class for resolving inner query column references */ private static class ColumnResolveVisitor extends StatelessTraverseAllParseNodeVisitor { public enum ColumnResolveType {NONE, LOCAL, OUTER, MIXED}; private final ColumnResolver localResolver; private final ColumnResolver outerResolver; private ColumnResolveType type; public ColumnResolveVisitor(ColumnResolver localResolver, ColumnResolver outerResolver) { this.localResolver = localResolver; this.outerResolver = outerResolver; this.type = ColumnResolveType.NONE; } public void reset() { this.type = ColumnResolveType.NONE; } public ColumnResolveType getColumnResolveType() { return this.type; } @Override public Void visit(ColumnParseNode node) throws SQLException { // Inner query column definitions should shade those of outer query. try { localResolver.resolveColumn(node.getSchemaName(), node.getTableName(), node.getName()); addType(true); return null; } catch (TableNotFoundException e) { } catch (ColumnNotFoundException e) { } catch (ColumnFamilyNotFoundException e) { } outerResolver.resolveColumn(node.getSchemaName(), node.getTableName(), node.getName()); addType(false); return null; } private void addType(boolean isLocal) { switch (this.type) { case NONE: this.type = isLocal ? ColumnResolveType.LOCAL : ColumnResolveType.OUTER; break; case LOCAL: this.type = isLocal ? ColumnResolveType.LOCAL : ColumnResolveType.MIXED; break; case OUTER: this.type = isLocal ? ColumnResolveType.MIXED : ColumnResolveType.OUTER; break; default: // MIXED do nothing break; } } } }




© 2015 - 2025 Weber Informatics LLC | Privacy Policy