org.apache.hadoop.hive.ql.optimizer.ConstantPropagateProcCtx Maven / Gradle / Ivy
/**
* Licensed to the Apache Software Foundation (ASF) under one
* or more contributor license agreements. See the NOTICE file
* distributed with this work for additional information
* regarding copyright ownership. The ASF licenses this file
* to you under the Apache License, Version 2.0 (the
* "License"); you may not use this file except in compliance
* with the License. You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
package org.apache.hadoop.hive.ql.optimizer;
import java.io.Serializable;
import java.util.ArrayList;
import java.util.HashMap;
import java.util.Iterator;
import java.util.List;
import java.util.Map;
import java.util.Map.Entry;
import org.apache.commons.logging.LogFactory;
import org.apache.hadoop.hive.ql.exec.ColumnInfo;
import org.apache.hadoop.hive.ql.exec.Operator;
import org.apache.hadoop.hive.ql.exec.RowSchema;
import org.apache.hadoop.hive.ql.exec.UnionOperator;
import org.apache.hadoop.hive.ql.lib.NodeProcessorCtx;
import org.apache.hadoop.hive.ql.plan.ExprNodeDesc;
/**
* This class implements the processor context for Constant Propagate.
*
* ConstantPropagateProcCtx keeps track of propagated constants in a column->const map for each
* operator, enabling constants to be revolved across operators.
*/
public class ConstantPropagateProcCtx implements NodeProcessorCtx {
private static final org.apache.commons.logging.Log LOG = LogFactory
.getLog(ConstantPropagateProcCtx.class);
private final Map, Map> opToConstantExprs;
private final List> opToDelete;
public ConstantPropagateProcCtx() {
opToConstantExprs =
new HashMap, Map>();
opToDelete = new ArrayList>();
}
public Map, Map> getOpToConstantExprs() {
return opToConstantExprs;
}
/**
* Resolve a ColumnInfo based on given RowResolver.
*
* @param ci
* @param rr
* @param parentRR
* @return
* @throws SemanticException
*/
private ColumnInfo resolve(ColumnInfo ci, RowSchema rs, RowSchema parentRS) {
// Resolve new ColumnInfo from
String alias = ci.getAlias();
if (alias == null) {
alias = ci.getInternalName();
}
String tblAlias = ci.getTabAlias();
ColumnInfo rci = rs.getColumnInfo(tblAlias, alias);
if (rci == null && rs.getTableNames().size() == 1 &&
parentRS.getTableNames().size() == 1) {
rci = rs.getColumnInfo(rs.getTableNames().iterator().next(),
alias);
}
if (rci == null) {
return null;
}
LOG.debug("Resolved "
+ ci.getTabAlias() + "." + ci.getAlias() + " as "
+ rci.getTabAlias() + "." + rci.getAlias() + " with rs: " + rs);
return rci;
}
/**
* Get propagated constant map from parents.
*
* Traverse all parents of current operator, if there is propagated constant (determined by
* assignment expression like column=constant value), resolve the column using RowResolver and add
* it to current constant map.
*
* @param op
* operator getting the propagated constants.
* @return map of ColumnInfo to ExprNodeDesc. The values of that map must be either
* ExprNodeConstantDesc or ExprNodeNullDesc.
*/
public Map getPropagatedConstants(
Operator extends Serializable> op) {
Map constants = new HashMap();
if (op.getSchema() == null) {
return constants;
}
RowSchema rs = op.getSchema();
LOG.debug("Getting constants of op:" + op + " with rs:" + rs);
if (op.getParentOperators() == null) {
return constants;
}
if (op instanceof UnionOperator) {
String alias = rs.getSignature().get(0).getTabAlias();
// find intersection
Map intersection = null;
for (Operator> parent : op.getParentOperators()) {
Map unionConst = opToConstantExprs.get(parent);
LOG.debug("Constant of op " + parent.getOperatorId() + " " + unionConst);
if (intersection == null) {
intersection = new HashMap();
for (Entry e : unionConst.entrySet()) {
ColumnInfo ci = new ColumnInfo(e.getKey());
ci.setTabAlias(alias);
intersection.put(ci, e.getValue());
}
} else {
Iterator> itr = intersection.entrySet().iterator();
while (itr.hasNext()) {
Entry e = itr.next();
boolean found = false;
for (Entry f : opToConstantExprs.get(parent).entrySet()) {
if (e.getKey().getInternalName().equals(f.getKey().getInternalName())) {
if (e.getValue().isSame(f.getValue())) {
found = true;
}
break;
}
}
if (!found) {
itr.remove();
}
}
}
if (intersection.isEmpty()) {
return intersection;
}
}
LOG.debug("Propagated union constants:" + intersection);
return intersection;
}
for (Operator extends Serializable> parent : op.getParentOperators()) {
Map c = opToConstantExprs.get(parent);
for (Entry e : c.entrySet()) {
ColumnInfo ci = e.getKey();
ColumnInfo rci = null;
ExprNodeDesc constant = e.getValue();
rci = resolve(ci, rs, parent.getSchema());
if (rci != null) {
constants.put(rci, constant);
} else {
LOG.debug("Can't resolve " + ci.getTabAlias() + "." + ci.getAlias() +
"(" + ci.getInternalName() + ") from rs:" + rs);
}
}
}
LOG.debug("Offerring constants " + constants.keySet()
+ " to operator " + op.toString());
return constants;
}
public void addOpToDelete(Operator extends Serializable> op) {
opToDelete.add(op);
}
public List> getOpToDelete() {
return opToDelete;
}
}