org.apache.pig.newplan.PlanDumper Maven / Gradle / Ivy
/*
* Licensed to the Apache Software Foundation (ASF) under one
* or more contributor license agreements. See the NOTICE file
* distributed with this work for additional information
* regarding copyright ownership. The ASF licenses this file
* to you under the Apache License, Version 2.0 (the
* "License"); you may not use this file except in compliance
* with the License. You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
package org.apache.pig.newplan;
import java.io.PrintStream;
import java.util.Iterator;
import java.util.LinkedList;
import java.util.Collection;
import org.apache.pig.impl.util.MultiMap;
/**
* This class dumps a nested plan to a print stream. It does not walk
* the graph in any particular fashion; it merely iterates over all
* operators and edges and calls the corresponding dump function. If a
* node of the plan has nested plans, these will be dumped when the
* node is handled.
*/
public class PlanDumper {

    /** Stream that all dump output is written to. */
    protected PrintStream ps;

    /** Plan whose operators and edges are dumped. */
    protected BaseOperatorPlan plan;

    /**
     * Controls whether multi-input nested plans and plain nested plans are
     * expanded by {@link #dump()}. Defaults to {@code true}.
     */
    protected boolean isVerbose = true;

    /**
     * Creates a dumper for the given plan.
     * @param plan the plan to dump
     * @param ps the stream the dump is written to
     */
    public PlanDumper(BaseOperatorPlan plan, PrintStream ps) {
        this.plan = plan;
        this.ps = ps;
    }

    /**
     * Sets the verbosity of this dumper.
     * @param verbose new value of the verbose flag
     */
    public void setVerbose(boolean verbose) {
        this.isVerbose = verbose;
    }

    /**
     * @return the current value of the verbose flag
     */
    public boolean isVerbose() {
        return isVerbose;
    }

    /**
     * This is the public interface. Dump writes the plan and nested
     * plans to the stream.
     * <p>
     * All operators are dumped first, then all edges. For each operator
     * the first matching case wins: multi-input nested plans (verbose
     * only), multi-output nested plans (regardless of verbosity), plain
     * nested plans (verbose only), and finally a simple operator.
     */
    public void dump() {
        // First pass: one dump call per operator.
        Iterator<Operator> iter = plan.getOperators();
        while (iter.hasNext()) {
            Operator op = iter.next();

            MultiMap<Operator, BaseOperatorPlan> map = getMultiInputNestedPlans(op);
            if (isVerbose && !map.isEmpty()) {
                dumpMultiInputNestedOperator(op, map);
                continue;
            }

            // Not guarded by isVerbose: multi-output plans are always expanded.
            Collection<BaseOperatorPlan> plans = getMultiOutputNestedPlans(op);
            if (!plans.isEmpty()) {
                dumpMultiOutputNestedOperator(op, plans);
                continue;
            }

            plans = getNestedPlans(op);
            if (isVerbose && !plans.isEmpty()) {
                dumpNestedOperator(op, plans);
                continue;
            }

            dumpOperator(op);
        }

        // Second pass: one dumpEdge call per (operator, successor) pair.
        iter = plan.getOperators();
        while (iter.hasNext()) {
            Operator op = iter.next();
            Collection<Operator> successors = plan.getSuccessors(op);
            // getSuccessors may yield null; such operators have no edges to dump.
            if (successors != null) {
                for (Operator suc : successors) {
                    dumpEdge(op, suc);
                }
            }
        }
    }

    /**
     * makeDumper is a factory method. Used by subclasses to specify
     * what dumper should handle the nested plan.
     * @param plan Plan that the new dumper should handle
     * @param ps Stream the new dumper should write to
     * @return the dumper for plan
     */
    protected PlanDumper makeDumper(BaseOperatorPlan plan, PrintStream ps) {
        return new PlanDumper(plan, ps);
    }

    /**
     * Will be called to dump a simple operator. Prints the operator's
     * name on its own line, with spaces replaced by underscores.
     * @param op the operator to be dumped
     */
    protected void dumpOperator(Operator op) {
        ps.println(op.getName().replace(" ","_"));
    }

    /**
     * Will be called when an operator has nested plans, which are
     * connected to one of the multiple inputs. Dumps the operator
     * itself, then every nested plan of every input.
     * @param op the nested operator
     * @param plans a map of input operator to connected nested plan
     */
    protected void dumpMultiInputNestedOperator(Operator op, MultiMap<Operator, BaseOperatorPlan> plans) {
        dumpOperator(op);
        for (Operator input : plans.keySet()) {
            for (BaseOperatorPlan nested : plans.get(input)) {
                PlanDumper dumper = makeDumper(nested, ps);
                dumper.dump();
            }
        }
    }

    /**
     * Will be called for nested operators, where the plans represent
     * how the output of the operator is processed. After each nested
     * plan is dumped, an edge from the operator to each source of that
     * plan is dumped.
     * @param op the nested operator
     * @param plans a collection of sub plans.
     */
    protected void dumpMultiOutputNestedOperator(Operator op, Collection<BaseOperatorPlan> plans) {
        dumpOperator(op);
        for (BaseOperatorPlan nested : plans) {
            PlanDumper dumper = makeDumper(nested, ps);
            dumper.dump();
            for (Operator source : nested.getSources()) {
                dumpEdge(op, source);
            }
        }
    }

    /**
     * Will be called for nested operators. The nested plans are not
     * specifically connected to any input or output operators.
     * @param op the nested operator
     * @param plans a collection of sub plans.
     */
    protected void dumpNestedOperator(Operator op, Collection<BaseOperatorPlan> plans) {
        dumpOperator(op);
        for (BaseOperatorPlan nested : plans) {
            PlanDumper dumper = makeDumper(nested, ps);
            dumper.dump();
        }
    }

    /**
     * Will be called to dump the edges of the plan. Each edge results
     * in one call. Note that, unlike {@link #dumpOperator(Operator)},
     * the operator names are printed unmodified here.
     * @param op tail of the edge
     * @param suc head of the edge
     */
    protected void dumpEdge(Operator op, Operator suc) {
        ps.println(op.getName()+" -> "+suc.getName());
    }

    /**
     * Used to determine if an operator has nested plans, which are
     * connected to specific input operators. This base implementation
     * reports none.
     * @param op operator
     * @return Map describing the input to nested plan relationship.
     */
    protected MultiMap<Operator, BaseOperatorPlan> getMultiInputNestedPlans(Operator op) {
        return new MultiMap<Operator, BaseOperatorPlan>();
    }

    /**
     * Used to determine if an operator has nested output plans.
     * This base implementation reports none.
     *
     * @param op operator
     * @return Collection of nested output plans.
     */
    protected Collection<BaseOperatorPlan> getMultiOutputNestedPlans(Operator op) {
        return new LinkedList<BaseOperatorPlan>();
    }

    /**
     * Used to determine if an operator has nested plans (without
     * connections to in- or output operators). This base
     * implementation reports none.
     * @param op operator
     * @return Collection of nested plans.
     */
    protected Collection<BaseOperatorPlan> getNestedPlans(Operator op) {
        return new LinkedList<BaseOperatorPlan>();
    }

    /**
     * Helper function to print a string array to the stream, with the
     * separator between consecutive elements. Prints nothing when the
     * array is null.
     * @param sep Separator
     * @param strings Array to print
     */
    protected void join(String sep, String[] strings) {
        if (strings == null) {
            return;
        }

        for (int i = 0; i < strings.length; ++i) {
            if (i != 0) {
                ps.print(sep);
            }
            ps.print(strings[i]);
        }
    }
}