// All downloads are free. Search and download functionality uses the official Maven repository.
//
// org.apache.pig.newplan.PlanDumper Maven / Gradle / Ivy
//
// The newest version!
/*
 * Licensed to the Apache Software Foundation (ASF) under one
 * or more contributor license agreements.  See the NOTICE file
 * distributed with this work for additional information
 * regarding copyright ownership.  The ASF licenses this file
 * to you under the Apache License, Version 2.0 (the
 * "License"); you may not use this file except in compliance
 * with the License.  You may obtain a copy of the License at
 *
 *     http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */
package org.apache.pig.newplan;

import java.io.PrintStream;
import java.util.Iterator;
import java.util.LinkedList;
import java.util.Collection;
import org.apache.pig.impl.util.MultiMap;

/**
 * Dumps a (possibly nested) plan to a print stream.
 *
 * <p>The dumper does not walk the graph in any particular order; it merely
 * iterates over all operators and then over all edges, calling the
 * corresponding {@code dump*} hook for each. If an operator has nested
 * plans, they are dumped at the point where that operator is handled.
 *
 * <p>Subclasses customise the output by overriding the {@code dump*} hooks,
 * the {@code get*NestedPlans} hooks and {@link #makeDumper}.
 */
public class PlanDumper {

    /** Stream that all output is written to. */
    protected PrintStream ps;
    /** The plan being dumped. */
    protected BaseOperatorPlan plan;
    /** When {@code false}, multi-input and plain nested plans are not expanded. */
    protected boolean isVerbose = true;

    /**
     * Creates a dumper for the given plan.
     * @param plan plan to dump
     * @param ps stream to write the dump to
     */
    public PlanDumper(BaseOperatorPlan plan, PrintStream ps) {
        this.plan = plan;
        this.ps = ps;
    }

    /**
     * Switches verbose output on or off.
     * @param verbose new value of the verbose flag
     */
    public void setVerbose(boolean verbose) {
        this.isVerbose = verbose;
    }

    /**
     * @return the current value of the verbose flag
     */
    public boolean isVerbose() {
        return isVerbose;
    }

    /**
     * This is the public interface. Dump writes the plan and nested
     * plans to the stream: first every operator, then every edge.
     */
    public void dump() {
        // Pass 1: operators. The first matching category wins.
        Iterator<Operator> iter = plan.getOperators();
        while (iter.hasNext()) {
            Operator op = iter.next();

            MultiMap<Operator, BaseOperatorPlan> inputPlans = getMultiInputNestedPlans(op);
            if (isVerbose && inputPlans != null && !inputPlans.isEmpty()) {
                dumpMultiInputNestedOperator(op, inputPlans);
                continue;
            }

            // Multi-output nested plans are dumped regardless of the verbose flag.
            Collection<BaseOperatorPlan> outputPlans = getMultiOutputNestedPlans(op);
            if (outputPlans != null && !outputPlans.isEmpty()) {
                dumpMultiOutputNestedOperator(op, outputPlans);
                continue;
            }

            Collection<BaseOperatorPlan> nestedPlans = getNestedPlans(op);
            if (isVerbose && nestedPlans != null && !nestedPlans.isEmpty()) {
                dumpNestedOperator(op, nestedPlans);
                continue;
            }

            dumpOperator(op);
        }

        // Pass 2: edges, one dumpEdge call per (operator, successor) pair.
        iter = plan.getOperators();
        while (iter.hasNext()) {
            Operator op = iter.next();
            Collection<Operator> successors = plan.getSuccessors(op);
            if (successors != null) {
                for (Operator suc : successors) {
                    dumpEdge(op, suc);
                }
            }
        }
    }

    /**
     * makeDumper is a factory method. Used by subclasses to specify
     * what dumper should handle the nested plan.
     * @param plan Plan that the new dumper should handle
     * @param ps stream the new dumper should write to
     * @return the dumper for plan
     */
    protected PlanDumper makeDumper(BaseOperatorPlan plan, PrintStream ps) {
        return new PlanDumper(plan, ps);
    }

    /**
     * Will be called to dump a simple operator. Prints the operator's
     * name on its own line, with spaces replaced by underscores.
     * @param op the operator to be dumped
     */
    protected void dumpOperator(Operator op) {
        ps.println(op.getName().replace(" ", "_"));
    }

    /**
     * Will be called when an operator has nested plans, which are
     * connected to one of the multiple inputs. Dumps the operator
     * itself and then every nested plan.
     * @param op the nested operator
     * @param plans a map of input operator to connected nested plan
     */
    protected void dumpMultiInputNestedOperator(Operator op,
            MultiMap<Operator, BaseOperatorPlan> plans) {
        dumpOperator(op);
        for (Operator input : plans.keySet()) {
            for (BaseOperatorPlan nested : plans.get(input)) {
                makeDumper(nested, ps).dump();
            }
        }
    }

    /**
     * Will be called for nested operators, where the plans represent
     * how the output of the operator is processed. After each nested
     * plan is dumped, an edge from the operator to every source of
     * that plan is dumped as well.
     * @param op the nested operator
     * @param plans a collection of sub plans.
     */
    protected void dumpMultiOutputNestedOperator(Operator op,
            Collection<BaseOperatorPlan> plans) {
        dumpOperator(op);
        for (BaseOperatorPlan nested : plans) {
            makeDumper(nested, ps).dump();
            for (Operator source : nested.getSources()) {
                dumpEdge(op, source);
            }
        }
    }

    /**
     * Will be called for nested operators. The nested plans are not
     * specifically connected to any input or output operators.
     * @param op the nested operator
     * @param plans a collection of sub plans.
     */
    protected void dumpNestedOperator(Operator op, Collection<BaseOperatorPlan> plans) {
        dumpOperator(op);
        for (BaseOperatorPlan nested : plans) {
            makeDumper(nested, ps).dump();
        }
    }

    /**
     * Will be called to dump the edges of the plan. Each edge results
     * in one call. Unlike {@link #dumpOperator}, the operator names are
     * printed verbatim (spaces are not replaced).
     * @param op tail of the edge
     * @param suc head of the edge
     */
    protected void dumpEdge(Operator op, Operator suc) {
        ps.println(op.getName() + " -> " + suc.getName());
    }

    /**
     * Used to determine if an operator has nested plans, which are
     * connected to specific input operators. This base implementation
     * reports none.
     * @param op operator
     * @return Map describing the input to nested plan relationship.
     */
    protected MultiMap<Operator, BaseOperatorPlan> getMultiInputNestedPlans(Operator op) {
        return new MultiMap<Operator, BaseOperatorPlan>();
    }

    /**
     * Used to determine if an operator has nested output plans.
     * This base implementation reports none.
     * @param op operator
     * @return Collection of nested output plans.
     */
    protected Collection<BaseOperatorPlan> getMultiOutputNestedPlans(Operator op) {
        return new LinkedList<BaseOperatorPlan>();
    }

    /**
     * Used to determine if an operator has nested plans (without
     * connections to in- or output operators). This base
     * implementation reports none.
     * @param op operator
     * @return Collection of nested plans.
     */
    protected Collection<BaseOperatorPlan> getNestedPlans(Operator op) {
        return new LinkedList<BaseOperatorPlan>();
    }

    /**
     * Helper function to print a string array to the stream, with the
     * separator between consecutive elements. Prints nothing when the
     * array is {@code null}.
     * @param sep Separator
     * @param strings Array to print
     */
    protected void join(String sep, String[] strings) {
        if (strings == null) {
            return;
        }

        for (int i = 0; i < strings.length; ++i) {
            if (i != 0) {
                ps.print(sep);
            }
            ps.print(strings[i]);
        }
    }
}




// © 2015 - 2024 Weber Informatics LLC | Privacy Policy