// org.apache.drill.exec.planner.physical.ScanPrel (source listing; Maven / Gradle / Ivy)
/**
* Licensed to the Apache Software Foundation (ASF) under one
* or more contributor license agreements. See the NOTICE file
* distributed with this work for additional information
* regarding copyright ownership. The ASF licenses this file
* to you under the Apache License, Version 2.0 (the
* "License"); you may not use this file except in compliance
* with the License. You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
package org.apache.drill.exec.planner.physical;
import java.io.IOException;
import java.util.Collections;
import java.util.Iterator;
import java.util.List;
import org.apache.drill.common.exceptions.DrillRuntimeException;
import org.apache.drill.common.exceptions.ExecutionSetupException;
import org.apache.drill.exec.physical.base.GroupScan;
import org.apache.drill.exec.physical.base.PhysicalOperator;
import org.apache.drill.exec.physical.base.ScanStats;
import org.apache.drill.exec.planner.cost.DrillCostBase.DrillCostFactory;
import org.apache.drill.exec.planner.physical.visitor.PrelVisitor;
import org.apache.drill.exec.record.BatchSchema.SelectionVectorMode;
import org.apache.calcite.rel.AbstractRelNode;
import org.apache.calcite.rel.RelNode;
import org.apache.calcite.rel.RelWriter;
import org.apache.calcite.plan.RelOptCluster;
import org.apache.calcite.plan.RelOptCost;
import org.apache.calcite.plan.RelOptPlanner;
import org.apache.calcite.plan.RelTraitSet;
import org.apache.calcite.rel.type.RelDataType;
/**
 * Relational node from the physical planning package that wraps a {@link GroupScan}.
 *
 * <p>The node keeps its own copy of the group scan (taken in the constructor through
 * {@code getNewWithChildren} with an empty child list) together with the row type it
 * reports to the planner. It has no child nodes: {@link #iterator()} is always empty.
 */
public class ScanPrel extends AbstractRelNode implements DrillScanPrel {
  static final org.slf4j.Logger logger = org.slf4j.LoggerFactory
      .getLogger(ScanPrel.class);

  /** Private copy of the group scan handed to the constructor. */
  protected final GroupScan groupScan;

  /** Row type returned by {@link #deriveRowType()}. */
  private final RelDataType rowType;

  /**
   * Creates a scan node.
   *
   * @param cluster   cluster passed to the {@link AbstractRelNode} constructor
   * @param traits    trait set passed to the {@link AbstractRelNode} constructor
   * @param groupScan group scan to wrap; a copy is stored, not this instance
   * @param rowType   row type this node reports
   * @throws DrillRuntimeException if copying the group scan fails
   */
  public ScanPrel(RelOptCluster cluster, RelTraitSet traits,
      GroupScan groupScan, RelDataType rowType) {
    super(cluster, traits);
    this.groupScan = getCopy(groupScan);
    this.rowType = rowType;
  }

  /**
   * Returns a new {@code ScanPrel} with the given traits and the same cluster, group scan
   * and row type.
   *
   * @param traitSet traits for the new node
   * @param inputs   ignored; this node does not use inputs
   */
  @Override
  public RelNode copy(RelTraitSet traitSet, List<RelNode> inputs) {
    return new ScanPrel(getCluster(), traitSet, groupScan, rowType);
  }

  /**
   * Returns a new {@code ScanPrel} with this node's cluster, traits, group scan and row type.
   */
  @Override
  protected Object clone() throws CloneNotSupportedException {
    // The constructor already copies the group scan, so no extra copy is taken here.
    return new ScanPrel(getCluster(), getTraitSet(), groupScan, rowType);
  }

  /**
   * Copies a group scan by asking it for a new instance with an empty child list.
   *
   * @param scan group scan to copy
   * @return the new instance, cast to {@link GroupScan}
   * @throws DrillRuntimeException wrapping any {@link ExecutionSetupException} raised by the copy
   */
  private static GroupScan getCopy(GroupScan scan) {
    try {
      return (GroupScan) scan.getNewWithChildren(Collections.<PhysicalOperator>emptyList());
    } catch (ExecutionSetupException e) {
      throw new DrillRuntimeException("Unexpected failure while coping node.", e);
    }
  }

  /**
   * Hands this node and its group scan to the creator's {@code addMetadata} and returns
   * the result.
   *
   * @param creator plan creator that attaches metadata to the operator
   * @throws IOException declared by the overridden method
   */
  @Override
  public PhysicalOperator getPhysicalOperator(PhysicalPlanCreator creator)
      throws IOException {
    return creator.addMetadata(this, groupScan);
  }

  /** Returns the group scan copy held by this node. */
  @Override
  public GroupScan getGroupScan() {
    return groupScan;
  }

  /**
   * Factory that builds a {@code ScanPrel} in the same cluster as an existing node.
   *
   * @param old       node whose cluster is reused
   * @param traitSets traits for the new node
   * @param scan      group scan to wrap; the constructor stores a copy of it
   * @param rowType   row type for the new node
   */
  public static ScanPrel create(RelNode old, RelTraitSet traitSets,
      GroupScan scan, RelDataType rowType) {
    // The constructor already copies the group scan, so no extra copy is taken here.
    return new ScanPrel(old.getCluster(), traitSets, scan, rowType);
  }

  /** Adds a {@code "groupscan"} item holding the group scan's digest to the inherited terms. */
  @Override
  public RelWriter explainTerms(RelWriter pw) {
    return super.explainTerms(pw).item("groupscan", groupScan.getDigest());
  }

  /** Returns the row type supplied at construction. */
  @Override
  public RelDataType deriveRowType() {
    return rowType;
  }

  /** Returns the record count from the group scan's statistics. */
  @Override
  public double getRows() {
    final PlannerSettings settings = PrelUtil.getPlannerSettings(getCluster());
    return groupScan.getScanStats(settings).getRecordCount();
  }

  /**
   * Computes the cost of this scan from the group scan's statistics.
   *
   * <p>With default costing enabled, the cost is built by the planner's cost factory from
   * {@code recordCount * columnCount}, the reported CPU cost and the reported disk cost.
   * Otherwise the row count is the record count, the CPU cost is
   * {@code rowCount * max(columnCount, 1)} (further multiplied by the reported CPU cost
   * when that is positive), and the I/O cost is zero.
   *
   * @param planner planner supplying the settings and the cost factory
   */
  @Override
  public RelOptCost computeSelfCost(final RelOptPlanner planner) {
    final PlannerSettings settings = PrelUtil.getPlannerSettings(planner);
    final ScanStats stats = groupScan.getScanStats(settings);
    final int columnCount = getRowType().getFieldCount();

    if (PrelUtil.getSettings(getCluster()).useDefaultCosting()) {
      return planner.getCostFactory().makeCost(
          stats.getRecordCount() * columnCount, stats.getCpuCost(), stats.getDiskCost());
    }

    // The row count is taken straight from the scan statistics.
    final double rowCount = stats.getRecordCount();

    // As DRILL-4083 points out, when columnCount == 0, cpuCost becomes zero,
    // which makes the costs of HiveScan and HiveDrillNativeParquetScan the same.
    // For now, assume cpu cost is proportional to row count.
    double cpuCost = rowCount * Math.max(columnCount, 1);

    // If a positive value for CPU cost is given, multiply the default CPU cost by it.
    if (stats.getCpuCost() > 0) {
      cpuCost *= stats.getCpuCost();
    }

    // Even though scan is reading from disk, in the currently generated plans all plans will
    // need to read the same amount of data, so keeping the disk io cost 0 is ok for now.
    // In the future we might consider alternative scans that go against projections or
    // different compression schemes etc that affect the amount of data read. Such alternatives
    // would affect both cpu and io cost.
    final double ioCost = 0;
    final DrillCostFactory costFactory = (DrillCostFactory) planner.getCostFactory();
    return costFactory.makeCost(rowCount, cpuCost, ioCost, 0);
  }

  /**
   * Returns an empty iterator.
   */
  // NOTE(review): the return type is raw here; presumably the overridden method declares an
  // element type (the child Prel type) -- confirm against the interface and parameterize.
  @Override
  public Iterator iterator() {
    return Collections.emptyIterator();
  }

  /**
   * Dispatches to {@code visitScan} on the given visitor.
   *
   * @param logicalVisitor visitor to invoke
   * @param value          extra value passed through to the visitor
   * @param <T>            visitor return type
   * @param <X>            type of the extra value
   * @param <E>            exception type the visitor may throw
   * @return whatever the visitor returns
   * @throws E if the visitor throws
   */
  @Override
  public <T, X, E extends Throwable> T accept(PrelVisitor<T, X, E> logicalVisitor, X value)
      throws E {
    return logicalVisitor.visitScan(this, value);
  }

  /** Returns {@link SelectionVectorMode#DEFAULT}. */
  @Override
  public SelectionVectorMode[] getSupportedEncodings() {
    return SelectionVectorMode.DEFAULT;
  }

  /** Returns {@link SelectionVectorMode#NONE}. */
  @Override
  public SelectionVectorMode getEncoding() {
    return SelectionVectorMode.NONE;
  }

  /** Always returns {@code true}. */
  @Override
  public boolean needsFinalColumnReordering() {
    return true;
  }
}
// © 2015 - 2025 Weber Informatics LLC | Privacy Policy