Many resources are needed to download a project. Please understand that we have to compensate our server costs. Thank you in advance. Project price only 1 $
You can buy this project and download/modify it how often you want.
/*
* Licensed under the Apache License, Version 2.0 (the "License");
* you may not use this file except in compliance with the License.
* You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
package io.trino.sql.planner.iterative.rule;
import com.google.common.collect.ImmutableList;
import com.google.common.collect.ImmutableMap;
import com.google.common.collect.ImmutableSet;
import io.trino.matching.Capture;
import io.trino.matching.Captures;
import io.trino.matching.Pattern;
import io.trino.sql.ir.Expression;
import io.trino.sql.ir.Reference;
import io.trino.sql.planner.PartitioningScheme;
import io.trino.sql.planner.Symbol;
import io.trino.sql.planner.iterative.Rule;
import io.trino.sql.planner.plan.Assignments;
import io.trino.sql.planner.plan.ExchangeNode;
import io.trino.sql.planner.plan.PlanNode;
import io.trino.sql.planner.plan.ProjectNode;
import java.util.List;
import java.util.Map;
import java.util.Set;
import java.util.stream.Collectors;
import static io.trino.matching.Capture.newCapture;
import static io.trino.sql.planner.ExpressionSymbolInliner.inlineSymbols;
import static io.trino.sql.planner.iterative.rule.Util.restrictOutputs;
import static io.trino.sql.planner.plan.Patterns.exchange;
import static io.trino.sql.planner.plan.Patterns.project;
import static io.trino.sql.planner.plan.Patterns.source;
/**
* Transforms:
*
* Project(x = e1, y = e2)
* Exchange()
* Source(a, b, c)
*
* to:
*
* Exchange()
* Project(x = e1, y = e2)
* Source(a, b, c)
*
* Or if Exchange needs symbols from Source for partitioning, ordering or as hash symbol to:
*
* Project(x, y)
* Exchange()
* Project(x = e1, y = e2, a)
* Source(a, b, c)
*
* To avoid looping this optimizer will not be fired if upper Project contains just symbol references.
*/
public class PushProjectionThroughExchange
implements Rule
{
private static final Capture CHILD = newCapture();
private static final Pattern PATTERN = project()
.matching(project -> !isSymbolToSymbolProjection(project))
.with(source().matching(exchange().capturedAs(CHILD)));
@Override
public Pattern getPattern()
{
return PATTERN;
}
@Override
public Result apply(ProjectNode project, Captures captures, Context context)
{
ExchangeNode exchange = captures.get(CHILD);
Set partitioningColumns = exchange.getPartitioningScheme().getPartitioning().getColumns();
ImmutableList.Builder newSourceBuilder = ImmutableList.builder();
ImmutableList.Builder> inputsBuilder = ImmutableList.builder();
for (int i = 0; i < exchange.getSources().size(); i++) {
Map outputToInputMap = mapExchangeOutputToInput(exchange, i);
Assignments.Builder projections = Assignments.builder();
ImmutableList.Builder inputs = ImmutableList.builder();
// Need to retain the partition keys for the exchange
partitioningColumns.stream()
.map(outputToInputMap::get)
.forEach(inputSymbol -> {
projections.putIdentity(inputSymbol);
inputs.add(inputSymbol);
});
// Need to retain the hash symbol for the exchange
exchange.getPartitioningScheme().getHashColumn()
.map(outputToInputMap::get)
.ifPresent(inputSymbol -> {
projections.putIdentity(inputSymbol);
inputs.add(inputSymbol);
});
if (exchange.getOrderingScheme().isPresent()) {
// Need to retain ordering columns for the exchange
exchange.getOrderingScheme().get().orderBy().stream()
// Do not duplicate symbols in inputs list
.filter(symbol -> !partitioningColumns.contains(symbol))
.map(outputToInputMap::get)
.forEach(inputSymbol -> {
projections.putIdentity(inputSymbol);
inputs.add(inputSymbol);
});
}
ImmutableSet.Builder outputBuilder = ImmutableSet.builder();
partitioningColumns.forEach(outputBuilder::add);
exchange.getPartitioningScheme().getHashColumn().ifPresent(outputBuilder::add);
exchange.getOrderingScheme().ifPresent(orderingScheme -> outputBuilder.addAll(orderingScheme.orderBy()));
Set partitioningHashAndOrderingOutputs = outputBuilder.build();
Map translationMap = outputToInputMap.entrySet().stream()
.collect(Collectors.toMap(Map.Entry::getKey, entry -> entry.getValue().toSymbolReference()));
for (Map.Entry projection : project.getAssignments().entrySet()) {
// Skip identity projection if symbol is in outputs already
if (partitioningHashAndOrderingOutputs.contains(projection.getKey())) {
continue;
}
Expression translatedExpression = inlineSymbols(translationMap, projection.getValue());
Symbol symbol = context.getSymbolAllocator().newSymbol(translatedExpression);
projections.put(symbol, translatedExpression);
inputs.add(symbol);
}
newSourceBuilder.add(new ProjectNode(context.getIdAllocator().getNextId(), exchange.getSources().get(i), projections.build()));
inputsBuilder.add(inputs.build());
}
// Construct the output symbols in the same order as the sources
ImmutableList.Builder outputBuilder = ImmutableList.builder();
partitioningColumns.forEach(outputBuilder::add);
exchange.getPartitioningScheme().getHashColumn().ifPresent(outputBuilder::add);
if (exchange.getOrderingScheme().isPresent()) {
exchange.getOrderingScheme().get().orderBy().stream()
// Do not duplicate symbols in outputs list (for consistency with inputs lists)
.filter(symbol -> !partitioningColumns.contains(symbol))
.forEach(outputBuilder::add);
}
Set partitioningHashAndOrderingOutputs = ImmutableSet.copyOf(outputBuilder.build());
for (Map.Entry projection : project.getAssignments().entrySet()) {
// Do not add output for identity projection if symbol is in outputs already
if (partitioningHashAndOrderingOutputs.contains(projection.getKey())) {
continue;
}
outputBuilder.add(projection.getKey());
}
// outputBuilder contains all partition and hash symbols so simply swap the output layout
PartitioningScheme partitioningScheme = new PartitioningScheme(
exchange.getPartitioningScheme().getPartitioning(),
outputBuilder.build(),
exchange.getPartitioningScheme().getHashColumn(),
exchange.getPartitioningScheme().isReplicateNullsAndAny(),
exchange.getPartitioningScheme().getBucketToPartition(),
exchange.getPartitioningScheme().getPartitionCount());
PlanNode result = new ExchangeNode(
exchange.getId(),
exchange.getType(),
exchange.getScope(),
partitioningScheme,
newSourceBuilder.build(),
inputsBuilder.build(),
exchange.getOrderingScheme());
// we need to strip unnecessary symbols (hash, partitioning columns).
return Result.ofPlanNode(restrictOutputs(context.getIdAllocator(), result, ImmutableSet.copyOf(project.getOutputSymbols())).orElse(result));
}
private static boolean isSymbolToSymbolProjection(ProjectNode project)
{
return project.getAssignments().getExpressions().stream().allMatch(Reference.class::isInstance);
}
private static Map mapExchangeOutputToInput(ExchangeNode exchange, int sourceIndex)
{
ImmutableMap.Builder outputToInputMap = ImmutableMap.builder();
for (int i = 0; i < exchange.getOutputSymbols().size(); i++) {
outputToInputMap.put(exchange.getOutputSymbols().get(i), exchange.getInputs().get(sourceIndex).get(i));
}
return outputToInputMap.buildOrThrow();
}
}