org.apache.druid.sql.calcite.rel.Windowing Maven / Gradle / Ivy

Go to download
/*
 * Licensed to the Apache Software Foundation (ASF) under one
 * or more contributor license agreements.  See the NOTICE file
 * distributed with this work for additional information
 * regarding copyright ownership.  The ASF licenses this file
 * to you under the Apache License, Version 2.0 (the
 * "License"); you may not use this file except in compliance
 * with the License.  You may obtain a copy of the License at
 *
 *   http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing,
 * software distributed under the License is distributed on an
 * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
 * KIND, either express or implied.  See the License for the
 * specific language governing permissions and limitations
 * under the License.
 */

package org.apache.druid.sql.calcite.rel;

import com.google.common.annotations.VisibleForTesting;
import com.google.common.base.Preconditions;
import com.google.common.collect.ImmutableMap;
import com.google.common.collect.Iterables;
import org.apache.calcite.rel.RelCollation;
import org.apache.calcite.rel.RelCollationTraitDef;
import org.apache.calcite.rel.RelFieldCollation;
import org.apache.calcite.rel.core.AggregateCall;
import org.apache.calcite.rel.core.Project;
import org.apache.calcite.rel.core.Window;
import org.apache.calcite.rex.RexBuilder;
import org.apache.calcite.rex.RexInputRef;
import org.apache.calcite.rex.RexLiteral;
import org.apache.calcite.rex.RexNode;
import org.apache.calcite.rex.RexWindowBound;
import org.apache.calcite.util.mapping.Mappings;
import org.apache.druid.java.util.common.ISE;
import org.apache.druid.java.util.common.StringUtils;
import org.apache.druid.query.QueryException;
import org.apache.druid.query.aggregation.AggregatorFactory;
import org.apache.druid.query.operator.ColumnWithDirection;
import org.apache.druid.query.operator.NaivePartitioningOperatorFactory;
import org.apache.druid.query.operator.NaiveSortOperatorFactory;
import org.apache.druid.query.operator.OperatorFactory;
import org.apache.druid.query.operator.window.ComposingProcessor;
import org.apache.druid.query.operator.window.Processor;
import org.apache.druid.query.operator.window.WindowFrame;
import org.apache.druid.query.operator.window.WindowFramedAggregateProcessor;
import org.apache.druid.query.operator.window.WindowOperatorFactory;
import org.apache.druid.query.operator.window.ranking.WindowCumeDistProcessor;
import org.apache.druid.query.operator.window.ranking.WindowDenseRankProcessor;
import org.apache.druid.query.operator.window.ranking.WindowPercentileProcessor;
import org.apache.druid.query.operator.window.ranking.WindowRankProcessor;
import org.apache.druid.query.operator.window.ranking.WindowRowNumberProcessor;
import org.apache.druid.query.operator.window.value.WindowFirstProcessor;
import org.apache.druid.query.operator.window.value.WindowLastProcessor;
import org.apache.druid.query.operator.window.value.WindowOffsetProcessor;
import org.apache.druid.segment.column.RowSignature;
import org.apache.druid.sql.calcite.aggregation.Aggregation;
import org.apache.druid.sql.calcite.expression.DruidExpression;
import org.apache.druid.sql.calcite.expression.Expressions;
import org.apache.druid.sql.calcite.planner.Calcites;
import org.apache.druid.sql.calcite.planner.PlannerContext;
import org.apache.druid.sql.calcite.rule.GroupByRules;
import org.apache.druid.sql.calcite.table.RowSignatures;

import javax.annotation.Nonnull;
import java.util.ArrayList;
import java.util.Collections;
import java.util.Iterator;
import java.util.LinkedHashSet;
import java.util.List;

/**
 * Maps onto a {@link org.apache.druid.query.operator.WindowOperatorQuery}.
 *
 * Known sharp edges and limitations:
 * 1. The support is not yet fully aware of the difference between RANGE and ROWS when evaluating peers. (Note: the
 * built-in functions are all implemented with the correctly defined semantics, so ranking functions that are
 * defined to use RANGE do the right thing.)
 * 2. No support for framing the last/first functions
 * 3. No nth-value function
 * 4. No finalization, meaning that aggregators like sketches that rely on finalization might return surprising results
 * 5. No comprehensive test suite yet
 */
public class Windowing
{
  /**
   * Window functions that get a dedicated {@link Processor}, keyed by the function name that is looked up via
   * {@code AggregateCall.getAggregation().getName()}. Each value builds the processor for one
   * {@link WindowAggregate}.
   *
   * The explicit type arguments on {@code builder()} are required: without them the lambdas below have no
   * functional-interface target type.
   */
  @VisibleForTesting
  public static final ImmutableMap<String, ProcessorMaker> KNOWN_WINDOW_FNS = ImmutableMap
      .<String, ProcessorMaker>builder()
      // LAG and LEAD share a processor; LAG passes the negated offset. The offset argument (position 1) is
      // optional and defaults to 1.
      .put("LAG", (agg) ->
          new WindowOffsetProcessor(agg.getColumn(0), agg.getOutputName(), -agg.getConstantInt(1, 1)))
      .put("LEAD", (agg) ->
          new WindowOffsetProcessor(agg.getColumn(0), agg.getOutputName(), agg.getConstantInt(1, 1)))
      .put("FIRST_VALUE", (agg) ->
          new WindowFirstProcessor(agg.getColumn(0), agg.getOutputName()))
      .put("LAST_VALUE", (agg) ->
          new WindowLastProcessor(agg.getColumn(0), agg.getOutputName()))
      // The ranking-style functions below are driven by the ordering columns of the owning window group.
      .put("CUME_DIST", (agg) ->
          new WindowCumeDistProcessor(agg.getGroup().getOrderingColumNames(), agg.getOutputName()))
      .put("DENSE_RANK", (agg) ->
          new WindowDenseRankProcessor(agg.getGroup().getOrderingColumNames(), agg.getOutputName()))
      // NTILE's constant argument at position 0 is mandatory (no default is supplied).
      .put("NTILE", (agg) ->
          new WindowPercentileProcessor(agg.getOutputName(), agg.getConstantInt(0)))
      // PERCENT_RANK and RANK share a processor and differ only in the trailing boolean flag.
      .put("PERCENT_RANK", (agg) ->
          new WindowRankProcessor(agg.getGroup().getOrderingColumNames(), agg.getOutputName(), true))
      .put("RANK", (agg) ->
          new WindowRankProcessor(agg.getGroup().getOrderingColumNames(), agg.getOutputName(), false))
      .put("ROW_NUMBER", (agg) ->
          new WindowRowNumberProcessor(agg.getOutputName()))
      .build();

  /**
   * Operator factories that make up this windowing stage, in the order they were added.
   */
  private final List<OperatorFactory> ops;

  /**
   * Builds a {@link Windowing} from the window stage (and optional window-project stage) of a partial query.
   *
   * For every window group this adds, in order: a sort and/or partitioning operator when the rows are not already
   * arranged the way the group needs, followed by one window operator that evaluates all of the group's functions.
   * Functions found in {@link #KNOWN_WINDOW_FNS} get their dedicated processor; anything else is translated as a
   * regular, non-finalizing aggregation that is evaluated over the group's window frame.
   *
   * @param partialQuery          query being planned; its window must be non-null
   * @param plannerContext        planner context; also receives a planning error for unsupported aggregations
   * @param sourceRowSignature    signature of the rows fed into the window operation
   * @param rexBuilder            builder passed on to the expression and aggregation translation
   * @param virtualColumnRegistry registry passed on to the aggregation translation
   *
   * @return the operators to run, together with the signature of the rows they produce
   *
   * @throws CannotBuildQueryException if an aggregation cannot be translated into exactly one aggregator factory
   *                                   without a post-aggregator
   * @throws ISE                       if a window group ends up with no processors at all
   */
  @Nonnull
  public static Windowing fromCalciteStuff(
      final PartialDruidQuery partialQuery,
      final PlannerContext plannerContext,
      final RowSignature sourceRowSignature,
      final RexBuilder rexBuilder,
      final VirtualColumnRegistry virtualColumnRegistry
  )
  {
    final Window window = Preconditions.checkNotNull(partialQuery.getWindow(), "window");

    final List<OperatorFactory> ops = new ArrayList<>();

    // Output columns are the input columns followed by one generated column per window function. The generated
    // names use a prefix chosen so that they do not collide with the input column names.
    final List<String> windowOutputColumns = new ArrayList<>(sourceRowSignature.getColumnNames());
    final String outputNamePrefix = Calcites.findUnusedPrefixForDigits("w", sourceRowSignature.getColumnNames());
    int outputNameCounter = 0;

    // Track prior partition columns and sort columns group-to-group, so we only insert sorts and repartitions if
    // we really need to.
    List<String> priorPartitionColumns = null;
    LinkedHashSet<ColumnWithDirection> priorSortColumns = new LinkedHashSet<>();

    final RelCollation priorCollation = partialQuery.getScan().getTraitSet().getTrait(RelCollationTraitDef.INSTANCE);
    if (priorCollation != null) {
      // Populate initial priorSortColumns using collation of the input to the window operation. Allows us to skip
      // the initial sort operator if the rows were already in the desired order.
      priorSortColumns = computeSortColumnsFromRelCollation(priorCollation, sourceRowSignature);
    }

    for (Window.Group calciteGroup : window.groups) {
      final WindowGroup group = new WindowGroup(window, calciteGroup, sourceRowSignature);
      final List<String> partitionColumns = group.getPartitionColumns();

      // Required sort order: partition columns (ascending) first, then the group's own ordering.
      final LinkedHashSet<ColumnWithDirection> sortColumns = new LinkedHashSet<>();
      for (String partitionColumn : partitionColumns) {
        sortColumns.add(ColumnWithDirection.ascending(partitionColumn));
      }
      sortColumns.addAll(group.getOrdering());

      // Add sorting and partitioning if needed.
      if (!sortMatches(priorSortColumns, sortColumns)) {
        // Sort order needs to change. Resort and repartition.
        ops.add(new NaiveSortOperatorFactory(new ArrayList<>(sortColumns)));
        ops.add(new NaivePartitioningOperatorFactory(partitionColumns));
        priorSortColumns = sortColumns;
        priorPartitionColumns = partitionColumns;
      } else if (!partitionColumns.equals(priorPartitionColumns)) {
        // Sort order doesn't need to change, but partitioning does. Only repartition.
        ops.add(new NaivePartitioningOperatorFactory(partitionColumns));
        priorPartitionColumns = partitionColumns;
      }

      // Add aggregations.
      final List<AggregateCall> aggregateCalls = group.getAggregateCalls();

      final List<Processor> processors = new ArrayList<>();
      final List<AggregatorFactory> aggregations = new ArrayList<>();

      for (AggregateCall aggregateCall : aggregateCalls) {
        final String aggName = outputNamePrefix + outputNameCounter++;
        windowOutputColumns.add(aggName);

        final ProcessorMaker maker = KNOWN_WINDOW_FNS.get(aggregateCall.getAggregation().getName());
        if (maker == null) {
          // Not a dedicated window function: translate it the same way a grouping aggregation would be.
          final Aggregation aggregation = GroupByRules.translateAggregateCall(
              plannerContext,
              sourceRowSignature,
              virtualColumnRegistry,
              rexBuilder,
              InputAccessor.buildFor(
                  window,
                  partialQuery.getSelectProject(),
                  sourceRowSignature),
              Collections.emptyList(),
              aggName,
              aggregateCall,
              false // Windowed aggregations don't currently finalize.  This means that sketches won't work as expected.
          );

          // Only aggregations that boil down to a single aggregator factory, with no post-aggregator, are usable.
          if (aggregation == null
              || aggregation.getPostAggregator() != null
              || aggregation.getAggregatorFactories().size() != 1) {
            // Do not overwrite a planning error that was recorded earlier.
            if (null == plannerContext.getPlanningError()) {
              plannerContext.setPlanningError("Aggregation [%s] is not supported", aggregateCall);
            }
            throw new CannotBuildQueryException(window, aggregateCall);
          }

          aggregations.add(Iterables.getOnlyElement(aggregation.getAggregatorFactories()));
        } else {
          processors.add(
              maker.make(
                  new WindowAggregate(
                      aggName,
                      aggregateCall,
                      sourceRowSignature,
                      plannerContext,
                      rexBuilder,
                      partialQuery.getSelectProject(),
                      window.constants,
                      group
                  )
              )
          );
        }
      }

      // All plain aggregations of the group share one framed processor, added after the dedicated processors.
      if (!aggregations.isEmpty()) {
        processors.add(
            new WindowFramedAggregateProcessor(
                group.getWindowFrame(),
                aggregations.toArray(new AggregatorFactory[0])
            )
        );
      }

      if (processors.isEmpty()) {
        throw new ISE("No processors from Window[%s], why was this code called?", window);
      }

      ops.add(new WindowOperatorFactory(
          processors.size() == 1 ?
          processors.get(0) : new ComposingProcessor(processors.toArray(new Processor[0]))
      ));
    }

    // Apply windowProject, if present.
    if (partialQuery.getWindowProject() != null) {
      // We know windowProject is a mapping due to the isMapping() check in DruidRules.
      // check anyway as defensive programming.
      Preconditions.checkArgument(partialQuery.getWindowProject().isMapping());
      final Mappings.TargetMapping mapping = Preconditions.checkNotNull(
          Project.getPartialMapping(
              partialQuery.getWindowProject().getInput().getRowType().getFieldCount(),
              partialQuery.getWindowProject().getProjects()
          ),
          "mapping for windowProject[%s]",
          partialQuery.getWindowProject()
      );

      // Reorder / subset the window output columns according to the projection's mapping.
      final List<String> windowProjectOutputColumns = new ArrayList<>();
      for (int i = 0; i < mapping.size(); i++) {
        windowProjectOutputColumns.add(windowOutputColumns.get(mapping.getSourceOpt(i)));
      }

      return new Windowing(
          RowSignatures.fromRelDataType(windowProjectOutputColumns, partialQuery.getWindowProject().getRowType()),
          ops
      );
    } else {
      // No windowProject.
      return new Windowing(
          RowSignatures.fromRelDataType(windowOutputColumns, window.getRowType()),
          ops
      );
    }
  }

  /**
   * Row signature reported by {@link #getSignature()}.
   */
  private final RowSignature signature;

  /**
   * Creates a windowing stage from an already-planned operator chain.
   *
   * @param signature row signature to report from {@link #getSignature()}
   * @param ops       operator factories to report from {@link #getOperators()}; the list is stored as-is, it is
   *                  not copied
   */
  public Windowing(
      final RowSignature signature,
      final List<OperatorFactory> ops
  )
  {
    this.signature = signature;
    this.ops = ops;
  }

  /**
   * @return the row signature this instance was constructed with
   */
  public RowSignature getSignature()
  {
    return this.signature;
  }

  /**
   * @return the operator factories this instance was constructed with; this is the stored list itself, not a copy
   */
  public List<OperatorFactory> getOperators()
  {
    return ops;
  }

  /**
   * Factory that turns the planner-side description of one window function call into the {@link Processor} that
   * evaluates it. Implemented by the lambdas registered in {@code KNOWN_WINDOW_FNS}.
   */
  @FunctionalInterface
  private interface ProcessorMaker
  {
    /**
     * @param agg the window function call to build a processor for
     *
     * @return processor that evaluates {@code agg}
     */
    Processor make(WindowAggregate agg);
  }

  /**
   * Pairs one Calcite {@link Window.Group} with its owning {@link Window} and a {@link RowSignature}, so that the
   * field indexes used by the group can be resolved to column names.
   */
  private static class WindowGroup
  {
    private final Window window;
    private final RowSignature sig;
    private final Window.Group group;

    public WindowGroup(Window window, Window.Group group, RowSignature sig)
    {
      this.window = window;
      this.sig = sig;
      this.group = group;
    }

    /**
     * Names of the columns the group is keyed (partitioned) by, resolved through the signature. A new list is
     * built on every call.
     */
    public ArrayList<String> getPartitionColumns()
    {
      final ArrayList<String> retVal = new ArrayList<>();
      for (int groupKey : group.keys) {
        retVal.add(sig.getColumnName(groupKey));
      }
      return retVal;
    }

    /**
     * The group's order keys as columns with a direction. A new list is built on every call.
     *
     * @throws QueryException if an order key uses a direction other than ASCENDING or DESCENDING
     */
    public ArrayList<ColumnWithDirection> getOrdering()
    {
      final List<RelFieldCollation> fields = group.orderKeys.getFieldCollations();
      final ArrayList<ColumnWithDirection> retVal = new ArrayList<>(fields.size());
      for (RelFieldCollation field : fields) {
        final ColumnWithDirection.Direction direction;
        switch (field.direction) {
          case ASCENDING:
            direction = ColumnWithDirection.Direction.ASC;
            break;
          case DESCENDING:
            direction = ColumnWithDirection.Direction.DESC;
            break;
          default:
            throw new QueryException(
                QueryException.SQL_QUERY_UNSUPPORTED_ERROR_CODE,
                StringUtils.format("Cannot handle ordering with direction[%s]", field.direction),
                null,
                null
            );
        }
        retVal.add(new ColumnWithDirection(sig.getColumnName(field.getFieldIndex()), direction));
      }
      return retVal;
    }

    /**
     * Same columns as {@link #getOrdering()}, in the same order, with the direction dropped.
     */
    public ArrayList<String> getOrderingColumNames()
    {
      final ArrayList<ColumnWithDirection> ordering = getOrdering();
      final ArrayList<String> retVal = new ArrayList<>(ordering.size());
      for (ColumnWithDirection column : ordering) {
        retVal.add(column.getColumn());
      }
      return retVal;
    }

    /**
     * The aggregate calls of this group, as computed by Calcite against the owning window.
     */
    public List<AggregateCall> getAggregateCalls()
    {
      return group.getAggregateCalls(window);
    }

    /**
     * Translates the group's bounds into a {@link WindowFrame}. A group that is unbounded on both ends maps to
     * {@link WindowFrame#unbounded()}; otherwise the frame carries the peer type, both bounds, and (for
     * non-ROWS frames only) the ordering columns.
     */
    public WindowFrame getWindowFrame()
    {
      if (group.lowerBound.isUnbounded() && group.upperBound.isUnbounded()) {
        return WindowFrame.unbounded();
      }
      return new WindowFrame(
          group.isRows ? WindowFrame.PeerType.ROWS : WindowFrame.PeerType.RANGE,
          group.lowerBound.isUnbounded(),
          figureOutOffset(group.lowerBound),
          group.upperBound.isUnbounded(),
          figureOutOffset(group.upperBound),
          group.isRows ? null : getOrdering()
      );
    }

    /**
     * Offset of a bound: 0 for unbounded and current-row bounds, otherwise the integer value of the constant
     * that the bound's offset refers to.
     */
    private int figureOutOffset(RexWindowBound bound)
    {
      if (bound.isUnbounded() || bound.isCurrentRow()) {
        return 0;
      }
      return getConstant(((RexInputRef) bound.getOffset()).getIndex());
    }

    /**
     * Resolves an input reference that points at one of the window's constants. The index is shifted down by the
     * signature size before indexing into {@code window.constants}.
     */
    private int getConstant(int refIndex)
    {
      return ((Number) window.constants.get(refIndex - sig.size()).getValue()).intValue();
    }
  }

  /**
   * Planner-side view of a single window function call: gives {@link ProcessorMaker}s access to the call's output
   * name, its column and constant arguments, and the window group it belongs to.
   */
  private static class WindowAggregate
  {
    private final String outputName;
    private final AggregateCall call;
    private final RowSignature sig;
    private final PlannerContext context;
    private final RexBuilder rexBuilder;
    private final Project project;
    private final List<RexLiteral> constants;
    private final WindowGroup group;

    /**
     * @throws ISE if {@code project} is non-null; this class is currently only used with a null project
     */
    private WindowAggregate(
        String outputName,
        AggregateCall call,
        RowSignature sig,
        PlannerContext context,
        RexBuilder rexBuilder,
        Project project,
        List<RexLiteral> constants,
        WindowGroup group
    )
    {
      this.outputName = outputName;
      this.call = call;
      this.sig = sig;
      this.context = context;
      this.rexBuilder = rexBuilder;
      this.project = project;
      this.constants = constants;
      this.group = group;

      if (project != null) {
        throw new ISE("Suddenly, the project[%s] is no longer null, the code might need to change.", project);
      }
    }

    public String getOutputName()
    {
      return outputName;
    }

    public WindowGroup getGroup()
    {
      return group;
    }

    /**
     * Resolves the argument at {@code argPosition} to a column.
     *
     * @param argPosition position within the call's argument list
     *
     * @return the direct column of the argument's expression, as reported by
     *         {@link DruidExpression#getDirectColumn()}
     *
     * @throws ISE if the argument cannot be converted to a {@link DruidExpression}
     */
    public String getColumn(int argPosition)
    {
      final RexNode columnArgument =
          Expressions.fromFieldAccess(rexBuilder.getTypeFactory(), sig, project, call.getArgList().get(argPosition));
      final DruidExpression expression = Expressions.toDruidExpression(context, sig, columnArgument);
      if (expression == null) {
        throw new ISE("Couldn't get an expression from columnArgument[%s]", columnArgument);
      }
      return expression.getDirectColumn();
    }

    /**
     * Looks up the constant that the argument at {@code argPosition} refers to. The argument's field index is
     * shifted down by the signature size before indexing into the constants list.
     */
    public RexLiteral getConstantArgument(int argPosition)
    {
      return constants.get(call.getArgList().get(argPosition) - sig.size());
    }

    /**
     * The constant argument at {@code argPosition}, as an int. The literal's value is cast to {@link Number}.
     */
    public int getConstantInt(int argPosition)
    {
      return ((Number) getConstantArgument(argPosition).getValue()).intValue();
    }

    /**
     * Like {@link #getConstantInt(int)}, but returns {@code defaultValue} when the call has no argument at
     * {@code argPosition}.
     */
    public int getConstantInt(int argPosition, int defaultValue)
    {
      if (argPosition >= call.getArgList().size()) {
        return defaultValue;
      }
      return getConstantInt(argPosition);
    }
  }

  /**
   * Return an insertion-ordered set of {@link ColumnWithDirection} corresponding to a {@link RelCollation}.
   *
   * Translation stops at the first field whose direction is neither (strictly) ascending nor (strictly)
   * descending; the columns collected up to that point are returned.
   *
   * @param collation          collation
   * @param sourceRowSignature signature of the collated rows
   *
   * @return sort columns in collation order; empty if the first field already has an unusable direction
   */
  private static LinkedHashSet<ColumnWithDirection> computeSortColumnsFromRelCollation(
      final RelCollation collation,
      final RowSignature sourceRowSignature
  )
  {
    final LinkedHashSet<ColumnWithDirection> retVal = new LinkedHashSet<>();

    for (RelFieldCollation fieldCollation : collation.getFieldCollations()) {
      final ColumnWithDirection.Direction direction;

      switch (fieldCollation.getDirection()) {
        case ASCENDING:
        case STRICTLY_ASCENDING:
          direction = ColumnWithDirection.Direction.ASC;
          break;

        case DESCENDING:
        case STRICTLY_DESCENDING:
          direction = ColumnWithDirection.Direction.DESC;
          break;

        default:
          // Not a useful direction. Return whatever we've come up with so far.
          return retVal;
      }

      retVal.add(
          new ColumnWithDirection(
              sourceRowSignature.getColumnName(fieldCollation.getFieldIndex()),
              direction
          )
      );
    }

    return retVal;
  }

  /**
   * Whether currentSort is a prefix of priorSort. (i.e., whether data sorted by priorSort is *also* sorted
   * by currentSort.)
   *
   * @param priorSort   sort order the data already has
   * @param currentSort sort order that is required
   *
   * @return true if every element of currentSort equals the element at the same position of priorSort; in
   *         particular, true when currentSort is empty
   */
  private static boolean sortMatches(
      final Iterable<ColumnWithDirection> priorSort,
      final Iterable<ColumnWithDirection> currentSort
  )
  {
    final Iterator<ColumnWithDirection> priorIterator = priorSort.iterator();

    // Walk both sequences in lock-step; running out of prior columns, or hitting a differing column, means the
    // existing order is not sufficient.
    for (ColumnWithDirection columnWithDirection : currentSort) {
      if (!priorIterator.hasNext() || !columnWithDirection.equals(priorIterator.next())) {
        return false;
      }
    }

    return true;
  }
}