All Downloads are FREE. Search and download functionalities are using the official Maven repository.

org.apache.flink.table.runtime.outerJoinRunners.scala Maven / Gradle / Ivy

The newest version!
/*
 * Licensed to the Apache Software Foundation (ASF) under one
 * or more contributor license agreements.  See the NOTICE file
 * distributed with this work for additional information
 * regarding copyright ownership.  The ASF licenses this file
 * to you under the Apache License, Version 2.0 (the
 * "License"); you may not use this file except in compliance
 * with the License.  You may obtain a copy of the License at
 *
 *     http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */

package org.apache.flink.table.runtime

import java.lang.{Boolean => JBool}

import org.apache.flink.api.common.functions.util.FunctionUtils
import org.apache.flink.api.common.functions.{JoinFunction, RichFlatJoinFunction}
import org.apache.flink.api.common.typeinfo.TypeInformation
import org.apache.flink.api.java.typeutils.ResultTypeQueryable
import org.apache.flink.configuration.Configuration
import org.apache.flink.table.codegen.Compiler
import org.apache.flink.table.util.Logging
import org.apache.flink.types.Row
import org.apache.flink.util.Collector

abstract class OuterJoinRunner(
    name: String,
    code: String,
    @transient var returnType: TypeInformation[Row])
  extends RichFlatJoinFunction[Row, Row, Row]
  with ResultTypeQueryable[Row]
  with Compiler[JoinFunction[Row, Row, JBool]]
  with Logging {

  protected var function: JoinFunction[Row, Row, JBool] = null

  override def open(parameters: Configuration): Unit = {
    LOG.debug(s"Compiling FlatJoinFunction: $name \n\n Code:\n$code")
    val clazz = compile(getRuntimeContext.getUserCodeClassLoader, name, code)
    LOG.debug("Instantiating FlatJoinFunction.")
    function = clazz.newInstance()
    FunctionUtils.setFunctionRuntimeContext(function, getRuntimeContext)
    FunctionUtils.openFunction(function, parameters)
  }

  override def getProducedType: TypeInformation[Row] = returnType

  override def close(): Unit = {
    FunctionUtils.closeFunction(function)
  }
}

/**
  * Emits left outer join pairs of left and right rows.
  * Left rows are always preserved if no matching right row is found (predicate evaluates to false
  * or right input row is null).
  */
class LeftOuterJoinRunner(
    name: String,
    code: String,
    returnType: TypeInformation[Row])
  extends OuterJoinRunner(name, code, returnType) {

  val outRow = new Row(3)

  override final def join(leftWithCnt: Row, right: Row, out: Collector[Row]): Unit = {

    val left: Row = leftWithCnt.getField(0).asInstanceOf[Row]
    val leftCnt = leftWithCnt.getField(1)

    outRow.setField(0, left)
    outRow.setField(2, leftCnt)

    if (right == null) {
      // right input row is null. Emit pair with null as right row
      outRow.setField(1, null)
    } else {
      // evaluate predicate.
      if (function.join(left, right)) {
        // emit pair with right row
        outRow.setField(1, right)
      } else {
        // emit pair with null as right row
        outRow.setField(1, null)
      }
    }
    out.collect(outRow)

  }
}

/**
  * Emits right outer join pairs of left and right rows.
  * Right rows are always preserved if no matching left row is found (predicate evaluates to false
  * or left input row is null).
  */
class RightOuterJoinRunner(
  name: String,
  code: String,
  returnType: TypeInformation[Row])
  extends OuterJoinRunner(name, code, returnType) {

  val outRow = new Row(3)

  override final def join(left: Row, rightWithCnt: Row, out: Collector[Row]): Unit = {

    val right: Row = rightWithCnt.getField(0).asInstanceOf[Row]
    val rightCnt = rightWithCnt.getField(1)

    outRow.setField(1, right)
    outRow.setField(2, rightCnt)

    if (left == null) {
      // left input row is null. Emit pair with null as left row
      outRow.setField(0, null)
    } else {
      // evaluate predicate.
      if (function.join(left, right)) {
        outRow.setField(0, left)
      } else {
        outRow.setField(0, null)
      }
    }
    out.collect(outRow)
  }
}

/**
  * Emits full outer join pairs of left and right rows.
  * Left and right rows are always preserved if no matching right row is found (predicate evaluates
  * to false or left or right input row is null).
  */
class FullOuterJoinRunner(
  name: String,
  code: String,
  returnType: TypeInformation[Row])
  extends OuterJoinRunner(name, code, returnType) {

  val outRow = new Row(4)

  override final def join(leftWithCnt: Row, rightWithCnt: Row, out: Collector[Row]): Unit = {

    if (leftWithCnt == null) {
      // left row is null. Emit join pair with null as left row.
      val right: Row = rightWithCnt.getField(0).asInstanceOf[Row]
      val rightCnt = rightWithCnt.getField(1)

      outRow.setField(0, null)
      outRow.setField(1, right)
      outRow.setField(2, null)
      outRow.setField(3, rightCnt)
      out.collect(outRow)
    } else if (rightWithCnt == null) {
      // right row is null. Emit join pair with null as right row.
      val left: Row = leftWithCnt.getField(0).asInstanceOf[Row]
      val leftCnt = leftWithCnt.getField(1)

      outRow.setField(0, left)
      outRow.setField(1, null)
      outRow.setField(2, leftCnt)
      outRow.setField(3, null)
      out.collect(outRow)
    } else {
      // both input rows are not null. Evaluate predicate.
      val left: Row = leftWithCnt.getField(0).asInstanceOf[Row]
      val leftCnt = leftWithCnt.getField(1)
      val right: Row = rightWithCnt.getField(0).asInstanceOf[Row]
      val rightCnt = rightWithCnt.getField(1)

      if (function.join(left, right)) {
        // predicate was true. Set rows in join pair
        outRow.setField(0, left)
        outRow.setField(1, right)
        outRow.setField(2, leftCnt)
        outRow.setField(3, rightCnt)
        out.collect(outRow)
      } else {
        // predicate was false. Emit two join pairs to preserve both input rows.
        // emit pair with left row and null as right row
        outRow.setField(0, left)
        outRow.setField(1, null)
        outRow.setField(2, leftCnt)
        outRow.setField(3, null)
        out.collect(outRow)

        // emit pair with right row and null as left row
        outRow.setField(0, null)
        outRow.setField(1, right)
        outRow.setField(2, null)
        outRow.setField(3, rightCnt)
        out.collect(outRow)
      }
    }
  }
}




© 2015 - 2025 Weber Informatics LLC | Privacy Policy