com.twitter.scalding.Operations.scala Maven / Gradle / Ivy

Go to download
Show more of this group Show more artifacts with this name
Show all versions of scalding-core_2.11 Show documentation
scalding-core
There is a newer version: 0.16.1-RC3
/*
Copyright 2012 Twitter, Inc.

Licensed under the Apache License, Version 2.0 (the "License");
you may not use this file except in compliance with the License.
You may obtain a copy of the License at

http://www.apache.org/licenses/LICENSE-2.0

Unless required by applicable law or agreed to in writing, software
distributed under the License is distributed on an "AS IS" BASIS,
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
See the License for the specific language governing permissions and
limitations under the License.
*/
package com.twitter.scalding {

  import cascading.operation._
  import cascading.tuple._
  import cascading.flow._
  import cascading.pipe.assembly.{ AggregateBy, AggregateByProps }
  import com.twitter.chill.MeatLocker
  import scala.collection.JavaConverters._

  import com.twitter.algebird.{ Semigroup, StatefulSummer, SummingWithHitsCache, AdaptiveCache }
  import com.twitter.scalding.mathematics.Poisson
  import serialization.Externalizer
  import scala.util.Try

  /**
   * Stackable trait mixed into the scalding operations in this file. Its `prepare`
   * registers the FlowProcess with RuntimeStats and then delegates to the next
   * `prepare` in the linearization.
   * NOTE(review): an operation that overrides `prepare` must call `super.prepare`
   * for this hook to run.
   */
  trait ScaldingPrepare[C] extends Operation[C] {
    abstract override def prepare(flowProcess: FlowProcess[_], operationCall: OperationCall[C]): Unit = {
      // Register the flow process first, then continue with the inherited prepare.
      RuntimeStats.addFlowProcess(flowProcess)
      super.prepare(flowProcess, operationCall)
    }
  }

  /**
   * Cascading Function that converts each argument entry with `conv`, applies `fn`
   * to it, and emits one tuple (built by `set`) per element of the returned collection.
   * The function is held in an Externalizer; the constructor parameter itself is transient.
   */
  class FlatMapFunction[S, T](@transient fn: S => TraversableOnce[T], fields: Fields,
    conv: TupleConverter[S], set: TupleSetter[T])
    extends BaseOperation[Any](fields) with Function[Any] with ScaldingPrepare[Any] {
    val lockedFn = Externalizer(fn)

    /**
     * Package-private accessor for the function wrapped by this FlatMapFunction
     */
    private[scalding] def getFunction = fn

    def operate(flowProcess: FlowProcess[_], functionCall: FunctionCall[Any]): Unit = {
      val produced = lockedFn.get(conv(functionCall.getArguments))
      produced.foreach { item: T =>
        // Build the output tuple first, then hand it to the collector
        val outTuple = set(item)
        functionCall.getOutputCollector.add(outTuple)
      }
    }
  }

  /**
   * Cascading Function that converts each argument entry with `conv`, applies `fn`
   * once, and emits exactly one output tuple built by `set`.
   */
  class MapFunction[S, T](@transient fn: S => T, fields: Fields,
    conv: TupleConverter[S], set: TupleSetter[T])
    extends BaseOperation[Any](fields) with Function[Any] with ScaldingPrepare[Any] {
    val lockedFn = Externalizer(fn)
    def operate(flowProcess: FlowProcess[_], functionCall: FunctionCall[Any]): Unit = {
      val mapper = lockedFn.get
      val mapped = mapper(conv(functionCall.getArguments))
      val collector = functionCall.getOutputCollector
      collector.add(set(mapped))
    }
  }

  /**
   * Pass-through operation: every incoming argument entry is emitted unchanged.
   * The IdentityFunction puts empty nodes in the cascading graph. We use these to nudge
   * the cascading planner in some edge cases.
   */
  object IdentityFunction
    extends BaseOperation[Any](Fields.ALL) with Function[Any] with ScaldingPrepare[Any] {
    def operate(flowProcess: FlowProcess[_], functionCall: FunctionCall[Any]): Unit = {
      val collector = functionCall.getOutputCollector
      collector.add(functionCall.getArguments)
    }
  }

  /**
   * Pass-through operation that additionally runs `fn` when cascading calls `cleanup`.
   * Tuples flow through unchanged, exactly as with IdentityFunction.
   */
  class CleanupIdentityFunction(@transient fn: () => Unit)
    extends BaseOperation[Any](Fields.ALL) with Function[Any] with ScaldingPrepare[Any] {

    val lockedEf = Externalizer(fn)

    def operate(flowProcess: FlowProcess[_], functionCall: FunctionCall[Any]): Unit = {
      val collector = functionCall.getOutputCollector
      collector.add(functionCall.getArguments)
    }

    override def cleanup(flowProcess: FlowProcess[_], operationCall: OperationCall[Any]): Unit = {
      // Only the retrieval of the callback is guarded by Try; if that fails the callback is
      // skipped. An exception thrown by the callback itself still propagates.
      Try(lockedEf.get).foreach { callback => callback() }
    }
  }

  /**
   * Cascading Function backed by a PartialFunction: an input is mapped and emitted only
   * when the partial function is defined for it; otherwise nothing is emitted.
   */
  class CollectFunction[S, T](@transient fn: PartialFunction[S, T], fields: Fields,
    conv: TupleConverter[S], set: TupleSetter[T])
    extends BaseOperation[Any](fields) with Function[Any] with ScaldingPrepare[Any] {

    val lockedFn = Externalizer(fn)

    def operate(flowProcess: FlowProcess[_], functionCall: FunctionCall[Any]): Unit = {
      val pf = lockedFn.get
      val input = conv(functionCall.getArguments)
      val defined = pf.isDefinedAt(input)

      if (defined) {
        val collector = functionCall.getOutputCollector
        collector.add(set(pf(input)))
      }
    }
  }

  /**
   * An implementation of map-side combining which is appropriate for associative and commutative functions
   * If a cacheSize is given, it is used, else we query
   * the config for cascading.aggregateby.threshold (standard cascading param for an equivalent case)
   * else we use a default value of 100,000
   *
   * This keeps a cache of keys up to the cache-size, summing values as keys collide
   * On eviction, or completion of this Operation, the key-value pairs are put into outputCollector.
   *
   * This NEVER spills to disk and should generally never be a performance penalty. If you have
   * poor locality in the keys, you just don't get any benefit, but there is little added cost.
   *
   * Note this means that you may still have repeated keys in the output even on a single mapper
   * since the key space may be so large that you can't fit all of them in the cache at the same
   * time.
   *
   * You can use this with the Fields-API by doing:
   * {{{
   *  val msr = new MapsideReduce(Semigroup.from(fn), 'key, 'value, None)
   *  // MUST map onto the same key,value space (may be multiple fields)
   *  val mapSideReduced = pipe.eachTo(('key, 'value) -> ('key, 'value)) { _ => msr }
   * }}}
   * That said, this is equivalent to AggregateBy, and the only value is that it is much simpler than AggregateBy.
   * AggregateBy assumes several parallel reductions are happening, and thus has many loops, and array lookups
   * to deal with that.  Since this does many fewer allocations, and has a smaller code-path it may be faster for
   * the typed-API.
   */
  object MapsideReduce {
    // Counter group under which the map-side caches report their hit/miss/eviction counters
    val COUNTER_GROUP: String = "MapsideReduce"
  }

  /**
   * Map-side combiner operating on cascading Tuples: values that share the same key tuple
   * are summed with `commutativeSemigroup` inside a MapsideCache held in the operation
   * context. Pairs leave the cache either on eviction (during `operate`) or on `flush`.
   *
   * @param commutativeSemigroup how two values for the same key are combined
   * @param keyFields fields selected from the arguments to form the key
   * @param valueFields fields selected from the arguments to form the value
   * @param cacheSize explicit cache size; when None the size is resolved by MapsideCache
   */
  class MapsideReduce[V](
    @transient commutativeSemigroup: Semigroup[V],
    keyFields: Fields, valueFields: Fields,
    cacheSize: Option[Int])(implicit conv: TupleConverter[V], set: TupleSetter[V])
    extends BaseOperation[MapsideCache[Tuple, V]](Fields.join(keyFields, valueFields))
    with Function[MapsideCache[Tuple, V]]
    with ScaldingPrepare[MapsideCache[Tuple, V]] {

    val boxedSemigroup = Externalizer(commutativeSemigroup)

    override def prepare(flowProcess: FlowProcess[_], operationCall: OperationCall[MapsideCache[Tuple, V]]): Unit = {
      // Run the stacked ScaldingPrepare hook; without this call the override would
      // silently skip RuntimeStats.addFlowProcess.
      super.prepare(flowProcess, operationCall)
      //Set up the context:
      implicit val sg: Semigroup[V] = boxedSemigroup.get
      val cache = MapsideCache[Tuple, V](cacheSize, flowProcess)
      operationCall.setContext(cache)
    }

    /**
     * Emits every evicted (key, value) pair as a single tuple: key fields followed by value fields.
     * Does nothing when `evicted` is empty.
     */
    @inline
    private def add(evicted: Option[Map[Tuple, V]], functionCall: FunctionCall[MapsideCache[Tuple, V]]): Unit = {
      // Use iterator and while for optimal performance (avoid closures/fn calls)
      if (evicted.isDefined) {
        // Don't use pattern matching in performance-critical code
        @SuppressWarnings(Array("org.brianmckenna.wartremover.warts.OptionPartial"))
        val it = evicted.get.iterator
        val tecol = functionCall.getOutputCollector
        while (it.hasNext) {
          val (key, value) = it.next
          // Safe to mutate this key as it is evicted from the map
          key.addAll(set(value))
          tecol.add(key)
        }
      }
    }

    /** Adds the incoming key/value to the cache and emits whatever the cache evicted. */
    override def operate(flowProcess: FlowProcess[_], functionCall: FunctionCall[MapsideCache[Tuple, V]]): Unit = {
      val cache = functionCall.getContext
      val keyValueTE = functionCall.getArguments
      // Have to keep a copy of the key tuple because cascading will modify it
      val key = keyValueTE.selectEntry(keyFields).getTupleCopy
      val value = conv(keyValueTE.selectEntry(valueFields))
      val evicted = cache.put(key, value)
      add(evicted, functionCall)
    }

    /** Emits everything the cache returns from its own flush. */
    override def flush(flowProcess: FlowProcess[_], operationCall: OperationCall[MapsideCache[Tuple, V]]): Unit = {
      // Docs say it is safe to do this cast:
      // http://docs.cascading.org/cascading/2.1/javadoc/cascading/operation/Operation.html#flush(cascading.flow.FlowProcess, cascading.operation.OperationCall)
      val functionCall = operationCall.asInstanceOf[FunctionCall[MapsideCache[Tuple, V]]]
      val cache = functionCall.getContext
      add(cache.flush, functionCall)
    }

    override def cleanup(flowProcess: FlowProcess[_], operationCall: OperationCall[MapsideCache[Tuple, V]]): Unit = {
      // The cache may be large, so make sure we drop any reference to it ASAP;
      // probably overly defensive, but it's super cheap.
      operationCall.setContext(null)
    }
  }

  /**
   * Map-side combiner for typed key/value pairs. Each incoming TupleEntry is expanded by `fn`
   * into (K, V) pairs; pairs from one entry are pre-merged with `commutativeSemigroup` and
   * then pushed into a MapsideCache held in the operation context. Pairs leave the cache
   * either on eviction (during `operate`) or on `flush`.
   *
   * @param fn expands one input entry into zero or more key/value pairs
   * @param commutativeSemigroup how two values for the same key are combined
   * @param sourceFields not read anywhere inside this class
   * @param keyFields joined with valueFields to form the declared output fields
   * @param valueFields joined with keyFields to form the declared output fields
   * @param cacheSize explicit cache size; when None the size is resolved by MapsideCache
   */
  class TypedMapsideReduce[K, V](
    @transient fn: TupleEntry => TraversableOnce[(K, V)],
    @transient commutativeSemigroup: Semigroup[V],
    sourceFields: Fields,
    keyFields: Fields, valueFields: Fields,
    cacheSize: Option[Int])(implicit setKV: TupleSetter[(K, V)])
    extends BaseOperation[MapsideCache[K, V]](Fields.join(keyFields, valueFields))
    with Function[MapsideCache[K, V]]
    with ScaldingPrepare[MapsideCache[K, V]] {

    val boxedSemigroup = Externalizer(commutativeSemigroup)
    val lockedFn = Externalizer(fn)

    override def prepare(flowProcess: FlowProcess[_], operationCall: OperationCall[MapsideCache[K, V]]): Unit = {
      // Run the stacked ScaldingPrepare hook; without this call the override would
      // silently skip RuntimeStats.addFlowProcess.
      super.prepare(flowProcess, operationCall)
      //Set up the context:
      implicit val sg: Semigroup[V] = boxedSemigroup.get
      val cache = MapsideCache[K, V](cacheSize, flowProcess)
      operationCall.setContext(cache)
    }

    /**
     * Emits every evicted (key, value) pair as one tuple built by `setKV`.
     * Does nothing when `evicted` is empty.
     */
    // Don't use pattern matching in a performance-critical section
    @SuppressWarnings(Array("org.brianmckenna.wartremover.warts.OptionPartial"))
    @inline
    private def add(evicted: Option[Map[K, V]], functionCall: FunctionCall[MapsideCache[K, V]]): Unit = {
      // Use iterator and while for optimal performance (avoid closures/fn calls)
      if (evicted.isDefined) {
        val it = evicted.get.iterator
        val tecol = functionCall.getOutputCollector
        while (it.hasNext) {
          val (key, value) = it.next
          // A new tuple is built for every pair; the key itself is not modified here
          tecol.add(setKV(key, value))
        }
      }
    }

    import scala.collection.mutable.{ Map => MMap }

    /**
     * Read-only Map view over a mutable map, so the merged pairs can be handed to the cache
     * without copying. `+` and `-` fall back to copying into an immutable map.
     */
    private[this] class CollectionBackedMap[K, V](val backingMap: MMap[K, V]) extends Map[K, V] with java.io.Serializable {
      def get(key: K) = backingMap.get(key)

      def iterator = backingMap.iterator

      def +[B1 >: V](kv: (K, B1)) = backingMap.toMap + kv

      def -(key: K) = backingMap.toMap - key
    }

    /**
     * Collapses the pairs into a map, summing values of repeated keys with the Semigroup.
     */
    // Don't use pattern matching in a performance-critical section
    @SuppressWarnings(Array("org.brianmckenna.wartremover.warts.OptionPartial"))
    private[this] def mergeTraversableOnce[K, V: Semigroup](items: TraversableOnce[(K, V)]): Map[K, V] = {
      val mutable = scala.collection.mutable.OpenHashMap[K, V]() // Scala's OpenHashMap seems faster than Java and Scala's HashMap Impl's
      val innerIter = items.toIterator
      while (innerIter.hasNext) {
        val (k, v) = innerIter.next
        val oldVOpt: Option[V] = mutable.get(k)
        // sorry for the micro optimization here: avoiding a closure
        val newV: V = if (oldVOpt.isEmpty) v else Semigroup.plus(oldVOpt.get, v)
        mutable.update(k, newV)
      }
      new CollectionBackedMap(mutable)
    }

    /** Expands the entry, pre-merges its pairs, adds them to the cache and emits any evictions. */
    override def operate(flowProcess: FlowProcess[_], functionCall: FunctionCall[MapsideCache[K, V]]): Unit = {
      val cache = functionCall.getContext
      // Explicit type, matching the declaration in prepare
      implicit val sg: Semigroup[V] = boxedSemigroup.get
      val res: Map[K, V] = mergeTraversableOnce(lockedFn.get(functionCall.getArguments))
      val evicted = cache.putAll(res)
      add(evicted, functionCall)
    }

    /** Emits everything the cache returns from its own flush. */
    override def flush(flowProcess: FlowProcess[_], operationCall: OperationCall[MapsideCache[K, V]]): Unit = {
      // Docs say it is safe to do this cast:
      // http://docs.cascading.org/cascading/2.1/javadoc/cascading/operation/Operation.html#flush(cascading.flow.FlowProcess, cascading.operation.OperationCall)
      val functionCall = operationCall.asInstanceOf[FunctionCall[MapsideCache[K, V]]]
      val cache = functionCall.getContext
      add(cache.flush, functionCall)
    }

    override def cleanup(flowProcess: FlowProcess[_], operationCall: OperationCall[MapsideCache[K, V]]): Unit = {
      // The cache may be large, so make sure we drop any reference to it ASAP;
      // probably overly defensive, but it's super cheap.
      operationCall.setContext(null)
    }
  }

  /**
   * Interface of the key/value cache that the map-side reducers keep in their operation
   * context. Each method returns an optional map of pairs, which the callers in this file
   * emit to the output collector; None means there is nothing to emit.
   */
  sealed trait MapsideCache[K, V] {
    // Returns the pairs to emit when the owning operation is flushed.
    def flush: Option[Map[K, V]]
    // Adds a single pair; the result carries any pairs evicted as a consequence.
    def put(key: K, value: V): Option[Map[K, V]]

    // Adds a whole map of pairs in one call.
    // NOTE(review): the parameter is named `key` although it holds key/value pairs
    // (the implementations in this file call it `kvs`).
    def putAll(key: Map[K, V]): Option[Map[K, V]]
  }

  /**
   * Factory and configuration keys for MapsideCache instances.
   */
  object MapsideCache {
    val ADAPTIVE_CACHE_KEY = "scalding.mapsidecache.adaptive"
    val DEFAULT_CACHE_SIZE = 100000
    val CASCADING2_SIZE_CONFIG_KEY = Config.CascadingAggregateByThreshold
    val CASCADING3_SIZE_CONFIG_KEY = AggregateByProps.AGGREGATE_BY_CAPACITY

    /**
     * Resolves the cache size from the flow properties. Both the cascading 2 and the
     * cascading 3 property are consulted for backward compatibility; when both are set the
     * larger value wins, and when neither is set DEFAULT_CACHE_SIZE is used.
     * Null or empty property values count as unset.
     */
    def getCacheSize(fp: FlowProcess[_]): Int = {
      def readInt(name: String): Option[Int] =
        Option(fp.getStringProperty(name)).filter(_.nonEmpty).map(_.toInt)

      val fromCascading2 = readInt(CASCADING2_SIZE_CONFIG_KEY)
      val fromCascading3 = readInt(CASCADING3_SIZE_CONFIG_KEY)
      val configured = List(fromCascading2, fromCascading3).flatten
      if (configured.isEmpty) DEFAULT_CACHE_SIZE else configured.max
    }

    /**
     * Builds a cache of the given size (or the configured size when `cacheSize` is None).
     * An adaptive cache is used whenever ADAPTIVE_CACHE_KEY has any non-null value in the
     * flow properties; otherwise a summing cache is used.
     */
    def apply[K, V: Semigroup](cacheSize: Option[Int], flowProcess: FlowProcess[_]): MapsideCache[K, V] = {
      val size = cacheSize match {
        case Some(explicit) => explicit
        case None => getCacheSize(flowProcess)
      }
      val adaptive = flowProcess.getStringProperty(ADAPTIVE_CACHE_KEY) != null
      if (adaptive)
        new AdaptiveMapsideCache(flowProcess, new AdaptiveCache(size))
      else
        new SummingMapsideCache(flowProcess, new SummingWithHitsCache(size))
    }
  }

  /**
   * MapsideCache backed by a SummingWithHitsCache. Every insertion updates the
   * "misses", "hits" and "evictions" counters of the MapsideReduce counter group.
   */
  class SummingMapsideCache[K, V](flowProcess: FlowProcess[_], summingCache: SummingWithHitsCache[K, V])
    extends MapsideCache[K, V] {
    private[this] val misses = CounterImpl(flowProcess, StatKey(MapsideReduce.COUNTER_GROUP, "misses"))
    private[this] val hits = CounterImpl(flowProcess, StatKey(MapsideReduce.COUNTER_GROUP, "hits"))
    private[this] val evictions = CounterImpl(flowProcess, StatKey(MapsideReduce.COUNTER_GROUP, "evictions"))

    def flush = summingCache.flush

    // A single pair is just a one-element batch: the miss count becomes (1 - hits) either way
    def put(key: K, value: V): Option[Map[K, V]] = putAll(Map(key -> value))

    // Don't use pattern matching in a performance-critical section
    @SuppressWarnings(Array("org.brianmckenna.wartremover.warts.OptionPartial"))
    def putAll(kvs: Map[K, V]): Option[Map[K, V]] = {
      val outcome = summingCache.putWithHits(kvs)
      val curHits = outcome._1
      val evicted = outcome._2
      misses.increment(kvs.size - curHits)
      hits.increment(curHits)

      if (evicted.isDefined) {
        evictions.increment(evicted.get.size)
      }
      evicted
    }
  }

  /**
   * MapsideCache backed by an AdaptiveCache. Every insertion updates the "misses", "hits",
   * "capacity", "sentinel" and "evictions" counters of the MapsideReduce counter group.
   */
  class AdaptiveMapsideCache[K, V](flowProcess: FlowProcess[_], adaptiveCache: AdaptiveCache[K, V])
    extends MapsideCache[K, V] {
    private[this] val misses = CounterImpl(flowProcess, StatKey(MapsideReduce.COUNTER_GROUP, "misses"))
    private[this] val hits = CounterImpl(flowProcess, StatKey(MapsideReduce.COUNTER_GROUP, "hits"))
    private[this] val capacity = CounterImpl(flowProcess, StatKey(MapsideReduce.COUNTER_GROUP, "capacity"))
    private[this] val sentinel = CounterImpl(flowProcess, StatKey(MapsideReduce.COUNTER_GROUP, "sentinel"))
    private[this] val evictions = CounterImpl(flowProcess, StatKey(MapsideReduce.COUNTER_GROUP, "evictions"))

    def flush = adaptiveCache.flush

    // A single pair is just a one-element batch: the miss count becomes (1 - hits) either way
    def put(key: K, value: V) = putAll(Map(key -> value))

    // Don't use pattern matching in a performance-critical section
    @SuppressWarnings(Array("org.brianmckenna.wartremover.warts.OptionPartial"))
    def putAll(kvs: Map[K, V]): Option[Map[K, V]] = {
      val outcome = adaptiveCache.putWithStats(kvs)
      val stats = outcome._1
      val evicted = outcome._2
      misses.increment(kvs.size - stats.hits)
      hits.increment(stats.hits)
      capacity.increment(stats.cacheGrowth)
      sentinel.increment(stats.sentinelGrowth)

      if (evicted.isDefined) {
        evictions.increment(evicted.get.size)
      }

      evicted
    }
  }

  /**
   * BaseOperation with support for a context object: `bf` creates the context in `prepare`
   * and `ef` receives it again in `cleanup`.
   *
   * @param bf begin function, evaluated once per prepare call to produce the context
   * @param ef end function, called with the context during cleanup
   * @param fields the declared fields of the operation
   */
  abstract class SideEffectBaseOperation[C](
    @transient bf: => C, // begin function returns a context
    @transient ef: C => Unit, // end function to clean up context object
    fields: Fields) extends BaseOperation[C](fields) with ScaldingPrepare[C] {
    // The by-name begin function is wrapped in a thunk so it can be externalized
    val lockedBf = Externalizer(() => bf)
    val lockedEf = Externalizer(ef)
    override def prepare(flowProcess: FlowProcess[_], operationCall: OperationCall[C]): Unit = {
      // Run the stacked ScaldingPrepare hook; without this call the override would
      // silently skip RuntimeStats.addFlowProcess.
      super.prepare(flowProcess, operationCall)
      operationCall.setContext(lockedBf.get.apply)
    }

    override def cleanup(flowProcess: FlowProcess[_], operationCall: OperationCall[C]): Unit = {
      lockedEf.get(operationCall.getContext)
    }
  }

  /**
   * A map function with a state object: the context is set up and torn down by the
   * SideEffectBaseOperation parent, and passed to `fn` together with every converted input.
   * Exactly one tuple is emitted per input.
   */
  class SideEffectMapFunction[S, C, T](
    bf: => C, // begin function returns a context
    @transient fn: (C, S) => T, // function that takes a context and a tuple and generate a new tuple
    ef: C => Unit, // end function to clean up context object
    fields: Fields,
    conv: TupleConverter[S],
    set: TupleSetter[T]) extends SideEffectBaseOperation[C](bf, ef, fields) with Function[C] {
    val lockedFn = Externalizer(fn)

    override def operate(flowProcess: FlowProcess[_], functionCall: FunctionCall[C]): Unit = {
      val state = functionCall.getContext
      val input = conv(functionCall.getArguments)
      val mapped = lockedFn.get(state, input)
      val collector = functionCall.getOutputCollector
      collector.add(set(mapped))
    }
  }

  /**
   * A flatmap function with a state object: the context is set up and torn down by the
   * SideEffectBaseOperation parent, and passed to `fn` together with every converted input.
   * One tuple is emitted per element returned by `fn`.
   */
  class SideEffectFlatMapFunction[S, C, T](
    bf: => C, // begin function returns a context
    @transient fn: (C, S) => TraversableOnce[T], // function that takes a context and a tuple, returns TraversableOnce of T
    ef: C => Unit, // end function to clean up context object
    fields: Fields,
    conv: TupleConverter[S],
    set: TupleSetter[T]) extends SideEffectBaseOperation[C](bf, ef, fields) with Function[C] {
    val lockedFn = Externalizer(fn)

    override def operate(flowProcess: FlowProcess[_], functionCall: FunctionCall[C]): Unit = {
      val state = functionCall.getContext
      val input = conv(functionCall.getArguments)
      val produced = lockedFn.get(state, input)
      produced.foreach { item =>
        functionCall.getOutputCollector.add(set(item))
      }
    }
  }

  /**
   * Cascading Filter driven by a keep-predicate: an entry is removed exactly when
   * `fn` returns false for the converted input.
   */
  class FilterFunction[T](@transient fn: T => Boolean, conv: TupleConverter[T])
    extends BaseOperation[Any] with Filter[Any] with ScaldingPrepare[Any] {
    val lockedFn = Externalizer(fn)

    def isRemove(flowProcess: FlowProcess[_], filterCall: FilterCall[Any]) = {
      // fn says what to keep; cascading asks what to remove, hence the negation
      val keep = lockedFn.get(conv(filterCall.getArguments))
      !keep
    }
  }

  // All the following are operations for use in GroupBuilder

  /**
   * Aggregator implementing a left fold: the context starts as a copy of `init`, is replaced
   * by `fn(context, input)` for every argument entry, and is emitted on completion.
   */
  class FoldAggregator[T, X](@transient fn: (X, T) => X, @transient init: X, fields: Fields,
    conv: TupleConverter[T], set: TupleSetter[X])
    extends BaseOperation[X](fields) with Aggregator[X] with ScaldingPrepare[X] {
    val lockedFn = Externalizer(fn)
    private val lockedInit = MeatLocker(init)
    // Each group gets its own copy of the initial value
    def initCopy = lockedInit.copy

    def start(flowProcess: FlowProcess[_], call: AggregatorCall[X]): Unit =
      call.setContext(initCopy)

    def aggregate(flowProcess: FlowProcess[_], call: AggregatorCall[X]): Unit = {
      val accumulated = call.getContext
      val incoming = conv(call.getArguments)
      val folded = lockedFn.get(accumulated, incoming)
      call.setContext(folded)
    }

    def complete(flowProcess: FlowProcess[_], call: AggregatorCall[X]): Unit =
      emit(flowProcess, call)

    def emit(flowProcess: FlowProcess[_], call: AggregatorCall[X]): Unit = {
      val collector = call.getOutputCollector
      collector.add(set(call.getContext))
    }
  }

  /**
   * Map-reduce-map aggregator: each input is mapped with `inputFsmf`, the mapped values are
   * combined pairwise with `inputRfn`, and the final value is mapped with `inputMrfn`
   * before being emitted.
   *
   * fields are the declared fields of this aggregator
   */
  class MRMAggregator[T, X, U](
    @transient inputFsmf: T => X,
    @transient inputRfn: (X, X) => X,
    @transient inputMrfn: X => U,
    fields: Fields, conv: TupleConverter[T], set: TupleSetter[U])
    extends BaseOperation[Tuple](fields) with Aggregator[Tuple] with ScaldingPrepare[Tuple] {
    val fsmf = Externalizer(inputFsmf)
    val rfn = Externalizer(inputRfn)
    val mrfn = Externalizer(inputMrfn)

    // The context is a one-element Tuple that is mutated in place, so we
    // don't have to allocate at every step of the loop. It starts out as null:
    def start(flowProcess: FlowProcess[_], call: AggregatorCall[Tuple]): Unit =
      call.setContext(null)

    def extractArgument(call: AggregatorCall[Tuple]): X = fsmf.get(conv(call.getArguments))

    def aggregate(flowProcess: FlowProcess[_], call: AggregatorCall[Tuple]): Unit = {
      val incoming = extractArgument(call)
      val holder = call.getContext
      if (holder != null) {
        // Combine with the running value and store the result back in the same tuple
        val running = holder.getObject(0).asInstanceOf[X]
        val combined = rfn.get(running, incoming)
        holder.set(0, combined.asInstanceOf[AnyRef])
      } else {
        // First value of the group: this is the only allocation done by this loop.
        val fresh = Tuple.size(1)
        fresh.set(0, incoming.asInstanceOf[AnyRef])
        call.setContext(fresh)
      }
    }

    def complete(flowProcess: FlowProcess[_], call: AggregatorCall[Tuple]): Unit = {
      val holder = call.getContext
      if (holder == null) {
        throw new Exception("MRMAggregator completed without any args")
      }
      val lastValue = holder.getObject(0).asInstanceOf[X]
      // Drop the reference to the context before emitting (the value may be big)
      call.setContext(null)
      call.getOutputCollector.add(set(mrfn.get(lastValue)))
    }
  }

  /**
   * Base class for AggregateBy functors that fold the arguments of a group into one value.
   * The running value lives in a one-element Tuple that serves as the context. The code below
   * attempts to be optimal with respect to memory allocations and performance, not functional
   * style purity.
   *
   * @param fields the declared fields of this functor
   */
  abstract class FoldFunctor[X](fields: Fields) extends AggregateBy.Functor {

    // Extend these three methods:
    /** Produces the initial value from the first arguments of a group. */
    def first(args: TupleEntry): X
    /** Combines the running value with the next arguments of the group. */
    def subsequent(oldValue: X, newArgs: TupleEntry): X
    /** Converts the final value into the tuple handed back from `complete`. */
    def finish(lastValue: X): Tuple

    override final def getDeclaredFields = fields

    /*
     * It's important to keep all state in the context as Cascading seems to
     * reuse these objects, so any per instance state might give unexpected
     * results.
     */
    override final def aggregate(flowProcess: FlowProcess[_], args: TupleEntry, context: Tuple) = {
      if (context == null) {
        // First call, make a new mutable tuple to reduce allocations:
        val fresh = Tuple.size(1)
        fresh.set(0, first(args).asInstanceOf[AnyRef])
        fresh
      } else {
        // We are updating: overwrite the single slot and return the same tuple for reuse
        val oldValue = context.getObject(0).asInstanceOf[X]
        context.set(0, subsequent(oldValue, args).asInstanceOf[AnyRef])
        context
      }
    }

    /**
     * Returns `finish` applied to the value stored in the context.
     * Throws an Exception when no aggregate call ever created a context.
     */
    override final def complete(flowProcess: FlowProcess[_], context: Tuple) = {
      if (context == null) {
        throw new Exception("FoldFunctor completed without any aggregate calls")
      } else {
        val res = context.getObject(0).asInstanceOf[X]
        // Make sure we remove the ref to the context ASAP:
        context.set(0, null)
        finish(res)
      }
    }
  }

  /**
   * FoldFunctor for the map-side half of a mapReduceMap: every input is mapped with
   * `inputMrfn` and the mapped values are combined with `inputRfn`. The final value is
   * turned into a tuple by `set`.
   */
  class MRMFunctor[T, X](
    @transient inputMrfn: T => X,
    @transient inputRfn: (X, X) => X,
    fields: Fields,
    conv: TupleConverter[T], set: TupleSetter[X])
    extends FoldFunctor[X](fields) {

    val mrfn = Externalizer(inputMrfn)
    val rfn = Externalizer(inputRfn)

    override def first(args: TupleEntry): X = {
      val converted = conv(args)
      mrfn.get(converted)
    }

    override def subsequent(oldValue: X, newArgs: TupleEntry) = {
      // Map the new arguments first, then combine with the running value
      val mappedNew = mrfn.get(conv(newArgs))
      val combine = rfn.get
      combine(oldValue, mappedNew)
    }

    override def finish(lastValue: X) = set(lastValue)
  }

  /**
   * MapReduceMapBy: an AggregateBy assembled from an MRMFunctor and an MRMAggregator.
   * The functor applies `mfn` and `rfn` and declares `middleFields`; the aggregator
   * reads those values back with `midConv` (its own first map step is the identity),
   * combines them with `rfn` again and applies `mfn2`, declaring `declaredFields`.
   * NOTE(review): presumably the functor runs map-side and the aggregator reduce-side,
   * as is usual for AggregateBy — confirm against the cascading documentation.
   */
  class MRMBy[T, X, U](arguments: Fields,
    middleFields: Fields,
    declaredFields: Fields,
    mfn: T => X,
    rfn: (X, X) => X,
    mfn2: X => U,
    startConv: TupleConverter[T],
    midSet: TupleSetter[X],
    midConv: TupleConverter[X],
    endSet: TupleSetter[U]) extends AggregateBy(
    arguments,
    new MRMFunctor[T, X](mfn, rfn, middleFields, startConv, midSet),
    new MRMAggregator[X, X, U](args => args, rfn, mfn2, declaredFields, midConv, endSet))

  /**
   * Cascading Buffer that hands a copy of `init` plus an iterator over the converted
   * arguments of a group to `inputIterfn`, and emits one tuple per returned element.
   */
  class BufferOp[I, T, X](
    @transient init: I,
    @transient inputIterfn: (I, Iterator[T]) => TraversableOnce[X],
    fields: Fields, conv: TupleConverter[T], set: TupleSetter[X])
    extends BaseOperation[Any](fields) with Buffer[Any] with ScaldingPrepare[Any] {
    val iterfn = Externalizer(inputIterfn)
    private val lockedInit = MeatLocker(init)
    // Each group gets its own copy of the initial value
    def initCopy = lockedInit.copy

    def operate(flowProcess: FlowProcess[_], call: BufferCall[Any]): Unit = {
      val collector = call.getOutputCollector
      val groupValues = call.getArgumentsIterator.asScala.map(conv(_))
      val produced = iterfn.get(initCopy, groupValues)
      produced.foreach { item => collector.add(set(item)) }
    }
  }

  /**
   * A buffer with a state object: the context is set up and torn down by the
   * SideEffectBaseOperation parent. For each group, `inputIterfn` receives a copy of `init`,
   * the context and an iterator over the converted arguments; one tuple is emitted per
   * returned element.
   */
  class SideEffectBufferOp[I, T, C, X](
    @transient init: I,
    bf: => C, // begin function returns a context
    @transient inputIterfn: (I, C, Iterator[T]) => TraversableOnce[X],
    ef: C => Unit, // end function to clean up context object
    fields: Fields,
    conv: TupleConverter[T],
    set: TupleSetter[X]) extends SideEffectBaseOperation[C](bf, ef, fields) with Buffer[C] {
    val iterfn = Externalizer(inputIterfn)
    private val lockedInit = MeatLocker(init)
    // Each group gets its own copy of the initial value
    def initCopy = lockedInit.copy

    def operate(flowProcess: FlowProcess[_], call: BufferCall[C]): Unit = {
      val state = call.getContext
      val collector = call.getOutputCollector
      val groupValues = call.getArgumentsIterator.asScala.map(conv(_))
      val produced = iterfn.get(initCopy, state, groupValues)
      produced.foreach { item => collector.add(set(item)) }
    }
  }

  /**
   * Sampling operation: for every input it draws a count from a Poisson(frac, seed) generator
   * kept in the operation context and emits that many Tuple.NULL tuples.
   */
  class SampleWithReplacement(frac: Double, val seed: Int = new java.util.Random().nextInt) extends BaseOperation[Poisson]()
    with Function[Poisson] with ScaldingPrepare[Poisson] {
    override def prepare(flowProcess: FlowProcess[_], operationCall: OperationCall[Poisson]): Unit = {
      super.prepare(flowProcess, operationCall)
      // A fresh generator per prepare call, seeded with the fixed seed of this instance
      operationCall.setContext(new Poisson(frac, seed))
    }

    def operate(flowProcess: FlowProcess[_], functionCall: FunctionCall[Poisson]): Unit = {
      val copies = functionCall.getContext.nextInt
      var emitted = 0
      while (emitted < copies) {
        functionCall.getOutputCollector().add(Tuple.NULL)
        emitted += 1
      }
    }
  }

  /**
   * In the typed API every reduce operation is handled by this Buffer: the group is converted
   * to a key, the arguments to an iterator of values, and every element produced by
   * `reduceFn` is emitted as a single-field tuple.
   */
  class TypedBufferOp[K, V, U](
    conv: TupleConverter[K],
    convV: TupleConverter[V],
    @transient reduceFn: (K, Iterator[V]) => Iterator[U],
    valueField: Fields)
    extends BaseOperation[Any](valueField) with Buffer[Any] with ScaldingPrepare[Any] {
    val reduceFnSer = Externalizer(reduceFn)

    def operate(flowProcess: FlowProcess[_], call: BufferCall[Any]): Unit = {
      val collector = call.getOutputCollector
      val groupKey = conv(call.getGroup)
      val groupValues = call.getArgumentsIterator.asScala.map(convV(_))

      // Plain while loop on purpose: avoids a lambda per group
      val reduced = reduceFnSer.get(groupKey, groupValues)
      while (reduced.hasNext) {
        // A new one-slot tuple is allocated for every result
        val outTuple = Tuple.size(1)
        outTuple.set(0, reduced.next)
        collector.add(outTuple)
      }
    }
  }
}