// com.yahoo.sketches.pig.frequencies.DataToFrequentStringsSketch (Maven / Gradle / Ivy)
/*
* Copyright 2016, Yahoo! Inc.
* Licensed under the terms of the Apache License 2.0. See LICENSE file at the project root for terms.
*/
package com.yahoo.sketches.pig.frequencies;
import org.apache.pig.Algebraic;
import com.yahoo.sketches.ArrayOfStringsSerDe;
/**
 * This UDF creates a {@code FrequentItemsSketch<String>} from raw data.
 * It supports all three ways: exec(), Accumulator and Algebraic.
 *
 * <p>The string-specific behavior comes from handing an {@link ArrayOfStringsSerDe} to the
 * parent class; the Algebraic stages are provided by the nested {@link Initial} and
 * {@link IntermediateFinal} classes.
 */
public class DataToFrequentStringsSketch extends DataToFrequentItemsSketch implements Algebraic {

  /**
   * Constructor.
   *
   * @param sketchSize String representation of sketch size; it is converted with
   *     {@link Integer#parseInt(String)}, so a non-numeric value raises
   *     {@link NumberFormatException}
   */
  public DataToFrequentStringsSketch(final String sketchSize) {
    super(DataToFrequentStringsSketch.parseSketchSize(sketchSize), new ArrayOfStringsSerDe());
  }

  /**
   * Reports the class that implements the initial Algebraic stage.
   *
   * @return the class name of {@link Initial}
   */
  @Override
  public String getInitial() {
    return Initial.class.getName();
  }

  /**
   * Reports the class that implements the intermediate Algebraic stage.
   *
   * @return the class name of {@link IntermediateFinal}
   */
  @Override
  public String getIntermed() {
    return IntermediateFinal.class.getName();
  }

  /**
   * Reports the class that implements the final Algebraic stage. The same class serves both the
   * intermediate and the final stage.
   *
   * @return the class name of {@link IntermediateFinal}
   */
  @Override
  public String getFinal() {
    return IntermediateFinal.class.getName();
  }

  /**
   * Converts the textual sketch size received by the constructors into an int.
   *
   * @param sketchSize String representation of sketch size
   * @return the parsed sketch size
   */
  private static int parseSketchSize(final String sketchSize) {
    return Integer.parseInt(sketchSize);
  }

  /**
   * Initial stage of the Algebraic function. It adds nothing to {@code AlgebraicInitial} beyond
   * the constructors below.
   */
  public static class Initial extends AlgebraicInitial {

    /**
     * Default constructor to make pig validation happy.
     */
    public Initial() {
      super();
    }

    /**
     * Constructor for the initial pass of an Algebraic function. This will be passed the same
     * constructor arguments as the original UDF. The argument is accepted but not used.
     *
     * @param sketchSize String representation of sketch size (ignored)
     */
    public Initial(final String sketchSize) {
      super();
    }
  }

  /**
   * Intermediate and final stages of the Algebraic function, specialized for strings by passing
   * an {@link ArrayOfStringsSerDe} to the parent class.
   */
  public static class IntermediateFinal extends DataToFrequentItemsSketchAlgebraicIntermediateFinal {

    /**
     * Default constructor to make pig validation happy.
     */
    public IntermediateFinal() {
      super();
    }

    /**
     * Constructor for the intermediate and final passes of an Algebraic function. This will be
     * passed the same constructor arguments as the original UDF.
     *
     * @param sketchSize String representation of sketch size; it is converted with
     *     {@link Integer#parseInt(String)}
     */
    public IntermediateFinal(final String sketchSize) {
      super(DataToFrequentStringsSketch.parseSketchSize(sketchSize), new ArrayOfStringsSerDe());
    }
  }
}