// eu.stratosphere.api.common.distributions.SimpleIntegerDistribution Maven / Gradle / Ivy
/***********************************************************************************************************************
* Copyright (C) 2010-2013 by the Stratosphere project (http://stratosphere.eu)
*
* Licensed under the Apache License, Version 2.0 (the "License"); you may not use this file except in compliance with
* the License. You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software distributed under the License is distributed on
* an "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. See the License for the
* specific language governing permissions and limitations under the License.
**********************************************************************************************************************/
package eu.stratosphere.api.common.distributions;
import java.io.DataInput;
import java.io.DataOutput;
import java.io.IOException;
import eu.stratosphere.types.IntValue;
public class SimpleIntegerDistribution extends SimpleDistribution {
private static final long serialVersionUID = 1L;
public SimpleIntegerDistribution() {
boundaries = new IntValue[0][];
}
public SimpleIntegerDistribution(int[] bucketBoundaries) {
if (bucketBoundaries == null)
throw new IllegalArgumentException("Bucket boundaries must not be null.");
if (bucketBoundaries.length == 0)
throw new IllegalArgumentException("Bucket boundaries must not be empty.");
// dimensionality is one in this case
dim = 1;
// make the array 2-dimensional
boundaries = packIntegers(bucketBoundaries);
}
public SimpleIntegerDistribution(IntValue[] bucketBoundaries) {
if (bucketBoundaries == null)
throw new IllegalArgumentException("Bucket boundaries must not be null.");
if (bucketBoundaries.length == 0)
throw new IllegalArgumentException("Bucket boundaries must not be empty.");
// dimensionality is one in this case
dim = 1;
// make the array 2-dimensional
boundaries = new IntValue[bucketBoundaries.length][];
for (int i = 0; i < bucketBoundaries.length; i++) {
boundaries[i] = new IntValue[] { bucketBoundaries[i] };
}
}
public SimpleIntegerDistribution(IntValue[][] bucketBoundaries) {
if (bucketBoundaries == null)
throw new IllegalArgumentException("Bucket boundaries must not be null.");
if (bucketBoundaries.length == 0)
throw new IllegalArgumentException("Bucket boundaries must not be empty.");
// dimensionality is one in this case
dim = bucketBoundaries[0].length;
// check the array
for (int i = 1; i < bucketBoundaries.length; i++) {
if (bucketBoundaries[i].length != dim) {
throw new IllegalArgumentException("All bucket boundaries must have the same dimensionality.");
}
}
}
@Override
public int getNumberOfFields() {
return this.dim;
}
@Override
public IntValue[] getBucketBoundary(int bucketNum, int totalNumBuckets) {
// check validity of arguments
if(bucketNum < 0) {
throw new IllegalArgumentException("Requested bucket must be greater than or equal to 0.");
} else if(bucketNum >= (totalNumBuckets - 1)) {
throw new IllegalArgumentException("Request bucket must be smaller than the total number of buckets minus 1.");
}
if(totalNumBuckets < 1) {
throw new IllegalArgumentException("Total number of bucket must be larger than 0.");
}
final int maxNumBuckets = boundaries.length + 1;
// check if max number of buckets is equal to or an even multiple of the requested number of buckets
if((maxNumBuckets % totalNumBuckets) == 0) {
// easy case, just use each n-th boundary
final int n = maxNumBuckets / totalNumBuckets;
final int bucketId = bucketNum * n + (n - 1);
return (IntValue[]) boundaries[bucketId];
} else {
throw new IllegalArgumentException("Interpolation of bucket boundaries currently not supported. " +
"Please use an even divider of the maximum possible buckets (here: "+maxNumBuckets+") as totalBuckets.");
// TODO: might be relaxed if much more boundary records are available than requested
}
}
@Override
public void write(DataOutput out) throws IOException {
out.writeInt(this.dim);
out.writeInt(boundaries.length);
for (int i = 0; i < boundaries.length; i++) {
for (int d = 0; d < dim; d++) {
out.writeInt(((IntValue) boundaries[i][d]).getValue());
}
}
}
@Override
public void read(DataInput in) throws IOException {
this.dim = in.readInt();
final int len = in.readInt();
boundaries = new IntValue[len][];
for (int i = 0; i < len; i++) {
IntValue[] bucket = new IntValue[dim];
for (int d = 0; d < dim; d++) {
bucket[d] = new IntValue(in.readInt());
}
boundaries[i] = bucket;
}
}
private static IntValue[][] packIntegers(int[] values) {
IntValue[][] packed = new IntValue[values.length][];
for (int i = 0; i < values.length; i++) {
packed[i] = new IntValue[] { new IntValue(values[i]) };
}
return packed;
}
}
// © 2015 - 2025 Weber Informatics LLC | Privacy Policy