All downloads are free. The search and download functionality uses the official Maven repository.

eu.stratosphere.api.common.distributions.SimpleIntegerDistribution Maven / Gradle / Ivy

There is a newer version: 0.5.2-hadoop2
Show newest version
/***********************************************************************************************************************
 * Copyright (C) 2010-2013 by the Stratosphere project (http://stratosphere.eu)
 *
 * Licensed under the Apache License, Version 2.0 (the "License"); you may not use this file except in compliance with
 * the License. You may obtain a copy of the License at
 *
 *     http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software distributed under the License is distributed on
 * an "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. See the License for the
 * specific language governing permissions and limitations under the License.
 **********************************************************************************************************************/
package eu.stratosphere.api.common.distributions;

import java.io.DataInput;
import java.io.DataOutput;
import java.io.IOException;

import eu.stratosphere.types.IntValue;

/**
 * A {@link SimpleDistribution} whose bucket boundaries are made of {@link IntValue} keys.
 *
 * <p>Boundaries are stored as a two-dimensional array: the first index selects the boundary,
 * the second index selects the field within that boundary. The one-dimensional constructors
 * wrap every value into a single-element row.
 *
 * <p>NOTE(review): the fields {@code boundaries} and {@code dim} are not declared in this class;
 * they are presumably inherited from {@link SimpleDistribution} - confirm against the superclass.
 */
public class SimpleIntegerDistribution extends SimpleDistribution {
	
	private static final long serialVersionUID = 1L;
	
	
	/**
	 * Creates a distribution without any boundaries. The contents are expected to be filled in
	 * later, e.g. through {@link #read(DataInput)}.
	 */
	public SimpleIntegerDistribution() {
		boundaries = new IntValue[0][];
	}
	
	/**
	 * Creates a one-dimensional distribution from primitive boundary values.
	 *
	 * @param bucketBoundaries the boundary values, one per boundary
	 * @throws IllegalArgumentException if the array is {@code null} or empty
	 */
	public SimpleIntegerDistribution(int[] bucketBoundaries) {
		if (bucketBoundaries == null) {
			throw new IllegalArgumentException("Bucket boundaries must not be null.");
		}
		if (bucketBoundaries.length == 0) {
			throw new IllegalArgumentException("Bucket boundaries must not be empty.");
		}

		// dimensionality is one in this case
		dim = 1;
		
		// make the array 2-dimensional
		boundaries = packIntegers(bucketBoundaries);
	}
	
	/**
	 * Creates a one-dimensional distribution from {@link IntValue} boundaries. The given value
	 * objects are referenced, not copied.
	 *
	 * @param bucketBoundaries the boundary values, one per boundary
	 * @throws IllegalArgumentException if the array is {@code null} or empty
	 */
	public SimpleIntegerDistribution(IntValue[] bucketBoundaries) {
		if (bucketBoundaries == null) {
			throw new IllegalArgumentException("Bucket boundaries must not be null.");
		}
		if (bucketBoundaries.length == 0) {
			throw new IllegalArgumentException("Bucket boundaries must not be empty.");
		}

		// dimensionality is one in this case
		dim = 1;
		
		// make the array 2-dimensional
		boundaries = new IntValue[bucketBoundaries.length][];
		for (int i = 0; i < bucketBoundaries.length; i++) {
			boundaries[i] = new IntValue[] { bucketBoundaries[i] };
		}
	}
	
	/**
	 * Creates a distribution from multi-field boundaries. The dimensionality is taken from the
	 * length of the first row, and all rows must have that same length. The given array is
	 * referenced, not copied.
	 *
	 * @param bucketBoundaries the boundaries; first index is the boundary, second the field
	 * @throws IllegalArgumentException if the array is {@code null} or empty, if a row is
	 *         {@code null}, or if the rows differ in length
	 */
	public SimpleIntegerDistribution(IntValue[][] bucketBoundaries) {
		if (bucketBoundaries == null) {
			throw new IllegalArgumentException("Bucket boundaries must not be null.");
		}
		if (bucketBoundaries.length == 0) {
			throw new IllegalArgumentException("Bucket boundaries must not be empty.");
		}
		if (bucketBoundaries[0] == null) {
			throw new IllegalArgumentException("Bucket boundaries must not contain null entries.");
		}

		// dimensionality is defined by the first boundary
		final int numFields = bucketBoundaries[0].length;
		
		// check that all remaining boundaries agree with that dimensionality
		for (int i = 1; i < bucketBoundaries.length; i++) {
			if (bucketBoundaries[i] == null) {
				throw new IllegalArgumentException("Bucket boundaries must not contain null entries.");
			}
			if (bucketBoundaries[i].length != numFields) {
				throw new IllegalArgumentException("All bucket boundaries must have the same dimensionality.");
			}
		}
		
		// only publish the state once the input has been fully validated;
		// the original code never stored the boundaries at all
		dim = numFields;
		boundaries = bucketBoundaries;
	}
	
	/**
	 * Returns the number of fields per boundary.
	 *
	 * @return the dimensionality of this distribution
	 */
	@Override
	public int getNumberOfFields() {
		return this.dim;
	}

	/**
	 * Returns the upper boundary of the given bucket when the key space is split into
	 * {@code totalNumBuckets} buckets.
	 *
	 * <p>Only splits where {@code boundaries.length + 1} is an exact multiple of
	 * {@code totalNumBuckets} are supported; boundaries are not interpolated.
	 *
	 * @param bucketNum the zero-based bucket index; must be in {@code [0, totalNumBuckets - 2]},
	 *        since the last bucket has no upper boundary
	 * @param totalNumBuckets the number of buckets to split into; must be at least 1
	 * @return the boundary record of the requested bucket
	 * @throws IllegalArgumentException if an argument is out of range or the requested number of
	 *         buckets does not evenly divide the maximum number of buckets
	 */
	@Override
	public IntValue[] getBucketBoundary(int bucketNum, int totalNumBuckets) {
		// check validity of arguments; the bucket count is validated first because the
		// range check on bucketNum is only meaningful for a valid bucket count
		if(totalNumBuckets < 1) {
			throw new IllegalArgumentException("Total number of bucket must be larger than 0.");
		}
		if(bucketNum < 0) {
			throw new IllegalArgumentException("Requested bucket must be greater than or equal to 0.");
		} else if(bucketNum >= (totalNumBuckets - 1)) {
			throw new IllegalArgumentException("Request bucket must be smaller than the total number of buckets minus 1.");
		}
		
		// k boundaries separate k + 1 buckets
		final int maxNumBuckets = boundaries.length + 1;
		
		// check if max number of buckets is equal to or an even multiple of the requested number of buckets
		if((maxNumBuckets % totalNumBuckets) == 0) {
			// easy case, just use each n-th boundary
			final int n = maxNumBuckets / totalNumBuckets;
			final int bucketId = bucketNum * n + (n -  1); 
			
			return (IntValue[]) boundaries[bucketId];
		} else {
			throw new IllegalArgumentException("Interpolation of bucket boundaries currently not supported. " +
					"Please use an even divider of the maximum possible buckets (here: "+maxNumBuckets+") as totalBuckets.");
			// TODO: might be relaxed if much more boundary records are available than requested
		}
	}

	/**
	 * Serializes this distribution: the dimensionality, the number of boundaries, and then the
	 * int value of every field of every boundary, boundary by boundary.
	 *
	 * @param out the output to write to
	 * @throws IOException if writing to the output fails
	 */
	@Override
	public void write(DataOutput out) throws IOException {
		out.writeInt(this.dim);
		out.writeInt(boundaries.length);
		
		for (int i = 0; i < boundaries.length; i++) {
			for (int d = 0; d < dim; d++) {
				out.writeInt(((IntValue) boundaries[i][d]).getValue());
			}
		}
	}

	/**
	 * Restores this distribution from the format produced by {@link #write(DataOutput)},
	 * replacing the current dimensionality and boundaries.
	 *
	 * @param in the input to read from
	 * @throws IOException if reading from the input fails
	 */
	@Override
	public void read(DataInput in) throws IOException {
		this.dim = in.readInt();
		final int len = in.readInt();
		
		boundaries = new IntValue[len][];
		
		for (int i = 0; i < len; i++) {
			IntValue[] bucket = new IntValue[dim]; 
			for (int d = 0; d < dim; d++) {
				bucket[d] = new IntValue(in.readInt());
			}
			
			boundaries[i] = bucket;
		}
	}
	
	/**
	 * Wraps each primitive value into a single-element {@link IntValue} row.
	 *
	 * @param values the values to wrap
	 * @return a two-dimensional array with one single-field row per input value
	 */
	private static IntValue[][] packIntegers(int[] values) {
		IntValue[][] packed = new IntValue[values.length][];
		for (int i = 0; i < values.length; i++) {
			packed[i] = new IntValue[] { new IntValue(values[i]) };
		}
		
		return packed;
	}
}




© 2015 - 2025 Weber Informatics LLC | Privacy Policy